1/*
2 * Copyright (C) 2005 Junio C Hamano
3 */
4#include <sys/types.h>
5#include <sys/wait.h>
6#include <signal.h>
7#include "cache.h"
8#include "quote.h"
9#include "diff.h"
10#include "diffcore.h"
11#include "delta.h"
12#include "xdiff-interface.h"
13
14static int use_size_cache;
15
16static int diff_detect_rename_default = 0;
17static int diff_rename_limit_default = -1;
18static int diff_use_color_default = 0;
19
20enum color_diff {
21 DIFF_RESET = 0,
22 DIFF_PLAIN = 1,
23 DIFF_METAINFO = 2,
24 DIFF_FRAGINFO = 3,
25 DIFF_FILE_OLD = 4,
26 DIFF_FILE_NEW = 5,
27};
28
29/* "\033[1;38;5;2xx;48;5;2xxm\0" is 23 bytes */
30static char diff_colors[][24] = {
31 "\033[m", /* reset */
32 "", /* normal */
33 "\033[1m", /* bold */
34 "\033[36m", /* cyan */
35 "\033[31m", /* red */
36 "\033[32m" /* green */
37};
38
39static int parse_diff_color_slot(const char *var, int ofs)
40{
41 if (!strcasecmp(var+ofs, "plain"))
42 return DIFF_PLAIN;
43 if (!strcasecmp(var+ofs, "meta"))
44 return DIFF_METAINFO;
45 if (!strcasecmp(var+ofs, "frag"))
46 return DIFF_FRAGINFO;
47 if (!strcasecmp(var+ofs, "old"))
48 return DIFF_FILE_OLD;
49 if (!strcasecmp(var+ofs, "new"))
50 return DIFF_FILE_NEW;
51 die("bad config variable '%s'", var);
52}
53
54static int parse_color(const char *name, int len)
55{
56 static const char * const color_names[] = {
57 "normal", "black", "red", "green", "yellow",
58 "blue", "magenta", "cyan", "white"
59 };
60 char *end;
61 int i;
62 for (i = 0; i < ARRAY_SIZE(color_names); i++) {
63 const char *str = color_names[i];
64 if (!strncasecmp(name, str, len) && !str[len])
65 return i - 1;
66 }
67 i = strtol(name, &end, 10);
68 if (*name && !*end && i >= -1 && i <= 255)
69 return i;
70 return -2;
71}
72
73static int parse_attr(const char *name, int len)
74{
75 static const int attr_values[] = { 1, 2, 4, 5, 7 };
76 static const char * const attr_names[] = {
77 "bold", "dim", "ul", "blink", "reverse"
78 };
79 int i;
80 for (i = 0; i < ARRAY_SIZE(attr_names); i++) {
81 const char *str = attr_names[i];
82 if (!strncasecmp(name, str, len) && !str[len])
83 return attr_values[i];
84 }
85 return -1;
86}
87
88static void parse_diff_color_value(const char *value, const char *var, char *dst)
89{
90 const char *ptr = value;
91 int attr = -1;
92 int fg = -2;
93 int bg = -2;
94
95 if (!strcasecmp(value, "reset")) {
96 strcpy(dst, "\033[m");
97 return;
98 }
99
100 /* [fg [bg]] [attr] */
101 while (*ptr) {
102 const char *word = ptr;
103 int val, len = 0;
104
105 while (word[len] && !isspace(word[len]))
106 len++;
107
108 ptr = word + len;
109 while (*ptr && isspace(*ptr))
110 ptr++;
111
112 val = parse_color(word, len);
113 if (val >= -1) {
114 if (fg == -2) {
115 fg = val;
116 continue;
117 }
118 if (bg == -2) {
119 bg = val;
120 continue;
121 }
122 goto bad;
123 }
124 val = parse_attr(word, len);
125 if (val < 0 || attr != -1)
126 goto bad;
127 attr = val;
128 }
129
130 if (attr >= 0 || fg >= 0 || bg >= 0) {
131 int sep = 0;
132
133 *dst++ = '\033';
134 *dst++ = '[';
135 if (attr >= 0) {
136 *dst++ = '0' + attr;
137 sep++;
138 }
139 if (fg >= 0) {
140 if (sep++)
141 *dst++ = ';';
142 if (fg < 8) {
143 *dst++ = '3';
144 *dst++ = '0' + fg;
145 } else {
146 dst += sprintf(dst, "38;5;%d", fg);
147 }
148 }
149 if (bg >= 0) {
150 if (sep++)
151 *dst++ = ';';
152 if (bg < 8) {
153 *dst++ = '4';
154 *dst++ = '0' + bg;
155 } else {
156 dst += sprintf(dst, "48;5;%d", bg);
157 }
158 }
159 *dst++ = 'm';
160 }
161 *dst = 0;
162 return;
163bad:
164 die("bad config value '%s' for variable '%s'", value, var);
165}
166
167/*
168 * These are to give UI layer defaults.
169 * The core-level commands such as git-diff-files should
170 * never be affected by the setting of diff.renames
171 * the user happens to have in the configuration file.
172 */
173int git_diff_ui_config(const char *var, const char *value)
174{
175 if (!strcmp(var, "diff.renamelimit")) {
176 diff_rename_limit_default = git_config_int(var, value);
177 return 0;
178 }
179 if (!strcmp(var, "diff.color")) {
180 if (!value)
181 diff_use_color_default = 1; /* bool */
182 else if (!strcasecmp(value, "auto")) {
183 diff_use_color_default = 0;
184 if (isatty(1) || pager_in_use) {
185 char *term = getenv("TERM");
186 if (term && strcmp(term, "dumb"))
187 diff_use_color_default = 1;
188 }
189 }
190 else if (!strcasecmp(value, "never"))
191 diff_use_color_default = 0;
192 else if (!strcasecmp(value, "always"))
193 diff_use_color_default = 1;
194 else
195 diff_use_color_default = git_config_bool(var, value);
196 return 0;
197 }
198 if (!strcmp(var, "diff.renames")) {
199 if (!value)
200 diff_detect_rename_default = DIFF_DETECT_RENAME;
201 else if (!strcasecmp(value, "copies") ||
202 !strcasecmp(value, "copy"))
203 diff_detect_rename_default = DIFF_DETECT_COPY;
204 else if (git_config_bool(var,value))
205 diff_detect_rename_default = DIFF_DETECT_RENAME;
206 return 0;
207 }
208 if (!strncmp(var, "diff.color.", 11)) {
209 int slot = parse_diff_color_slot(var, 11);
210 parse_diff_color_value(value, var, diff_colors[slot]);
211 return 0;
212 }
213 return git_default_config(var, value);
214}
215
216static char *quote_one(const char *str)
217{
218 int needlen;
219 char *xp;
220
221 if (!str)
222 return NULL;
223 needlen = quote_c_style(str, NULL, NULL, 0);
224 if (!needlen)
225 return strdup(str);
226 xp = xmalloc(needlen + 1);
227 quote_c_style(str, xp, NULL, 0);
228 return xp;
229}
230
231static char *quote_two(const char *one, const char *two)
232{
233 int need_one = quote_c_style(one, NULL, NULL, 1);
234 int need_two = quote_c_style(two, NULL, NULL, 1);
235 char *xp;
236
237 if (need_one + need_two) {
238 if (!need_one) need_one = strlen(one);
239 if (!need_two) need_one = strlen(two);
240
241 xp = xmalloc(need_one + need_two + 3);
242 xp[0] = '"';
243 quote_c_style(one, xp + 1, NULL, 1);
244 quote_c_style(two, xp + need_one + 1, NULL, 1);
245 strcpy(xp + need_one + need_two + 1, "\"");
246 return xp;
247 }
248 need_one = strlen(one);
249 need_two = strlen(two);
250 xp = xmalloc(need_one + need_two + 1);
251 strcpy(xp, one);
252 strcpy(xp + need_one, two);
253 return xp;
254}
255
256static const char *external_diff(void)
257{
258 static const char *external_diff_cmd = NULL;
259 static int done_preparing = 0;
260
261 if (done_preparing)
262 return external_diff_cmd;
263 external_diff_cmd = getenv("GIT_EXTERNAL_DIFF");
264 done_preparing = 1;
265 return external_diff_cmd;
266}
267
268#define TEMPFILE_PATH_LEN 50
269
270static struct diff_tempfile {
271 const char *name; /* filename external diff should read from */
272 char hex[41];
273 char mode[10];
274 char tmp_path[TEMPFILE_PATH_LEN];
275} diff_temp[2];
276
277static int count_lines(const char *data, int size)
278{
279 int count, ch, completely_empty = 1, nl_just_seen = 0;
280 count = 0;
281 while (0 < size--) {
282 ch = *data++;
283 if (ch == '\n') {
284 count++;
285 nl_just_seen = 1;
286 completely_empty = 0;
287 }
288 else {
289 nl_just_seen = 0;
290 completely_empty = 0;
291 }
292 }
293 if (completely_empty)
294 return 0;
295 if (!nl_just_seen)
296 count++; /* no trailing newline */
297 return count;
298}
299
300static void print_line_count(int count)
301{
302 switch (count) {
303 case 0:
304 printf("0,0");
305 break;
306 case 1:
307 printf("1");
308 break;
309 default:
310 printf("1,%d", count);
311 break;
312 }
313}
314
315static void copy_file(int prefix, const char *data, int size)
316{
317 int ch, nl_just_seen = 1;
318 while (0 < size--) {
319 ch = *data++;
320 if (nl_just_seen)
321 putchar(prefix);
322 putchar(ch);
323 if (ch == '\n')
324 nl_just_seen = 1;
325 else
326 nl_just_seen = 0;
327 }
328 if (!nl_just_seen)
329 printf("\n\\ No newline at end of file\n");
330}
331
332static void emit_rewrite_diff(const char *name_a,
333 const char *name_b,
334 struct diff_filespec *one,
335 struct diff_filespec *two)
336{
337 int lc_a, lc_b;
338 diff_populate_filespec(one, 0);
339 diff_populate_filespec(two, 0);
340 lc_a = count_lines(one->data, one->size);
341 lc_b = count_lines(two->data, two->size);
342 printf("--- %s\n+++ %s\n@@ -", name_a, name_b);
343 print_line_count(lc_a);
344 printf(" +");
345 print_line_count(lc_b);
346 printf(" @@\n");
347 if (lc_a)
348 copy_file('-', one->data, one->size);
349 if (lc_b)
350 copy_file('+', two->data, two->size);
351}
352
353static int fill_mmfile(mmfile_t *mf, struct diff_filespec *one)
354{
355 if (!DIFF_FILE_VALID(one)) {
356 mf->ptr = (char *)""; /* does not matter */
357 mf->size = 0;
358 return 0;
359 }
360 else if (diff_populate_filespec(one, 0))
361 return -1;
362 mf->ptr = one->data;
363 mf->size = one->size;
364 return 0;
365}
366
367struct emit_callback {
368 struct xdiff_emit_state xm;
369 int nparents, color_diff;
370 const char **label_path;
371};
372
373static inline const char *get_color(int diff_use_color, enum color_diff ix)
374{
375 if (diff_use_color)
376 return diff_colors[ix];
377 return "";
378}
379
380static void fn_out_consume(void *priv, char *line, unsigned long len)
381{
382 int i;
383 struct emit_callback *ecbdata = priv;
384 const char *set = get_color(ecbdata->color_diff, DIFF_METAINFO);
385 const char *reset = get_color(ecbdata->color_diff, DIFF_RESET);
386
387 if (ecbdata->label_path[0]) {
388 printf("%s--- %s%s\n", set, ecbdata->label_path[0], reset);
389 printf("%s+++ %s%s\n", set, ecbdata->label_path[1], reset);
390 ecbdata->label_path[0] = ecbdata->label_path[1] = NULL;
391 }
392
393 /* This is not really necessary for now because
394 * this codepath only deals with two-way diffs.
395 */
396 for (i = 0; i < len && line[i] == '@'; i++)
397 ;
398 if (2 <= i && i < len && line[i] == ' ') {
399 ecbdata->nparents = i - 1;
400 set = get_color(ecbdata->color_diff, DIFF_FRAGINFO);
401 }
402 else if (len < ecbdata->nparents)
403 set = reset;
404 else {
405 int nparents = ecbdata->nparents;
406 int color = DIFF_PLAIN;
407 for (i = 0; i < nparents && len; i++) {
408 if (line[i] == '-')
409 color = DIFF_FILE_OLD;
410 else if (line[i] == '+')
411 color = DIFF_FILE_NEW;
412 }
413 set = get_color(ecbdata->color_diff, color);
414 }
415 if (len > 0 && line[len-1] == '\n')
416 len--;
417 fputs (set, stdout);
418 fwrite (line, len, 1, stdout);
419 puts (reset);
420}
421
422static char *pprint_rename(const char *a, const char *b)
423{
424 const char *old = a;
425 const char *new = b;
426 char *name = NULL;
427 int pfx_length, sfx_length;
428 int len_a = strlen(a);
429 int len_b = strlen(b);
430
431 /* Find common prefix */
432 pfx_length = 0;
433 while (*old && *new && *old == *new) {
434 if (*old == '/')
435 pfx_length = old - a + 1;
436 old++;
437 new++;
438 }
439
440 /* Find common suffix */
441 old = a + len_a;
442 new = b + len_b;
443 sfx_length = 0;
444 while (a <= old && b <= new && *old == *new) {
445 if (*old == '/')
446 sfx_length = len_a - (old - a);
447 old--;
448 new--;
449 }
450
451 /*
452 * pfx{mid-a => mid-b}sfx
453 * {pfx-a => pfx-b}sfx
454 * pfx{sfx-a => sfx-b}
455 * name-a => name-b
456 */
457 if (pfx_length + sfx_length) {
458 int a_midlen = len_a - pfx_length - sfx_length;
459 int b_midlen = len_b - pfx_length - sfx_length;
460 if (a_midlen < 0) a_midlen = 0;
461 if (b_midlen < 0) b_midlen = 0;
462
463 name = xmalloc(pfx_length + a_midlen + b_midlen + sfx_length + 7);
464 sprintf(name, "%.*s{%.*s => %.*s}%s",
465 pfx_length, a,
466 a_midlen, a + pfx_length,
467 b_midlen, b + pfx_length,
468 a + len_a - sfx_length);
469 }
470 else {
471 name = xmalloc(len_a + len_b + 5);
472 sprintf(name, "%s => %s", a, b);
473 }
474 return name;
475}
476
477struct diffstat_t {
478 struct xdiff_emit_state xm;
479
480 int nr;
481 int alloc;
482 struct diffstat_file {
483 char *name;
484 unsigned is_unmerged:1;
485 unsigned is_binary:1;
486 unsigned is_renamed:1;
487 unsigned int added, deleted;
488 } **files;
489};
490
491static struct diffstat_file *diffstat_add(struct diffstat_t *diffstat,
492 const char *name_a,
493 const char *name_b)
494{
495 struct diffstat_file *x;
496 x = xcalloc(sizeof (*x), 1);
497 if (diffstat->nr == diffstat->alloc) {
498 diffstat->alloc = alloc_nr(diffstat->alloc);
499 diffstat->files = xrealloc(diffstat->files,
500 diffstat->alloc * sizeof(x));
501 }
502 diffstat->files[diffstat->nr++] = x;
503 if (name_b) {
504 x->name = pprint_rename(name_a, name_b);
505 x->is_renamed = 1;
506 }
507 else
508 x->name = strdup(name_a);
509 return x;
510}
511
512static void diffstat_consume(void *priv, char *line, unsigned long len)
513{
514 struct diffstat_t *diffstat = priv;
515 struct diffstat_file *x = diffstat->files[diffstat->nr - 1];
516
517 if (line[0] == '+')
518 x->added++;
519 else if (line[0] == '-')
520 x->deleted++;
521}
522
523static const char pluses[] = "++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++";
524static const char minuses[]= "----------------------------------------------------------------------";
525const char mime_boundary_leader[] = "------------";
526
527static void show_stats(struct diffstat_t* data)
528{
529 int i, len, add, del, total, adds = 0, dels = 0;
530 int max, max_change = 0, max_len = 0;
531 int total_files = data->nr;
532
533 if (data->nr == 0)
534 return;
535
536 for (i = 0; i < data->nr; i++) {
537 struct diffstat_file *file = data->files[i];
538
539 len = strlen(file->name);
540 if (max_len < len)
541 max_len = len;
542
543 if (file->is_binary || file->is_unmerged)
544 continue;
545 if (max_change < file->added + file->deleted)
546 max_change = file->added + file->deleted;
547 }
548
549 for (i = 0; i < data->nr; i++) {
550 const char *prefix = "";
551 char *name = data->files[i]->name;
552 int added = data->files[i]->added;
553 int deleted = data->files[i]->deleted;
554
555 if (0 < (len = quote_c_style(name, NULL, NULL, 0))) {
556 char *qname = xmalloc(len + 1);
557 quote_c_style(name, qname, NULL, 0);
558 free(name);
559 data->files[i]->name = name = qname;
560 }
561
562 /*
563 * "scale" the filename
564 */
565 len = strlen(name);
566 max = max_len;
567 if (max > 50)
568 max = 50;
569 if (len > max) {
570 char *slash;
571 prefix = "...";
572 max -= 3;
573 name += len - max;
574 slash = strchr(name, '/');
575 if (slash)
576 name = slash;
577 }
578 len = max;
579
580 /*
581 * scale the add/delete
582 */
583 max = max_change;
584 if (max + len > 70)
585 max = 70 - len;
586
587 if (data->files[i]->is_binary) {
588 printf(" %s%-*s | Bin\n", prefix, len, name);
589 goto free_diffstat_file;
590 }
591 else if (data->files[i]->is_unmerged) {
592 printf(" %s%-*s | Unmerged\n", prefix, len, name);
593 goto free_diffstat_file;
594 }
595 else if (!data->files[i]->is_renamed &&
596 (added + deleted == 0)) {
597 total_files--;
598 goto free_diffstat_file;
599 }
600
601 add = added;
602 del = deleted;
603 total = add + del;
604 adds += add;
605 dels += del;
606
607 if (max_change > 0) {
608 total = (total * max + max_change / 2) / max_change;
609 add = (add * max + max_change / 2) / max_change;
610 del = total - add;
611 }
612 printf(" %s%-*s |%5d %.*s%.*s\n", prefix,
613 len, name, added + deleted,
614 add, pluses, del, minuses);
615 free_diffstat_file:
616 free(data->files[i]->name);
617 free(data->files[i]);
618 }
619 free(data->files);
620 printf(" %d files changed, %d insertions(+), %d deletions(-)\n",
621 total_files, adds, dels);
622}
623
624struct checkdiff_t {
625 struct xdiff_emit_state xm;
626 const char *filename;
627 int lineno;
628};
629
630static void checkdiff_consume(void *priv, char *line, unsigned long len)
631{
632 struct checkdiff_t *data = priv;
633
634 if (line[0] == '+') {
635 int i, spaces = 0;
636
637 data->lineno++;
638
639 /* check space before tab */
640 for (i = 1; i < len && (line[i] == ' ' || line[i] == '\t'); i++)
641 if (line[i] == ' ')
642 spaces++;
643 if (line[i - 1] == '\t' && spaces)
644 printf("%s:%d: space before tab:%.*s\n",
645 data->filename, data->lineno, (int)len, line);
646
647 /* check white space at line end */
648 if (line[len - 1] == '\n')
649 len--;
650 if (isspace(line[len - 1]))
651 printf("%s:%d: white space at end: %.*s\n",
652 data->filename, data->lineno, (int)len, line);
653 } else if (line[0] == ' ')
654 data->lineno++;
655 else if (line[0] == '@') {
656 char *plus = strchr(line, '+');
657 if (plus)
658 data->lineno = strtol(plus, NULL, 10);
659 else
660 die("invalid diff");
661 }
662}
663
664static unsigned char *deflate_it(char *data,
665 unsigned long size,
666 unsigned long *result_size)
667{
668 int bound;
669 unsigned char *deflated;
670 z_stream stream;
671
672 memset(&stream, 0, sizeof(stream));
673 deflateInit(&stream, zlib_compression_level);
674 bound = deflateBound(&stream, size);
675 deflated = xmalloc(bound);
676 stream.next_out = deflated;
677 stream.avail_out = bound;
678
679 stream.next_in = (unsigned char *)data;
680 stream.avail_in = size;
681 while (deflate(&stream, Z_FINISH) == Z_OK)
682 ; /* nothing */
683 deflateEnd(&stream);
684 *result_size = stream.total_out;
685 return deflated;
686}
687
688static void emit_binary_diff(mmfile_t *one, mmfile_t *two)
689{
690 void *cp;
691 void *delta;
692 void *deflated;
693 void *data;
694 unsigned long orig_size;
695 unsigned long delta_size;
696 unsigned long deflate_size;
697 unsigned long data_size;
698
699 printf("GIT binary patch\n");
700 /* We could do deflated delta, or we could do just deflated two,
701 * whichever is smaller.
702 */
703 delta = NULL;
704 deflated = deflate_it(two->ptr, two->size, &deflate_size);
705 if (one->size && two->size) {
706 delta = diff_delta(one->ptr, one->size,
707 two->ptr, two->size,
708 &delta_size, deflate_size);
709 if (delta) {
710 void *to_free = delta;
711 orig_size = delta_size;
712 delta = deflate_it(delta, delta_size, &delta_size);
713 free(to_free);
714 }
715 }
716
717 if (delta && delta_size < deflate_size) {
718 printf("delta %lu\n", orig_size);
719 free(deflated);
720 data = delta;
721 data_size = delta_size;
722 }
723 else {
724 printf("literal %lu\n", two->size);
725 free(delta);
726 data = deflated;
727 data_size = deflate_size;
728 }
729
730 /* emit data encoded in base85 */
731 cp = data;
732 while (data_size) {
733 int bytes = (52 < data_size) ? 52 : data_size;
734 char line[70];
735 data_size -= bytes;
736 if (bytes <= 26)
737 line[0] = bytes + 'A' - 1;
738 else
739 line[0] = bytes - 26 + 'a' - 1;
740 encode_85(line + 1, cp, bytes);
741 cp = (char *) cp + bytes;
742 puts(line);
743 }
744 printf("\n");
745 free(data);
746}
747
748#define FIRST_FEW_BYTES 8000
749static int mmfile_is_binary(mmfile_t *mf)
750{
751 long sz = mf->size;
752 if (FIRST_FEW_BYTES < sz)
753 sz = FIRST_FEW_BYTES;
754 if (memchr(mf->ptr, 0, sz))
755 return 1;
756 return 0;
757}
758
759static void builtin_diff(const char *name_a,
760 const char *name_b,
761 struct diff_filespec *one,
762 struct diff_filespec *two,
763 const char *xfrm_msg,
764 struct diff_options *o,
765 int complete_rewrite)
766{
767 mmfile_t mf1, mf2;
768 const char *lbl[2];
769 char *a_one, *b_two;
770 const char *set = get_color(o->color_diff, DIFF_METAINFO);
771 const char *reset = get_color(o->color_diff, DIFF_RESET);
772
773 a_one = quote_two("a/", name_a);
774 b_two = quote_two("b/", name_b);
775 lbl[0] = DIFF_FILE_VALID(one) ? a_one : "/dev/null";
776 lbl[1] = DIFF_FILE_VALID(two) ? b_two : "/dev/null";
777 printf("%sdiff --git %s %s%s\n", set, a_one, b_two, reset);
778 if (lbl[0][0] == '/') {
779 /* /dev/null */
780 printf("%snew file mode %06o%s\n", set, two->mode, reset);
781 if (xfrm_msg && xfrm_msg[0])
782 printf("%s%s%s\n", set, xfrm_msg, reset);
783 }
784 else if (lbl[1][0] == '/') {
785 printf("%sdeleted file mode %06o%s\n", set, one->mode, reset);
786 if (xfrm_msg && xfrm_msg[0])
787 printf("%s%s%s\n", set, xfrm_msg, reset);
788 }
789 else {
790 if (one->mode != two->mode) {
791 printf("%sold mode %06o%s\n", set, one->mode, reset);
792 printf("%snew mode %06o%s\n", set, two->mode, reset);
793 }
794 if (xfrm_msg && xfrm_msg[0])
795 printf("%s%s%s\n", set, xfrm_msg, reset);
796 /*
797 * we do not run diff between different kind
798 * of objects.
799 */
800 if ((one->mode ^ two->mode) & S_IFMT)
801 goto free_ab_and_return;
802 if (complete_rewrite) {
803 emit_rewrite_diff(name_a, name_b, one, two);
804 goto free_ab_and_return;
805 }
806 }
807
808 if (fill_mmfile(&mf1, one) < 0 || fill_mmfile(&mf2, two) < 0)
809 die("unable to read files to diff");
810
811 if (!o->text && (mmfile_is_binary(&mf1) || mmfile_is_binary(&mf2))) {
812 /* Quite common confusing case */
813 if (mf1.size == mf2.size &&
814 !memcmp(mf1.ptr, mf2.ptr, mf1.size))
815 goto free_ab_and_return;
816 if (o->binary)
817 emit_binary_diff(&mf1, &mf2);
818 else
819 printf("Binary files %s and %s differ\n",
820 lbl[0], lbl[1]);
821 }
822 else {
823 /* Crazy xdl interfaces.. */
824 const char *diffopts = getenv("GIT_DIFF_OPTS");
825 xpparam_t xpp;
826 xdemitconf_t xecfg;
827 xdemitcb_t ecb;
828 struct emit_callback ecbdata;
829
830 memset(&ecbdata, 0, sizeof(ecbdata));
831 ecbdata.label_path = lbl;
832 ecbdata.color_diff = o->color_diff;
833 xpp.flags = XDF_NEED_MINIMAL | o->xdl_opts;
834 xecfg.ctxlen = o->context;
835 xecfg.flags = XDL_EMIT_FUNCNAMES;
836 if (!diffopts)
837 ;
838 else if (!strncmp(diffopts, "--unified=", 10))
839 xecfg.ctxlen = strtoul(diffopts + 10, NULL, 10);
840 else if (!strncmp(diffopts, "-u", 2))
841 xecfg.ctxlen = strtoul(diffopts + 2, NULL, 10);
842 ecb.outf = xdiff_outf;
843 ecb.priv = &ecbdata;
844 ecbdata.xm.consume = fn_out_consume;
845 xdl_diff(&mf1, &mf2, &xpp, &xecfg, &ecb);
846 }
847
848 free_ab_and_return:
849 free(a_one);
850 free(b_two);
851 return;
852}
853
854static void builtin_diffstat(const char *name_a, const char *name_b,
855 struct diff_filespec *one,
856 struct diff_filespec *two,
857 struct diffstat_t *diffstat,
858 struct diff_options *o,
859 int complete_rewrite)
860{
861 mmfile_t mf1, mf2;
862 struct diffstat_file *data;
863
864 data = diffstat_add(diffstat, name_a, name_b);
865
866 if (!one || !two) {
867 data->is_unmerged = 1;
868 return;
869 }
870 if (complete_rewrite) {
871 diff_populate_filespec(one, 0);
872 diff_populate_filespec(two, 0);
873 data->deleted = count_lines(one->data, one->size);
874 data->added = count_lines(two->data, two->size);
875 return;
876 }
877 if (fill_mmfile(&mf1, one) < 0 || fill_mmfile(&mf2, two) < 0)
878 die("unable to read files to diff");
879
880 if (mmfile_is_binary(&mf1) || mmfile_is_binary(&mf2))
881 data->is_binary = 1;
882 else {
883 /* Crazy xdl interfaces.. */
884 xpparam_t xpp;
885 xdemitconf_t xecfg;
886 xdemitcb_t ecb;
887
888 xpp.flags = XDF_NEED_MINIMAL | o->xdl_opts;
889 xecfg.ctxlen = 0;
890 xecfg.flags = 0;
891 ecb.outf = xdiff_outf;
892 ecb.priv = diffstat;
893 xdl_diff(&mf1, &mf2, &xpp, &xecfg, &ecb);
894 }
895}
896
897static void builtin_checkdiff(const char *name_a, const char *name_b,
898 struct diff_filespec *one,
899 struct diff_filespec *two)
900{
901 mmfile_t mf1, mf2;
902 struct checkdiff_t data;
903
904 if (!two)
905 return;
906
907 memset(&data, 0, sizeof(data));
908 data.xm.consume = checkdiff_consume;
909 data.filename = name_b ? name_b : name_a;
910 data.lineno = 0;
911
912 if (fill_mmfile(&mf1, one) < 0 || fill_mmfile(&mf2, two) < 0)
913 die("unable to read files to diff");
914
915 if (mmfile_is_binary(&mf2))
916 return;
917 else {
918 /* Crazy xdl interfaces.. */
919 xpparam_t xpp;
920 xdemitconf_t xecfg;
921 xdemitcb_t ecb;
922
923 xpp.flags = XDF_NEED_MINIMAL;
924 xecfg.ctxlen = 0;
925 xecfg.flags = 0;
926 ecb.outf = xdiff_outf;
927 ecb.priv = &data;
928 xdl_diff(&mf1, &mf2, &xpp, &xecfg, &ecb);
929 }
930}
931
932struct diff_filespec *alloc_filespec(const char *path)
933{
934 int namelen = strlen(path);
935 struct diff_filespec *spec = xmalloc(sizeof(*spec) + namelen + 1);
936
937 memset(spec, 0, sizeof(*spec));
938 spec->path = (char *)(spec + 1);
939 memcpy(spec->path, path, namelen+1);
940 return spec;
941}
942
943void fill_filespec(struct diff_filespec *spec, const unsigned char *sha1,
944 unsigned short mode)
945{
946 if (mode) {
947 spec->mode = canon_mode(mode);
948 memcpy(spec->sha1, sha1, 20);
949 spec->sha1_valid = !!memcmp(sha1, null_sha1, 20);
950 }
951}
952
953/*
954 * Given a name and sha1 pair, if the dircache tells us the file in
955 * the work tree has that object contents, return true, so that
956 * prepare_temp_file() does not have to inflate and extract.
957 */
958static int work_tree_matches(const char *name, const unsigned char *sha1)
959{
960 struct cache_entry *ce;
961 struct stat st;
962 int pos, len;
963
964 /* We do not read the cache ourselves here, because the
965 * benchmark with my previous version that always reads cache
966 * shows that it makes things worse for diff-tree comparing
967 * two linux-2.6 kernel trees in an already checked out work
968 * tree. This is because most diff-tree comparisons deal with
969 * only a small number of files, while reading the cache is
970 * expensive for a large project, and its cost outweighs the
971 * savings we get by not inflating the object to a temporary
972 * file. Practically, this code only helps when we are used
973 * by diff-cache --cached, which does read the cache before
974 * calling us.
975 */
976 if (!active_cache)
977 return 0;
978
979 len = strlen(name);
980 pos = cache_name_pos(name, len);
981 if (pos < 0)
982 return 0;
983 ce = active_cache[pos];
984 if ((lstat(name, &st) < 0) ||
985 !S_ISREG(st.st_mode) || /* careful! */
986 ce_match_stat(ce, &st, 0) ||
987 memcmp(sha1, ce->sha1, 20))
988 return 0;
989 /* we return 1 only when we can stat, it is a regular file,
990 * stat information matches, and sha1 recorded in the cache
991 * matches. I.e. we know the file in the work tree really is
992 * the same as the <name, sha1> pair.
993 */
994 return 1;
995}
996
997static struct sha1_size_cache {
998 unsigned char sha1[20];
999 unsigned long size;
1000} **sha1_size_cache;
1001static int sha1_size_cache_nr, sha1_size_cache_alloc;
1002
1003static struct sha1_size_cache *locate_size_cache(unsigned char *sha1,
1004 int find_only,
1005 unsigned long size)
1006{
1007 int first, last;
1008 struct sha1_size_cache *e;
1009
1010 first = 0;
1011 last = sha1_size_cache_nr;
1012 while (last > first) {
1013 int cmp, next = (last + first) >> 1;
1014 e = sha1_size_cache[next];
1015 cmp = memcmp(e->sha1, sha1, 20);
1016 if (!cmp)
1017 return e;
1018 if (cmp < 0) {
1019 last = next;
1020 continue;
1021 }
1022 first = next+1;
1023 }
1024 /* not found */
1025 if (find_only)
1026 return NULL;
1027 /* insert to make it at "first" */
1028 if (sha1_size_cache_alloc <= sha1_size_cache_nr) {
1029 sha1_size_cache_alloc = alloc_nr(sha1_size_cache_alloc);
1030 sha1_size_cache = xrealloc(sha1_size_cache,
1031 sha1_size_cache_alloc *
1032 sizeof(*sha1_size_cache));
1033 }
1034 sha1_size_cache_nr++;
1035 if (first < sha1_size_cache_nr)
1036 memmove(sha1_size_cache + first + 1, sha1_size_cache + first,
1037 (sha1_size_cache_nr - first - 1) *
1038 sizeof(*sha1_size_cache));
1039 e = xmalloc(sizeof(struct sha1_size_cache));
1040 sha1_size_cache[first] = e;
1041 memcpy(e->sha1, sha1, 20);
1042 e->size = size;
1043 return e;
1044}
1045
1046/*
1047 * While doing rename detection and pickaxe operation, we may need to
1048 * grab the data for the blob (or file) for our own in-core comparison.
1049 * diff_filespec has data and size fields for this purpose.
1050 */
1051int diff_populate_filespec(struct diff_filespec *s, int size_only)
1052{
1053 int err = 0;
1054 if (!DIFF_FILE_VALID(s))
1055 die("internal error: asking to populate invalid file.");
1056 if (S_ISDIR(s->mode))
1057 return -1;
1058
1059 if (!use_size_cache)
1060 size_only = 0;
1061
1062 if (s->data)
1063 return err;
1064 if (!s->sha1_valid ||
1065 work_tree_matches(s->path, s->sha1)) {
1066 struct stat st;
1067 int fd;
1068 if (lstat(s->path, &st) < 0) {
1069 if (errno == ENOENT) {
1070 err_empty:
1071 err = -1;
1072 empty:
1073 s->data = (char *)"";
1074 s->size = 0;
1075 return err;
1076 }
1077 }
1078 s->size = st.st_size;
1079 if (!s->size)
1080 goto empty;
1081 if (size_only)
1082 return 0;
1083 if (S_ISLNK(st.st_mode)) {
1084 int ret;
1085 s->data = xmalloc(s->size);
1086 s->should_free = 1;
1087 ret = readlink(s->path, s->data, s->size);
1088 if (ret < 0) {
1089 free(s->data);
1090 goto err_empty;
1091 }
1092 return 0;
1093 }
1094 fd = open(s->path, O_RDONLY);
1095 if (fd < 0)
1096 goto err_empty;
1097 s->data = mmap(NULL, s->size, PROT_READ, MAP_PRIVATE, fd, 0);
1098 close(fd);
1099 if (s->data == MAP_FAILED)
1100 goto err_empty;
1101 s->should_munmap = 1;
1102 }
1103 else {
1104 char type[20];
1105 struct sha1_size_cache *e;
1106
1107 if (size_only) {
1108 e = locate_size_cache(s->sha1, 1, 0);
1109 if (e) {
1110 s->size = e->size;
1111 return 0;
1112 }
1113 if (!sha1_object_info(s->sha1, type, &s->size))
1114 locate_size_cache(s->sha1, 0, s->size);
1115 }
1116 else {
1117 s->data = read_sha1_file(s->sha1, type, &s->size);
1118 s->should_free = 1;
1119 }
1120 }
1121 return 0;
1122}
1123
1124void diff_free_filespec_data(struct diff_filespec *s)
1125{
1126 if (s->should_free)
1127 free(s->data);
1128 else if (s->should_munmap)
1129 munmap(s->data, s->size);
1130 s->should_free = s->should_munmap = 0;
1131 s->data = NULL;
1132 free(s->cnt_data);
1133 s->cnt_data = NULL;
1134}
1135
1136static void prep_temp_blob(struct diff_tempfile *temp,
1137 void *blob,
1138 unsigned long size,
1139 const unsigned char *sha1,
1140 int mode)
1141{
1142 int fd;
1143
1144 fd = git_mkstemp(temp->tmp_path, TEMPFILE_PATH_LEN, ".diff_XXXXXX");
1145 if (fd < 0)
1146 die("unable to create temp-file");
1147 if (write(fd, blob, size) != size)
1148 die("unable to write temp-file");
1149 close(fd);
1150 temp->name = temp->tmp_path;
1151 strcpy(temp->hex, sha1_to_hex(sha1));
1152 temp->hex[40] = 0;
1153 sprintf(temp->mode, "%06o", mode);
1154}
1155
1156static void prepare_temp_file(const char *name,
1157 struct diff_tempfile *temp,
1158 struct diff_filespec *one)
1159{
1160 if (!DIFF_FILE_VALID(one)) {
1161 not_a_valid_file:
1162 /* A '-' entry produces this for file-2, and
1163 * a '+' entry produces this for file-1.
1164 */
1165 temp->name = "/dev/null";
1166 strcpy(temp->hex, ".");
1167 strcpy(temp->mode, ".");
1168 return;
1169 }
1170
1171 if (!one->sha1_valid ||
1172 work_tree_matches(name, one->sha1)) {
1173 struct stat st;
1174 if (lstat(name, &st) < 0) {
1175 if (errno == ENOENT)
1176 goto not_a_valid_file;
1177 die("stat(%s): %s", name, strerror(errno));
1178 }
1179 if (S_ISLNK(st.st_mode)) {
1180 int ret;
1181 char buf[PATH_MAX + 1]; /* ought to be SYMLINK_MAX */
1182 if (sizeof(buf) <= st.st_size)
1183 die("symlink too long: %s", name);
1184 ret = readlink(name, buf, st.st_size);
1185 if (ret < 0)
1186 die("readlink(%s)", name);
1187 prep_temp_blob(temp, buf, st.st_size,
1188 (one->sha1_valid ?
1189 one->sha1 : null_sha1),
1190 (one->sha1_valid ?
1191 one->mode : S_IFLNK));
1192 }
1193 else {
1194 /* we can borrow from the file in the work tree */
1195 temp->name = name;
1196 if (!one->sha1_valid)
1197 strcpy(temp->hex, sha1_to_hex(null_sha1));
1198 else
1199 strcpy(temp->hex, sha1_to_hex(one->sha1));
1200 /* Even though we may sometimes borrow the
1201 * contents from the work tree, we always want
1202 * one->mode. mode is trustworthy even when
1203 * !(one->sha1_valid), as long as
1204 * DIFF_FILE_VALID(one).
1205 */
1206 sprintf(temp->mode, "%06o", one->mode);
1207 }
1208 return;
1209 }
1210 else {
1211 if (diff_populate_filespec(one, 0))
1212 die("cannot read data blob for %s", one->path);
1213 prep_temp_blob(temp, one->data, one->size,
1214 one->sha1, one->mode);
1215 }
1216}
1217
1218static void remove_tempfile(void)
1219{
1220 int i;
1221
1222 for (i = 0; i < 2; i++)
1223 if (diff_temp[i].name == diff_temp[i].tmp_path) {
1224 unlink(diff_temp[i].name);
1225 diff_temp[i].name = NULL;
1226 }
1227}
1228
1229static void remove_tempfile_on_signal(int signo)
1230{
1231 remove_tempfile();
1232 signal(SIGINT, SIG_DFL);
1233 raise(signo);
1234}
1235
1236static int spawn_prog(const char *pgm, const char **arg)
1237{
1238 pid_t pid;
1239 int status;
1240
1241 fflush(NULL);
1242 pid = fork();
1243 if (pid < 0)
1244 die("unable to fork");
1245 if (!pid) {
1246 execvp(pgm, (char *const*) arg);
1247 exit(255);
1248 }
1249
1250 while (waitpid(pid, &status, 0) < 0) {
1251 if (errno == EINTR)
1252 continue;
1253 return -1;
1254 }
1255
1256 /* Earlier we did not check the exit status because
1257 * diff exits non-zero if files are different, and
1258 * we are not interested in knowing that. It was a
1259 * mistake which made it harder to quit a diff-*
1260 * session that uses the git-apply-patch-script as
1261 * the GIT_EXTERNAL_DIFF. A custom GIT_EXTERNAL_DIFF
1262 * should also exit non-zero only when it wants to
1263 * abort the entire diff-* session.
1264 */
1265 if (WIFEXITED(status) && !WEXITSTATUS(status))
1266 return 0;
1267 return -1;
1268}
1269
1270/* An external diff command takes:
1271 *
1272 * diff-cmd name infile1 infile1-sha1 infile1-mode \
1273 * infile2 infile2-sha1 infile2-mode [ rename-to ]
1274 *
1275 */
1276static void run_external_diff(const char *pgm,
1277 const char *name,
1278 const char *other,
1279 struct diff_filespec *one,
1280 struct diff_filespec *two,
1281 const char *xfrm_msg,
1282 int complete_rewrite)
1283{
1284 const char *spawn_arg[10];
1285 struct diff_tempfile *temp = diff_temp;
1286 int retval;
1287 static int atexit_asked = 0;
1288 const char *othername;
1289 const char **arg = &spawn_arg[0];
1290
1291 othername = (other? other : name);
1292 if (one && two) {
1293 prepare_temp_file(name, &temp[0], one);
1294 prepare_temp_file(othername, &temp[1], two);
1295 if (! atexit_asked &&
1296 (temp[0].name == temp[0].tmp_path ||
1297 temp[1].name == temp[1].tmp_path)) {
1298 atexit_asked = 1;
1299 atexit(remove_tempfile);
1300 }
1301 signal(SIGINT, remove_tempfile_on_signal);
1302 }
1303
1304 if (one && two) {
1305 *arg++ = pgm;
1306 *arg++ = name;
1307 *arg++ = temp[0].name;
1308 *arg++ = temp[0].hex;
1309 *arg++ = temp[0].mode;
1310 *arg++ = temp[1].name;
1311 *arg++ = temp[1].hex;
1312 *arg++ = temp[1].mode;
1313 if (other) {
1314 *arg++ = other;
1315 *arg++ = xfrm_msg;
1316 }
1317 } else {
1318 *arg++ = pgm;
1319 *arg++ = name;
1320 }
1321 *arg = NULL;
1322 retval = spawn_prog(pgm, spawn_arg);
1323 remove_tempfile();
1324 if (retval) {
1325 fprintf(stderr, "external diff died, stopping at %s.\n", name);
1326 exit(1);
1327 }
1328}
1329
1330static void run_diff_cmd(const char *pgm,
1331 const char *name,
1332 const char *other,
1333 struct diff_filespec *one,
1334 struct diff_filespec *two,
1335 const char *xfrm_msg,
1336 struct diff_options *o,
1337 int complete_rewrite)
1338{
1339 if (pgm) {
1340 run_external_diff(pgm, name, other, one, two, xfrm_msg,
1341 complete_rewrite);
1342 return;
1343 }
1344 if (one && two)
1345 builtin_diff(name, other ? other : name,
1346 one, two, xfrm_msg, o, complete_rewrite);
1347 else
1348 printf("* Unmerged path %s\n", name);
1349}
1350
1351static void diff_fill_sha1_info(struct diff_filespec *one)
1352{
1353 if (DIFF_FILE_VALID(one)) {
1354 if (!one->sha1_valid) {
1355 struct stat st;
1356 if (lstat(one->path, &st) < 0)
1357 die("stat %s", one->path);
1358 if (index_path(one->sha1, one->path, &st, 0))
1359 die("cannot hash %s\n", one->path);
1360 }
1361 }
1362 else
1363 memset(one->sha1, 0, 20);
1364}
1365
1366static void run_diff(struct diff_filepair *p, struct diff_options *o)
1367{
1368 const char *pgm = external_diff();
1369 char msg[PATH_MAX*2+300], *xfrm_msg;
1370 struct diff_filespec *one;
1371 struct diff_filespec *two;
1372 const char *name;
1373 const char *other;
1374 char *name_munged, *other_munged;
1375 int complete_rewrite = 0;
1376 int len;
1377
1378 if (DIFF_PAIR_UNMERGED(p)) {
1379 /* unmerged */
1380 run_diff_cmd(pgm, p->one->path, NULL, NULL, NULL, NULL, o, 0);
1381 return;
1382 }
1383
1384 name = p->one->path;
1385 other = (strcmp(name, p->two->path) ? p->two->path : NULL);
1386 name_munged = quote_one(name);
1387 other_munged = quote_one(other);
1388 one = p->one; two = p->two;
1389
1390 diff_fill_sha1_info(one);
1391 diff_fill_sha1_info(two);
1392
1393 len = 0;
1394 switch (p->status) {
1395 case DIFF_STATUS_COPIED:
1396 len += snprintf(msg + len, sizeof(msg) - len,
1397 "similarity index %d%%\n"
1398 "copy from %s\n"
1399 "copy to %s\n",
1400 (int)(0.5 + p->score * 100.0/MAX_SCORE),
1401 name_munged, other_munged);
1402 break;
1403 case DIFF_STATUS_RENAMED:
1404 len += snprintf(msg + len, sizeof(msg) - len,
1405 "similarity index %d%%\n"
1406 "rename from %s\n"
1407 "rename to %s\n",
1408 (int)(0.5 + p->score * 100.0/MAX_SCORE),
1409 name_munged, other_munged);
1410 break;
1411 case DIFF_STATUS_MODIFIED:
1412 if (p->score) {
1413 len += snprintf(msg + len, sizeof(msg) - len,
1414 "dissimilarity index %d%%\n",
1415 (int)(0.5 + p->score *
1416 100.0/MAX_SCORE));
1417 complete_rewrite = 1;
1418 break;
1419 }
1420 /* fallthru */
1421 default:
1422 /* nothing */
1423 ;
1424 }
1425
1426 if (memcmp(one->sha1, two->sha1, 20)) {
1427 int abbrev = o->full_index ? 40 : DEFAULT_ABBREV;
1428
1429 len += snprintf(msg + len, sizeof(msg) - len,
1430 "index %.*s..%.*s",
1431 abbrev, sha1_to_hex(one->sha1),
1432 abbrev, sha1_to_hex(two->sha1));
1433 if (one->mode == two->mode)
1434 len += snprintf(msg + len, sizeof(msg) - len,
1435 " %06o", one->mode);
1436 len += snprintf(msg + len, sizeof(msg) - len, "\n");
1437 }
1438
1439 if (len)
1440 msg[--len] = 0;
1441 xfrm_msg = len ? msg : NULL;
1442
1443 if (!pgm &&
1444 DIFF_FILE_VALID(one) && DIFF_FILE_VALID(two) &&
1445 (S_IFMT & one->mode) != (S_IFMT & two->mode)) {
1446 /* a filepair that changes between file and symlink
1447 * needs to be split into deletion and creation.
1448 */
1449 struct diff_filespec *null = alloc_filespec(two->path);
1450 run_diff_cmd(NULL, name, other, one, null, xfrm_msg, o, 0);
1451 free(null);
1452 null = alloc_filespec(one->path);
1453 run_diff_cmd(NULL, name, other, null, two, xfrm_msg, o, 0);
1454 free(null);
1455 }
1456 else
1457 run_diff_cmd(pgm, name, other, one, two, xfrm_msg, o,
1458 complete_rewrite);
1459
1460 free(name_munged);
1461 free(other_munged);
1462}
1463
1464static void run_diffstat(struct diff_filepair *p, struct diff_options *o,
1465 struct diffstat_t *diffstat)
1466{
1467 const char *name;
1468 const char *other;
1469 int complete_rewrite = 0;
1470
1471 if (DIFF_PAIR_UNMERGED(p)) {
1472 /* unmerged */
1473 builtin_diffstat(p->one->path, NULL, NULL, NULL, diffstat, o, 0);
1474 return;
1475 }
1476
1477 name = p->one->path;
1478 other = (strcmp(name, p->two->path) ? p->two->path : NULL);
1479
1480 diff_fill_sha1_info(p->one);
1481 diff_fill_sha1_info(p->two);
1482
1483 if (p->status == DIFF_STATUS_MODIFIED && p->score)
1484 complete_rewrite = 1;
1485 builtin_diffstat(name, other, p->one, p->two, diffstat, o, complete_rewrite);
1486}
1487
1488static void run_checkdiff(struct diff_filepair *p, struct diff_options *o)
1489{
1490 const char *name;
1491 const char *other;
1492
1493 if (DIFF_PAIR_UNMERGED(p)) {
1494 /* unmerged */
1495 return;
1496 }
1497
1498 name = p->one->path;
1499 other = (strcmp(name, p->two->path) ? p->two->path : NULL);
1500
1501 diff_fill_sha1_info(p->one);
1502 diff_fill_sha1_info(p->two);
1503
1504 builtin_checkdiff(name, other, p->one, p->two);
1505}
1506
1507void diff_setup(struct diff_options *options)
1508{
1509 memset(options, 0, sizeof(*options));
1510 options->line_termination = '\n';
1511 options->break_opt = -1;
1512 options->rename_limit = -1;
1513 options->context = 3;
1514 options->msg_sep = "";
1515
1516 options->change = diff_change;
1517 options->add_remove = diff_addremove;
1518 options->color_diff = diff_use_color_default;
1519 options->detect_rename = diff_detect_rename_default;
1520}
1521
1522int diff_setup_done(struct diff_options *options)
1523{
1524 if ((options->find_copies_harder &&
1525 options->detect_rename != DIFF_DETECT_COPY) ||
1526 (0 <= options->rename_limit && !options->detect_rename))
1527 return -1;
1528
1529 if (options->output_format & (DIFF_FORMAT_NAME |
1530 DIFF_FORMAT_NAME_STATUS |
1531 DIFF_FORMAT_CHECKDIFF |
1532 DIFF_FORMAT_NO_OUTPUT))
1533 options->output_format &= ~(DIFF_FORMAT_RAW |
1534 DIFF_FORMAT_DIFFSTAT |
1535 DIFF_FORMAT_SUMMARY |
1536 DIFF_FORMAT_PATCH);
1537
1538 /*
1539 * These cases always need recursive; we do not drop caller-supplied
1540 * recursive bits for other formats here.
1541 */
1542 if (options->output_format & (DIFF_FORMAT_PATCH |
1543 DIFF_FORMAT_DIFFSTAT |
1544 DIFF_FORMAT_CHECKDIFF))
1545 options->recursive = 1;
1546 /*
1547 * Also pickaxe would not work very well if you do not say recursive
1548 */
1549 if (options->pickaxe)
1550 options->recursive = 1;
1551
1552 if (options->detect_rename && options->rename_limit < 0)
1553 options->rename_limit = diff_rename_limit_default;
1554 if (options->setup & DIFF_SETUP_USE_CACHE) {
1555 if (!active_cache)
1556 /* read-cache does not die even when it fails
1557 * so it is safe for us to do this here. Also
1558 * it does not smudge active_cache or active_nr
1559 * when it fails, so we do not have to worry about
1560 * cleaning it up ourselves either.
1561 */
1562 read_cache();
1563 }
1564 if (options->setup & DIFF_SETUP_USE_SIZE_CACHE)
1565 use_size_cache = 1;
1566 if (options->abbrev <= 0 || 40 < options->abbrev)
1567 options->abbrev = 40; /* full */
1568
1569 return 0;
1570}
1571
1572static int opt_arg(const char *arg, int arg_short, const char *arg_long, int *val)
1573{
1574 char c, *eq;
1575 int len;
1576
1577 if (*arg != '-')
1578 return 0;
1579 c = *++arg;
1580 if (!c)
1581 return 0;
1582 if (c == arg_short) {
1583 c = *++arg;
1584 if (!c)
1585 return 1;
1586 if (val && isdigit(c)) {
1587 char *end;
1588 int n = strtoul(arg, &end, 10);
1589 if (*end)
1590 return 0;
1591 *val = n;
1592 return 1;
1593 }
1594 return 0;
1595 }
1596 if (c != '-')
1597 return 0;
1598 arg++;
1599 eq = strchr(arg, '=');
1600 if (eq)
1601 len = eq - arg;
1602 else
1603 len = strlen(arg);
1604 if (!len || strncmp(arg, arg_long, len))
1605 return 0;
1606 if (eq) {
1607 int n;
1608 char *end;
1609 if (!isdigit(*++eq))
1610 return 0;
1611 n = strtoul(eq, &end, 10);
1612 if (*end)
1613 return 0;
1614 *val = n;
1615 }
1616 return 1;
1617}
1618
1619int diff_opt_parse(struct diff_options *options, const char **av, int ac)
1620{
1621 const char *arg = av[0];
1622 if (!strcmp(arg, "-p") || !strcmp(arg, "-u"))
1623 options->output_format |= DIFF_FORMAT_PATCH;
1624 else if (opt_arg(arg, 'U', "unified", &options->context))
1625 options->output_format |= DIFF_FORMAT_PATCH;
1626 else if (!strcmp(arg, "--raw"))
1627 options->output_format |= DIFF_FORMAT_RAW;
1628 else if (!strcmp(arg, "--patch-with-raw")) {
1629 options->output_format |= DIFF_FORMAT_PATCH | DIFF_FORMAT_RAW;
1630 }
1631 else if (!strcmp(arg, "--stat"))
1632 options->output_format |= DIFF_FORMAT_DIFFSTAT;
1633 else if (!strcmp(arg, "--check"))
1634 options->output_format |= DIFF_FORMAT_CHECKDIFF;
1635 else if (!strcmp(arg, "--summary"))
1636 options->output_format |= DIFF_FORMAT_SUMMARY;
1637 else if (!strcmp(arg, "--patch-with-stat")) {
1638 options->output_format |= DIFF_FORMAT_PATCH | DIFF_FORMAT_DIFFSTAT;
1639 }
1640 else if (!strcmp(arg, "-z"))
1641 options->line_termination = 0;
1642 else if (!strncmp(arg, "-l", 2))
1643 options->rename_limit = strtoul(arg+2, NULL, 10);
1644 else if (!strcmp(arg, "--full-index"))
1645 options->full_index = 1;
1646 else if (!strcmp(arg, "--binary")) {
1647 options->output_format |= DIFF_FORMAT_PATCH;
1648 options->full_index = options->binary = 1;
1649 }
1650 else if (!strcmp(arg, "-a") || !strcmp(arg, "--text")) {
1651 options->text = 1;
1652 }
1653 else if (!strcmp(arg, "--name-only"))
1654 options->output_format |= DIFF_FORMAT_NAME;
1655 else if (!strcmp(arg, "--name-status"))
1656 options->output_format |= DIFF_FORMAT_NAME_STATUS;
1657 else if (!strcmp(arg, "-R"))
1658 options->reverse_diff = 1;
1659 else if (!strncmp(arg, "-S", 2))
1660 options->pickaxe = arg + 2;
1661 else if (!strcmp(arg, "-s")) {
1662 options->output_format |= DIFF_FORMAT_NO_OUTPUT;
1663 }
1664 else if (!strncmp(arg, "-O", 2))
1665 options->orderfile = arg + 2;
1666 else if (!strncmp(arg, "--diff-filter=", 14))
1667 options->filter = arg + 14;
1668 else if (!strcmp(arg, "--pickaxe-all"))
1669 options->pickaxe_opts = DIFF_PICKAXE_ALL;
1670 else if (!strcmp(arg, "--pickaxe-regex"))
1671 options->pickaxe_opts = DIFF_PICKAXE_REGEX;
1672 else if (!strncmp(arg, "-B", 2)) {
1673 if ((options->break_opt =
1674 diff_scoreopt_parse(arg)) == -1)
1675 return -1;
1676 }
1677 else if (!strncmp(arg, "-M", 2)) {
1678 if ((options->rename_score =
1679 diff_scoreopt_parse(arg)) == -1)
1680 return -1;
1681 options->detect_rename = DIFF_DETECT_RENAME;
1682 }
1683 else if (!strncmp(arg, "-C", 2)) {
1684 if ((options->rename_score =
1685 diff_scoreopt_parse(arg)) == -1)
1686 return -1;
1687 options->detect_rename = DIFF_DETECT_COPY;
1688 }
1689 else if (!strcmp(arg, "--find-copies-harder"))
1690 options->find_copies_harder = 1;
1691 else if (!strcmp(arg, "--abbrev"))
1692 options->abbrev = DEFAULT_ABBREV;
1693 else if (!strncmp(arg, "--abbrev=", 9)) {
1694 options->abbrev = strtoul(arg + 9, NULL, 10);
1695 if (options->abbrev < MINIMUM_ABBREV)
1696 options->abbrev = MINIMUM_ABBREV;
1697 else if (40 < options->abbrev)
1698 options->abbrev = 40;
1699 }
1700 else if (!strcmp(arg, "--color"))
1701 options->color_diff = 1;
1702 else if (!strcmp(arg, "--no-color"))
1703 options->color_diff = 0;
1704 else if (!strcmp(arg, "-w") || !strcmp(arg, "--ignore-all-space"))
1705 options->xdl_opts |= XDF_IGNORE_WHITESPACE;
1706 else if (!strcmp(arg, "-b") || !strcmp(arg, "--ignore-space-change"))
1707 options->xdl_opts |= XDF_IGNORE_WHITESPACE_CHANGE;
1708 else if (!strcmp(arg, "--no-renames"))
1709 options->detect_rename = 0;
1710 else
1711 return 0;
1712 return 1;
1713}
1714
1715static int parse_num(const char **cp_p)
1716{
1717 unsigned long num, scale;
1718 int ch, dot;
1719 const char *cp = *cp_p;
1720
1721 num = 0;
1722 scale = 1;
1723 dot = 0;
1724 for(;;) {
1725 ch = *cp;
1726 if ( !dot && ch == '.' ) {
1727 scale = 1;
1728 dot = 1;
1729 } else if ( ch == '%' ) {
1730 scale = dot ? scale*100 : 100;
1731 cp++; /* % is always at the end */
1732 break;
1733 } else if ( ch >= '0' && ch <= '9' ) {
1734 if ( scale < 100000 ) {
1735 scale *= 10;
1736 num = (num*10) + (ch-'0');
1737 }
1738 } else {
1739 break;
1740 }
1741 cp++;
1742 }
1743 *cp_p = cp;
1744
1745 /* user says num divided by scale and we say internally that
1746 * is MAX_SCORE * num / scale.
1747 */
1748 return (num >= scale) ? MAX_SCORE : (MAX_SCORE * num / scale);
1749}
1750
1751int diff_scoreopt_parse(const char *opt)
1752{
1753 int opt1, opt2, cmd;
1754
1755 if (*opt++ != '-')
1756 return -1;
1757 cmd = *opt++;
1758 if (cmd != 'M' && cmd != 'C' && cmd != 'B')
1759 return -1; /* that is not a -M, -C nor -B option */
1760
1761 opt1 = parse_num(&opt);
1762 if (cmd != 'B')
1763 opt2 = 0;
1764 else {
1765 if (*opt == 0)
1766 opt2 = 0;
1767 else if (*opt != '/')
1768 return -1; /* we expect -B80/99 or -B80 */
1769 else {
1770 opt++;
1771 opt2 = parse_num(&opt);
1772 }
1773 }
1774 if (*opt != 0)
1775 return -1;
1776 return opt1 | (opt2 << 16);
1777}
1778
1779struct diff_queue_struct diff_queued_diff;
1780
1781void diff_q(struct diff_queue_struct *queue, struct diff_filepair *dp)
1782{
1783 if (queue->alloc <= queue->nr) {
1784 queue->alloc = alloc_nr(queue->alloc);
1785 queue->queue = xrealloc(queue->queue,
1786 sizeof(dp) * queue->alloc);
1787 }
1788 queue->queue[queue->nr++] = dp;
1789}
1790
1791struct diff_filepair *diff_queue(struct diff_queue_struct *queue,
1792 struct diff_filespec *one,
1793 struct diff_filespec *two)
1794{
1795 struct diff_filepair *dp = xmalloc(sizeof(*dp));
1796 dp->one = one;
1797 dp->two = two;
1798 dp->score = 0;
1799 dp->status = 0;
1800 dp->source_stays = 0;
1801 dp->broken_pair = 0;
1802 if (queue)
1803 diff_q(queue, dp);
1804 return dp;
1805}
1806
1807void diff_free_filepair(struct diff_filepair *p)
1808{
1809 diff_free_filespec_data(p->one);
1810 diff_free_filespec_data(p->two);
1811 free(p->one);
1812 free(p->two);
1813 free(p);
1814}
1815
1816/* This is different from find_unique_abbrev() in that
1817 * it stuffs the result with dots for alignment.
1818 */
1819const char *diff_unique_abbrev(const unsigned char *sha1, int len)
1820{
1821 int abblen;
1822 const char *abbrev;
1823 if (len == 40)
1824 return sha1_to_hex(sha1);
1825
1826 abbrev = find_unique_abbrev(sha1, len);
1827 if (!abbrev)
1828 return sha1_to_hex(sha1);
1829 abblen = strlen(abbrev);
1830 if (abblen < 37) {
1831 static char hex[41];
1832 if (len < abblen && abblen <= len + 2)
1833 sprintf(hex, "%s%.*s", abbrev, len+3-abblen, "..");
1834 else
1835 sprintf(hex, "%s...", abbrev);
1836 return hex;
1837 }
1838 return sha1_to_hex(sha1);
1839}
1840
1841static void diff_flush_raw(struct diff_filepair *p,
1842 struct diff_options *options)
1843{
1844 int two_paths;
1845 char status[10];
1846 int abbrev = options->abbrev;
1847 const char *path_one, *path_two;
1848 int inter_name_termination = '\t';
1849 int line_termination = options->line_termination;
1850
1851 if (!line_termination)
1852 inter_name_termination = 0;
1853
1854 path_one = p->one->path;
1855 path_two = p->two->path;
1856 if (line_termination) {
1857 path_one = quote_one(path_one);
1858 path_two = quote_one(path_two);
1859 }
1860
1861 if (p->score)
1862 sprintf(status, "%c%03d", p->status,
1863 (int)(0.5 + p->score * 100.0/MAX_SCORE));
1864 else {
1865 status[0] = p->status;
1866 status[1] = 0;
1867 }
1868 switch (p->status) {
1869 case DIFF_STATUS_COPIED:
1870 case DIFF_STATUS_RENAMED:
1871 two_paths = 1;
1872 break;
1873 case DIFF_STATUS_ADDED:
1874 case DIFF_STATUS_DELETED:
1875 two_paths = 0;
1876 break;
1877 default:
1878 two_paths = 0;
1879 break;
1880 }
1881 if (!(options->output_format & DIFF_FORMAT_NAME_STATUS)) {
1882 printf(":%06o %06o %s ",
1883 p->one->mode, p->two->mode,
1884 diff_unique_abbrev(p->one->sha1, abbrev));
1885 printf("%s ",
1886 diff_unique_abbrev(p->two->sha1, abbrev));
1887 }
1888 printf("%s%c%s", status, inter_name_termination, path_one);
1889 if (two_paths)
1890 printf("%c%s", inter_name_termination, path_two);
1891 putchar(line_termination);
1892 if (path_one != p->one->path)
1893 free((void*)path_one);
1894 if (path_two != p->two->path)
1895 free((void*)path_two);
1896}
1897
1898static void diff_flush_name(struct diff_filepair *p, int line_termination)
1899{
1900 char *path = p->two->path;
1901
1902 if (line_termination)
1903 path = quote_one(p->two->path);
1904 printf("%s%c", path, line_termination);
1905 if (p->two->path != path)
1906 free(path);
1907}
1908
1909int diff_unmodified_pair(struct diff_filepair *p)
1910{
1911 /* This function is written stricter than necessary to support
1912 * the currently implemented transformers, but the idea is to
1913 * let transformers to produce diff_filepairs any way they want,
1914 * and filter and clean them up here before producing the output.
1915 */
1916 struct diff_filespec *one, *two;
1917
1918 if (DIFF_PAIR_UNMERGED(p))
1919 return 0; /* unmerged is interesting */
1920
1921 one = p->one;
1922 two = p->two;
1923
1924 /* deletion, addition, mode or type change
1925 * and rename are all interesting.
1926 */
1927 if (DIFF_FILE_VALID(one) != DIFF_FILE_VALID(two) ||
1928 DIFF_PAIR_MODE_CHANGED(p) ||
1929 strcmp(one->path, two->path))
1930 return 0;
1931
1932 /* both are valid and point at the same path. that is, we are
1933 * dealing with a change.
1934 */
1935 if (one->sha1_valid && two->sha1_valid &&
1936 !memcmp(one->sha1, two->sha1, sizeof(one->sha1)))
1937 return 1; /* no change */
1938 if (!one->sha1_valid && !two->sha1_valid)
1939 return 1; /* both look at the same file on the filesystem. */
1940 return 0;
1941}
1942
1943static void diff_flush_patch(struct diff_filepair *p, struct diff_options *o)
1944{
1945 if (diff_unmodified_pair(p))
1946 return;
1947
1948 if ((DIFF_FILE_VALID(p->one) && S_ISDIR(p->one->mode)) ||
1949 (DIFF_FILE_VALID(p->two) && S_ISDIR(p->two->mode)))
1950 return; /* no tree diffs in patch format */
1951
1952 run_diff(p, o);
1953}
1954
1955static void diff_flush_stat(struct diff_filepair *p, struct diff_options *o,
1956 struct diffstat_t *diffstat)
1957{
1958 if (diff_unmodified_pair(p))
1959 return;
1960
1961 if ((DIFF_FILE_VALID(p->one) && S_ISDIR(p->one->mode)) ||
1962 (DIFF_FILE_VALID(p->two) && S_ISDIR(p->two->mode)))
1963 return; /* no tree diffs in patch format */
1964
1965 run_diffstat(p, o, diffstat);
1966}
1967
1968static void diff_flush_checkdiff(struct diff_filepair *p,
1969 struct diff_options *o)
1970{
1971 if (diff_unmodified_pair(p))
1972 return;
1973
1974 if ((DIFF_FILE_VALID(p->one) && S_ISDIR(p->one->mode)) ||
1975 (DIFF_FILE_VALID(p->two) && S_ISDIR(p->two->mode)))
1976 return; /* no tree diffs in patch format */
1977
1978 run_checkdiff(p, o);
1979}
1980
1981int diff_queue_is_empty(void)
1982{
1983 struct diff_queue_struct *q = &diff_queued_diff;
1984 int i;
1985 for (i = 0; i < q->nr; i++)
1986 if (!diff_unmodified_pair(q->queue[i]))
1987 return 0;
1988 return 1;
1989}
1990
1991#if DIFF_DEBUG
1992void diff_debug_filespec(struct diff_filespec *s, int x, const char *one)
1993{
1994 fprintf(stderr, "queue[%d] %s (%s) %s %06o %s\n",
1995 x, one ? one : "",
1996 s->path,
1997 DIFF_FILE_VALID(s) ? "valid" : "invalid",
1998 s->mode,
1999 s->sha1_valid ? sha1_to_hex(s->sha1) : "");
2000 fprintf(stderr, "queue[%d] %s size %lu flags %d\n",
2001 x, one ? one : "",
2002 s->size, s->xfrm_flags);
2003}
2004
2005void diff_debug_filepair(const struct diff_filepair *p, int i)
2006{
2007 diff_debug_filespec(p->one, i, "one");
2008 diff_debug_filespec(p->two, i, "two");
2009 fprintf(stderr, "score %d, status %c stays %d broken %d\n",
2010 p->score, p->status ? p->status : '?',
2011 p->source_stays, p->broken_pair);
2012}
2013
2014void diff_debug_queue(const char *msg, struct diff_queue_struct *q)
2015{
2016 int i;
2017 if (msg)
2018 fprintf(stderr, "%s\n", msg);
2019 fprintf(stderr, "q->nr = %d\n", q->nr);
2020 for (i = 0; i < q->nr; i++) {
2021 struct diff_filepair *p = q->queue[i];
2022 diff_debug_filepair(p, i);
2023 }
2024}
2025#endif
2026
2027static void diff_resolve_rename_copy(void)
2028{
2029 int i, j;
2030 struct diff_filepair *p, *pp;
2031 struct diff_queue_struct *q = &diff_queued_diff;
2032
2033 diff_debug_queue("resolve-rename-copy", q);
2034
2035 for (i = 0; i < q->nr; i++) {
2036 p = q->queue[i];
2037 p->status = 0; /* undecided */
2038 if (DIFF_PAIR_UNMERGED(p))
2039 p->status = DIFF_STATUS_UNMERGED;
2040 else if (!DIFF_FILE_VALID(p->one))
2041 p->status = DIFF_STATUS_ADDED;
2042 else if (!DIFF_FILE_VALID(p->two))
2043 p->status = DIFF_STATUS_DELETED;
2044 else if (DIFF_PAIR_TYPE_CHANGED(p))
2045 p->status = DIFF_STATUS_TYPE_CHANGED;
2046
2047 /* from this point on, we are dealing with a pair
2048 * whose both sides are valid and of the same type, i.e.
2049 * either in-place edit or rename/copy edit.
2050 */
2051 else if (DIFF_PAIR_RENAME(p)) {
2052 if (p->source_stays) {
2053 p->status = DIFF_STATUS_COPIED;
2054 continue;
2055 }
2056 /* See if there is some other filepair that
2057 * copies from the same source as us. If so
2058 * we are a copy. Otherwise we are either a
2059 * copy if the path stays, or a rename if it
2060 * does not, but we already handled "stays" case.
2061 */
2062 for (j = i + 1; j < q->nr; j++) {
2063 pp = q->queue[j];
2064 if (strcmp(pp->one->path, p->one->path))
2065 continue; /* not us */
2066 if (!DIFF_PAIR_RENAME(pp))
2067 continue; /* not a rename/copy */
2068 /* pp is a rename/copy from the same source */
2069 p->status = DIFF_STATUS_COPIED;
2070 break;
2071 }
2072 if (!p->status)
2073 p->status = DIFF_STATUS_RENAMED;
2074 }
2075 else if (memcmp(p->one->sha1, p->two->sha1, 20) ||
2076 p->one->mode != p->two->mode)
2077 p->status = DIFF_STATUS_MODIFIED;
2078 else {
2079 /* This is a "no-change" entry and should not
2080 * happen anymore, but prepare for broken callers.
2081 */
2082 error("feeding unmodified %s to diffcore",
2083 p->one->path);
2084 p->status = DIFF_STATUS_UNKNOWN;
2085 }
2086 }
2087 diff_debug_queue("resolve-rename-copy done", q);
2088}
2089
2090static int check_pair_status(struct diff_filepair *p)
2091{
2092 switch (p->status) {
2093 case DIFF_STATUS_UNKNOWN:
2094 return 0;
2095 case 0:
2096 die("internal error in diff-resolve-rename-copy");
2097 default:
2098 return 1;
2099 }
2100}
2101
2102static void flush_one_pair(struct diff_filepair *p, struct diff_options *opt)
2103{
2104 int fmt = opt->output_format;
2105
2106 if (fmt & DIFF_FORMAT_CHECKDIFF)
2107 diff_flush_checkdiff(p, opt);
2108 else if (fmt & (DIFF_FORMAT_RAW | DIFF_FORMAT_NAME_STATUS))
2109 diff_flush_raw(p, opt);
2110 else if (fmt & DIFF_FORMAT_NAME)
2111 diff_flush_name(p, opt->line_termination);
2112}
2113
2114static void show_file_mode_name(const char *newdelete, struct diff_filespec *fs)
2115{
2116 if (fs->mode)
2117 printf(" %s mode %06o %s\n", newdelete, fs->mode, fs->path);
2118 else
2119 printf(" %s %s\n", newdelete, fs->path);
2120}
2121
2122
2123static void show_mode_change(struct diff_filepair *p, int show_name)
2124{
2125 if (p->one->mode && p->two->mode && p->one->mode != p->two->mode) {
2126 if (show_name)
2127 printf(" mode change %06o => %06o %s\n",
2128 p->one->mode, p->two->mode, p->two->path);
2129 else
2130 printf(" mode change %06o => %06o\n",
2131 p->one->mode, p->two->mode);
2132 }
2133}
2134
2135static void show_rename_copy(const char *renamecopy, struct diff_filepair *p)
2136{
2137 const char *old, *new;
2138
2139 /* Find common prefix */
2140 old = p->one->path;
2141 new = p->two->path;
2142 while (1) {
2143 const char *slash_old, *slash_new;
2144 slash_old = strchr(old, '/');
2145 slash_new = strchr(new, '/');
2146 if (!slash_old ||
2147 !slash_new ||
2148 slash_old - old != slash_new - new ||
2149 memcmp(old, new, slash_new - new))
2150 break;
2151 old = slash_old + 1;
2152 new = slash_new + 1;
2153 }
2154 /* p->one->path thru old is the common prefix, and old and new
2155 * through the end of names are renames
2156 */
2157 if (old != p->one->path)
2158 printf(" %s %.*s{%s => %s} (%d%%)\n", renamecopy,
2159 (int)(old - p->one->path), p->one->path,
2160 old, new, (int)(0.5 + p->score * 100.0/MAX_SCORE));
2161 else
2162 printf(" %s %s => %s (%d%%)\n", renamecopy,
2163 p->one->path, p->two->path,
2164 (int)(0.5 + p->score * 100.0/MAX_SCORE));
2165 show_mode_change(p, 0);
2166}
2167
2168static void diff_summary(struct diff_filepair *p)
2169{
2170 switch(p->status) {
2171 case DIFF_STATUS_DELETED:
2172 show_file_mode_name("delete", p->one);
2173 break;
2174 case DIFF_STATUS_ADDED:
2175 show_file_mode_name("create", p->two);
2176 break;
2177 case DIFF_STATUS_COPIED:
2178 show_rename_copy("copy", p);
2179 break;
2180 case DIFF_STATUS_RENAMED:
2181 show_rename_copy("rename", p);
2182 break;
2183 default:
2184 if (p->score) {
2185 printf(" rewrite %s (%d%%)\n", p->two->path,
2186 (int)(0.5 + p->score * 100.0/MAX_SCORE));
2187 show_mode_change(p, 0);
2188 } else show_mode_change(p, 1);
2189 break;
2190 }
2191}
2192
2193struct patch_id_t {
2194 struct xdiff_emit_state xm;
2195 SHA_CTX *ctx;
2196 int patchlen;
2197};
2198
2199static int remove_space(char *line, int len)
2200{
2201 int i;
2202 char *dst = line;
2203 unsigned char c;
2204
2205 for (i = 0; i < len; i++)
2206 if (!isspace((c = line[i])))
2207 *dst++ = c;
2208
2209 return dst - line;
2210}
2211
2212static void patch_id_consume(void *priv, char *line, unsigned long len)
2213{
2214 struct patch_id_t *data = priv;
2215 int new_len;
2216
2217 /* Ignore line numbers when computing the SHA1 of the patch */
2218 if (!strncmp(line, "@@ -", 4))
2219 return;
2220
2221 new_len = remove_space(line, len);
2222
2223 SHA1_Update(data->ctx, line, new_len);
2224 data->patchlen += new_len;
2225}
2226
2227/* returns 0 upon success, and writes result into sha1 */
2228static int diff_get_patch_id(struct diff_options *options, unsigned char *sha1)
2229{
2230 struct diff_queue_struct *q = &diff_queued_diff;
2231 int i;
2232 SHA_CTX ctx;
2233 struct patch_id_t data;
2234 char buffer[PATH_MAX * 4 + 20];
2235
2236 SHA1_Init(&ctx);
2237 memset(&data, 0, sizeof(struct patch_id_t));
2238 data.ctx = &ctx;
2239 data.xm.consume = patch_id_consume;
2240
2241 for (i = 0; i < q->nr; i++) {
2242 xpparam_t xpp;
2243 xdemitconf_t xecfg;
2244 xdemitcb_t ecb;
2245 mmfile_t mf1, mf2;
2246 struct diff_filepair *p = q->queue[i];
2247 int len1, len2;
2248
2249 if (p->status == 0)
2250 return error("internal diff status error");
2251 if (p->status == DIFF_STATUS_UNKNOWN)
2252 continue;
2253 if (diff_unmodified_pair(p))
2254 continue;
2255 if ((DIFF_FILE_VALID(p->one) && S_ISDIR(p->one->mode)) ||
2256 (DIFF_FILE_VALID(p->two) && S_ISDIR(p->two->mode)))
2257 continue;
2258 if (DIFF_PAIR_UNMERGED(p))
2259 continue;
2260
2261 diff_fill_sha1_info(p->one);
2262 diff_fill_sha1_info(p->two);
2263 if (fill_mmfile(&mf1, p->one) < 0 ||
2264 fill_mmfile(&mf2, p->two) < 0)
2265 return error("unable to read files to diff");
2266
2267 /* Maybe hash p->two? into the patch id? */
2268 if (mmfile_is_binary(&mf2))
2269 continue;
2270
2271 len1 = remove_space(p->one->path, strlen(p->one->path));
2272 len2 = remove_space(p->two->path, strlen(p->two->path));
2273 if (p->one->mode == 0)
2274 len1 = snprintf(buffer, sizeof(buffer),
2275 "diff--gita/%.*sb/%.*s"
2276 "newfilemode%06o"
2277 "---/dev/null"
2278 "+++b/%.*s",
2279 len1, p->one->path,
2280 len2, p->two->path,
2281 p->two->mode,
2282 len2, p->two->path);
2283 else if (p->two->mode == 0)
2284 len1 = snprintf(buffer, sizeof(buffer),
2285 "diff--gita/%.*sb/%.*s"
2286 "deletedfilemode%06o"
2287 "---a/%.*s"
2288 "+++/dev/null",
2289 len1, p->one->path,
2290 len2, p->two->path,
2291 p->one->mode,
2292 len1, p->one->path);
2293 else
2294 len1 = snprintf(buffer, sizeof(buffer),
2295 "diff--gita/%.*sb/%.*s"
2296 "---a/%.*s"
2297 "+++b/%.*s",
2298 len1, p->one->path,
2299 len2, p->two->path,
2300 len1, p->one->path,
2301 len2, p->two->path);
2302 SHA1_Update(&ctx, buffer, len1);
2303
2304 xpp.flags = XDF_NEED_MINIMAL;
2305 xecfg.ctxlen = 3;
2306 xecfg.flags = XDL_EMIT_FUNCNAMES;
2307 ecb.outf = xdiff_outf;
2308 ecb.priv = &data;
2309 xdl_diff(&mf1, &mf2, &xpp, &xecfg, &ecb);
2310 }
2311
2312 SHA1_Final(sha1, &ctx);
2313 return 0;
2314}
2315
2316int diff_flush_patch_id(struct diff_options *options, unsigned char *sha1)
2317{
2318 struct diff_queue_struct *q = &diff_queued_diff;
2319 int i;
2320 int result = diff_get_patch_id(options, sha1);
2321
2322 for (i = 0; i < q->nr; i++)
2323 diff_free_filepair(q->queue[i]);
2324
2325 free(q->queue);
2326 q->queue = NULL;
2327 q->nr = q->alloc = 0;
2328
2329 return result;
2330}
2331
2332static int is_summary_empty(const struct diff_queue_struct *q)
2333{
2334 int i;
2335
2336 for (i = 0; i < q->nr; i++) {
2337 const struct diff_filepair *p = q->queue[i];
2338
2339 switch (p->status) {
2340 case DIFF_STATUS_DELETED:
2341 case DIFF_STATUS_ADDED:
2342 case DIFF_STATUS_COPIED:
2343 case DIFF_STATUS_RENAMED:
2344 return 0;
2345 default:
2346 if (p->score)
2347 return 0;
2348 if (p->one->mode && p->two->mode &&
2349 p->one->mode != p->two->mode)
2350 return 0;
2351 break;
2352 }
2353 }
2354 return 1;
2355}
2356
2357void diff_flush(struct diff_options *options)
2358{
2359 struct diff_queue_struct *q = &diff_queued_diff;
2360 int i, output_format = options->output_format;
2361 int separator = 0;
2362
2363 /*
2364 * Order: raw, stat, summary, patch
2365 * or: name/name-status/checkdiff (other bits clear)
2366 */
2367 if (!q->nr)
2368 goto free_queue;
2369
2370 if (output_format & (DIFF_FORMAT_RAW |
2371 DIFF_FORMAT_NAME |
2372 DIFF_FORMAT_NAME_STATUS |
2373 DIFF_FORMAT_CHECKDIFF)) {
2374 for (i = 0; i < q->nr; i++) {
2375 struct diff_filepair *p = q->queue[i];
2376 if (check_pair_status(p))
2377 flush_one_pair(p, options);
2378 }
2379 separator++;
2380 }
2381
2382 if (output_format & DIFF_FORMAT_DIFFSTAT) {
2383 struct diffstat_t diffstat;
2384
2385 memset(&diffstat, 0, sizeof(struct diffstat_t));
2386 diffstat.xm.consume = diffstat_consume;
2387 for (i = 0; i < q->nr; i++) {
2388 struct diff_filepair *p = q->queue[i];
2389 if (check_pair_status(p))
2390 diff_flush_stat(p, options, &diffstat);
2391 }
2392 show_stats(&diffstat);
2393 separator++;
2394 }
2395
2396 if (output_format & DIFF_FORMAT_SUMMARY && !is_summary_empty(q)) {
2397 for (i = 0; i < q->nr; i++)
2398 diff_summary(q->queue[i]);
2399 separator++;
2400 }
2401
2402 if (output_format & DIFF_FORMAT_PATCH) {
2403 if (separator) {
2404 if (options->stat_sep) {
2405 /* attach patch instead of inline */
2406 fputs(options->stat_sep, stdout);
2407 } else {
2408 putchar(options->line_termination);
2409 }
2410 }
2411
2412 for (i = 0; i < q->nr; i++) {
2413 struct diff_filepair *p = q->queue[i];
2414 if (check_pair_status(p))
2415 diff_flush_patch(p, options);
2416 }
2417 }
2418
2419 for (i = 0; i < q->nr; i++)
2420 diff_free_filepair(q->queue[i]);
2421free_queue:
2422 free(q->queue);
2423 q->queue = NULL;
2424 q->nr = q->alloc = 0;
2425}
2426
2427static void diffcore_apply_filter(const char *filter)
2428{
2429 int i;
2430 struct diff_queue_struct *q = &diff_queued_diff;
2431 struct diff_queue_struct outq;
2432 outq.queue = NULL;
2433 outq.nr = outq.alloc = 0;
2434
2435 if (!filter)
2436 return;
2437
2438 if (strchr(filter, DIFF_STATUS_FILTER_AON)) {
2439 int found;
2440 for (i = found = 0; !found && i < q->nr; i++) {
2441 struct diff_filepair *p = q->queue[i];
2442 if (((p->status == DIFF_STATUS_MODIFIED) &&
2443 ((p->score &&
2444 strchr(filter, DIFF_STATUS_FILTER_BROKEN)) ||
2445 (!p->score &&
2446 strchr(filter, DIFF_STATUS_MODIFIED)))) ||
2447 ((p->status != DIFF_STATUS_MODIFIED) &&
2448 strchr(filter, p->status)))
2449 found++;
2450 }
2451 if (found)
2452 return;
2453
2454 /* otherwise we will clear the whole queue
2455 * by copying the empty outq at the end of this
2456 * function, but first clear the current entries
2457 * in the queue.
2458 */
2459 for (i = 0; i < q->nr; i++)
2460 diff_free_filepair(q->queue[i]);
2461 }
2462 else {
2463 /* Only the matching ones */
2464 for (i = 0; i < q->nr; i++) {
2465 struct diff_filepair *p = q->queue[i];
2466
2467 if (((p->status == DIFF_STATUS_MODIFIED) &&
2468 ((p->score &&
2469 strchr(filter, DIFF_STATUS_FILTER_BROKEN)) ||
2470 (!p->score &&
2471 strchr(filter, DIFF_STATUS_MODIFIED)))) ||
2472 ((p->status != DIFF_STATUS_MODIFIED) &&
2473 strchr(filter, p->status)))
2474 diff_q(&outq, p);
2475 else
2476 diff_free_filepair(p);
2477 }
2478 }
2479 free(q->queue);
2480 *q = outq;
2481}
2482
2483void diffcore_std(struct diff_options *options)
2484{
2485 if (options->break_opt != -1)
2486 diffcore_break(options->break_opt);
2487 if (options->detect_rename)
2488 diffcore_rename(options);
2489 if (options->break_opt != -1)
2490 diffcore_merge_broken();
2491 if (options->pickaxe)
2492 diffcore_pickaxe(options->pickaxe, options->pickaxe_opts);
2493 if (options->orderfile)
2494 diffcore_order(options->orderfile);
2495 diff_resolve_rename_copy();
2496 diffcore_apply_filter(options->filter);
2497}
2498
2499
2500void diffcore_std_no_resolve(struct diff_options *options)
2501{
2502 if (options->pickaxe)
2503 diffcore_pickaxe(options->pickaxe, options->pickaxe_opts);
2504 if (options->orderfile)
2505 diffcore_order(options->orderfile);
2506 diffcore_apply_filter(options->filter);
2507}
2508
2509void diff_addremove(struct diff_options *options,
2510 int addremove, unsigned mode,
2511 const unsigned char *sha1,
2512 const char *base, const char *path)
2513{
2514 char concatpath[PATH_MAX];
2515 struct diff_filespec *one, *two;
2516
2517 /* This may look odd, but it is a preparation for
2518 * feeding "there are unchanged files which should
2519 * not produce diffs, but when you are doing copy
2520 * detection you would need them, so here they are"
2521 * entries to the diff-core. They will be prefixed
2522 * with something like '=' or '*' (I haven't decided
2523 * which but should not make any difference).
2524 * Feeding the same new and old to diff_change()
2525 * also has the same effect.
2526 * Before the final output happens, they are pruned after
2527 * merged into rename/copy pairs as appropriate.
2528 */
2529 if (options->reverse_diff)
2530 addremove = (addremove == '+' ? '-' :
2531 addremove == '-' ? '+' : addremove);
2532
2533 if (!path) path = "";
2534 sprintf(concatpath, "%s%s", base, path);
2535 one = alloc_filespec(concatpath);
2536 two = alloc_filespec(concatpath);
2537
2538 if (addremove != '+')
2539 fill_filespec(one, sha1, mode);
2540 if (addremove != '-')
2541 fill_filespec(two, sha1, mode);
2542
2543 diff_queue(&diff_queued_diff, one, two);
2544}
2545
2546void diff_change(struct diff_options *options,
2547 unsigned old_mode, unsigned new_mode,
2548 const unsigned char *old_sha1,
2549 const unsigned char *new_sha1,
2550 const char *base, const char *path)
2551{
2552 char concatpath[PATH_MAX];
2553 struct diff_filespec *one, *two;
2554
2555 if (options->reverse_diff) {
2556 unsigned tmp;
2557 const unsigned char *tmp_c;
2558 tmp = old_mode; old_mode = new_mode; new_mode = tmp;
2559 tmp_c = old_sha1; old_sha1 = new_sha1; new_sha1 = tmp_c;
2560 }
2561 if (!path) path = "";
2562 sprintf(concatpath, "%s%s", base, path);
2563 one = alloc_filespec(concatpath);
2564 two = alloc_filespec(concatpath);
2565 fill_filespec(one, old_sha1, old_mode);
2566 fill_filespec(two, new_sha1, new_mode);
2567
2568 diff_queue(&diff_queued_diff, one, two);
2569}
2570
2571void diff_unmerge(struct diff_options *options,
2572 const char *path)
2573{
2574 struct diff_filespec *one, *two;
2575 one = alloc_filespec(path);
2576 two = alloc_filespec(path);
2577 diff_queue(&diff_queued_diff, one, two);
2578}