tag.c: use 'ref-filter' APIs
[gitweb.git] / fsck.c
diff --git a/fsck.c b/fsck.c
index ab246185e8f0d80e218b61fd88b74469cbb3f9ea..e41e753d6dcbb577148260a1392210d50fb0b325 100644 (file)
--- a/fsck.c
+++ b/fsck.c
@@ -8,8 +8,15 @@
 #include "fsck.h"
 #include "refs.h"
 #include "utf8.h"
+#include "sha1-array.h"
+
+#define FSCK_FATAL -1
+#define FSCK_INFO -2
 
 #define FOREACH_MSG_ID(FUNC) \
+       /* fatal errors */ \
+       FUNC(NUL_IN_HEADER, FATAL) \
+       FUNC(UNTERMINATED_HEADER, FATAL) \
        /* errors */ \
        FUNC(BAD_DATE, ERROR) \
        FUNC(BAD_DATE_OVERFLOW, ERROR) \
        FUNC(MISSING_TREE, ERROR) \
        FUNC(MISSING_TYPE, ERROR) \
        FUNC(MISSING_TYPE_ENTRY, ERROR) \
-       FUNC(NUL_IN_HEADER, ERROR) \
+       FUNC(MULTIPLE_AUTHORS, ERROR) \
        FUNC(TAG_OBJECT_NOT_TAG, ERROR) \
        FUNC(TREE_NOT_SORTED, ERROR) \
        FUNC(UNKNOWN_TYPE, ERROR) \
-       FUNC(UNTERMINATED_HEADER, ERROR) \
        FUNC(ZERO_PADDED_DATE, ERROR) \
        /* warnings */ \
        FUNC(BAD_FILEMODE, WARN) \
-       FUNC(BAD_TAG_NAME, WARN) \
        FUNC(EMPTY_NAME, WARN) \
        FUNC(FULL_PATHNAME, WARN) \
        FUNC(HAS_DOT, WARN) \
        FUNC(HAS_DOTDOT, WARN) \
        FUNC(HAS_DOTGIT, WARN) \
-       FUNC(MISSING_TAGGER_ENTRY, WARN) \
        FUNC(NULL_SHA1, WARN) \
-       FUNC(ZERO_PADDED_FILEMODE, WARN)
+       FUNC(ZERO_PADDED_FILEMODE, WARN) \
+       /* infos (reported as warnings, but ignored by default) */ \
+       FUNC(BAD_TAG_NAME, INFO) \
+       FUNC(MISSING_TAGGER_ENTRY, INFO)
 
 #define MSG_ID(id, msg_type) FSCK_MSG_##id,
 enum fsck_msg_id {
@@ -63,27 +70,200 @@ enum fsck_msg_id {
 };
 #undef MSG_ID
 
-#define MSG_ID(id, msg_type) { FSCK_##msg_type },
+#define STR(x) #x
+#define MSG_ID(id, msg_type) { STR(id), NULL, FSCK_##msg_type },
 static struct {
+       const char *id_string;
+       const char *downcased;
        int msg_type;
 } msg_id_info[FSCK_MSG_MAX + 1] = {
        FOREACH_MSG_ID(MSG_ID)
-       { -1 }
+       { NULL, NULL, -1 }
 };
 #undef MSG_ID
 
+static int parse_msg_id(const char *text)
+{
+       int i;
+
+       if (!msg_id_info[0].downcased) {
+               /* convert id_string to lower case, without underscores. */
+               for (i = 0; i < FSCK_MSG_MAX; i++) {
+                       const char *p = msg_id_info[i].id_string;
+                       int len = strlen(p);
+                       char *q = xmalloc(len);
+
+                       msg_id_info[i].downcased = q;
+                       while (*p)
+                               if (*p == '_')
+                                       p++;
+                               else
+                                       *(q)++ = tolower(*(p)++);
+                       *q = '\0';
+               }
+       }
+
+       for (i = 0; i < FSCK_MSG_MAX; i++)
+               if (!strcmp(text, msg_id_info[i].downcased))
+                       return i;
+
+       return -1;
+}
+
 static int fsck_msg_type(enum fsck_msg_id msg_id,
        struct fsck_options *options)
 {
        int msg_type;
 
-       msg_type = msg_id_info[msg_id].msg_type;
-       if (options->strict && msg_type == FSCK_WARN)
-               msg_type = FSCK_ERROR;
+       assert(msg_id >= 0 && msg_id < FSCK_MSG_MAX);
+
+       if (options->msg_type)
+               msg_type = options->msg_type[msg_id];
+       else {
+               msg_type = msg_id_info[msg_id].msg_type;
+               if (options->strict && msg_type == FSCK_WARN)
+                       msg_type = FSCK_ERROR;
+       }
 
        return msg_type;
 }
 
+static void init_skiplist(struct fsck_options *options, const char *path)
+{
+       static struct sha1_array skiplist = SHA1_ARRAY_INIT;
+       int sorted, fd;
+       char buffer[41];
+       unsigned char sha1[20];
+
+       if (options->skiplist)
+               sorted = options->skiplist->sorted;
+       else {
+               sorted = 1;
+               options->skiplist = &skiplist;
+       }
+
+       fd = open(path, O_RDONLY);
+       if (fd < 0)
+               die("Could not open skip list: %s", path);
+       for (;;) {
+               int result = read_in_full(fd, buffer, sizeof(buffer));
+               if (result < 0)
+                       die_errno("Could not read '%s'", path);
+               if (!result)
+                       break;
+               if (get_sha1_hex(buffer, sha1) || buffer[40] != '\n')
+                       die("Invalid SHA-1: %s", buffer);
+               sha1_array_append(&skiplist, sha1);
+               if (sorted && skiplist.nr > 1 &&
+                               hashcmp(skiplist.sha1[skiplist.nr - 2],
+                                       sha1) > 0)
+                       sorted = 0;
+       }
+       close(fd);
+
+       if (sorted)
+               skiplist.sorted = 1;
+}
+
+static int parse_msg_type(const char *str)
+{
+       if (!strcmp(str, "error"))
+               return FSCK_ERROR;
+       else if (!strcmp(str, "warn"))
+               return FSCK_WARN;
+       else if (!strcmp(str, "ignore"))
+               return FSCK_IGNORE;
+       else
+               die("Unknown fsck message type: '%s'", str);
+}
+
+int is_valid_msg_type(const char *msg_id, const char *msg_type)
+{
+       if (parse_msg_id(msg_id) < 0)
+               return 0;
+       parse_msg_type(msg_type);
+       return 1;
+}
+
+void fsck_set_msg_type(struct fsck_options *options,
+               const char *msg_id, const char *msg_type)
+{
+       int id = parse_msg_id(msg_id), type;
+
+       if (id < 0)
+               die("Unhandled message id: %s", msg_id);
+       type = parse_msg_type(msg_type);
+
+       if (type != FSCK_ERROR && msg_id_info[id].msg_type == FSCK_FATAL)
+               die("Cannot demote %s to %s", msg_id, msg_type);
+
+       if (!options->msg_type) {
+               int i;
+               int *msg_type = xmalloc(sizeof(int) * FSCK_MSG_MAX);
+               for (i = 0; i < FSCK_MSG_MAX; i++)
+                       msg_type[i] = fsck_msg_type(i, options);
+               options->msg_type = msg_type;
+       }
+
+       options->msg_type[id] = type;
+}
+
+void fsck_set_msg_types(struct fsck_options *options, const char *values)
+{
+       char *buf = xstrdup(values), *to_free = buf;
+       int done = 0;
+
+       while (!done) {
+               int len = strcspn(buf, " ,|"), equal;
+
+               done = !buf[len];
+               if (!len) {
+                       buf++;
+                       continue;
+               }
+               buf[len] = '\0';
+
+               for (equal = 0;
+                    equal < len && buf[equal] != '=' && buf[equal] != ':';
+                    equal++)
+                       buf[equal] = tolower(buf[equal]);
+               buf[equal] = '\0';
+
+               if (!strcmp(buf, "skiplist")) {
+                       if (equal == len)
+                               die("skiplist requires a path");
+                       init_skiplist(options, buf + equal + 1);
+                       buf += len + 1;
+                       continue;
+               }
+
+               if (equal == len)
+                       die("Missing '=': '%s'", buf);
+
+               fsck_set_msg_type(options, buf, buf + equal + 1);
+               buf += len + 1;
+       }
+       free(to_free);
+}
+
+static void append_msg_id(struct strbuf *sb, const char *msg_id)
+{
+       for (;;) {
+               char c = *(msg_id)++;
+
+               if (!c)
+                       break;
+               if (c != '_')
+                       strbuf_addch(sb, tolower(c));
+               else {
+                       assert(*msg_id);
+                       strbuf_addch(sb, *(msg_id)++);
+               }
+       }
+
+       strbuf_addstr(sb, ": ");
+}
+
 __attribute__((format (printf, 4, 5)))
 static int report(struct fsck_options *options, struct object *object,
        enum fsck_msg_id id, const char *fmt, ...)
@@ -92,6 +272,20 @@ static int report(struct fsck_options *options, struct object *object,
        struct strbuf sb = STRBUF_INIT;
        int msg_type = fsck_msg_type(id, options), result;
 
+       if (msg_type == FSCK_IGNORE)
+               return 0;
+
+       if (options->skiplist && object &&
+                       sha1_array_lookup(options->skiplist, object->sha1) >= 0)
+               return 0;
+
+       if (msg_type == FSCK_FATAL)
+               msg_type = FSCK_ERROR;
+       else if (msg_type == FSCK_INFO)
+               msg_type = FSCK_WARN;
+
+       append_msg_id(&sb, msg_id_info[id].id_string);
+
        va_start(ap, fmt);
        strbuf_vaddf(&sb, fmt, ap);
        result = options->error_func(object, msg_type, sb.buf);
@@ -333,8 +527,8 @@ static int fsck_tree(struct tree *item, struct fsck_options *options)
        return retval;
 }
 
-static int require_end_of_header(const void *data, unsigned long size,
-       struct object *obj, struct fsck_options *options)
+static int verify_headers(const void *data, unsigned long size,
+                         struct object *obj, struct fsck_options *options)
 {
        const char *buffer = (const char *)data;
        unsigned long i;
@@ -351,46 +545,60 @@ static int require_end_of_header(const void *data, unsigned long size,
                }
        }
 
+       /*
+        * We did not find double-LF that separates the header
+        * and the body.  Not having a body is not a crime but
+        * we do want to see the terminating LF for the last header
+        * line.
+        */
+       if (size && buffer[size - 1] == '\n')
+               return 0;
+
        return report(options, obj,
                FSCK_MSG_UNTERMINATED_HEADER, "unterminated header");
 }
 
 static int fsck_ident(const char **ident, struct object *obj, struct fsck_options *options)
 {
+       const char *p = *ident;
        char *end;
 
-       if (**ident == '<')
+       *ident = strchrnul(*ident, '\n');
+       if (**ident == '\n')
+               (*ident)++;
+
+       if (*p == '<')
                return report(options, obj, FSCK_MSG_MISSING_NAME_BEFORE_EMAIL, "invalid author/committer line - missing space before email");
-       *ident += strcspn(*ident, "<>\n");
-       if (**ident == '>')
+       p += strcspn(p, "<>\n");
+       if (*p == '>')
                return report(options, obj, FSCK_MSG_BAD_NAME, "invalid author/committer line - bad name");
-       if (**ident != '<')
+       if (*p != '<')
                return report(options, obj, FSCK_MSG_MISSING_EMAIL, "invalid author/committer line - missing email");
-       if ((*ident)[-1] != ' ')
+       if (p[-1] != ' ')
                return report(options, obj, FSCK_MSG_MISSING_SPACE_BEFORE_EMAIL, "invalid author/committer line - missing space before email");
-       (*ident)++;
-       *ident += strcspn(*ident, "<>\n");
-       if (**ident != '>')
+       p++;
+       p += strcspn(p, "<>\n");
+       if (*p != '>')
                return report(options, obj, FSCK_MSG_BAD_EMAIL, "invalid author/committer line - bad email");
-       (*ident)++;
-       if (**ident != ' ')
+       p++;
+       if (*p != ' ')
                return report(options, obj, FSCK_MSG_MISSING_SPACE_BEFORE_DATE, "invalid author/committer line - missing space before date");
-       (*ident)++;
-       if (**ident == '0' && (*ident)[1] != ' ')
+       p++;
+       if (*p == '0' && p[1] != ' ')
                return report(options, obj, FSCK_MSG_ZERO_PADDED_DATE, "invalid author/committer line - zero-padded date");
-       if (date_overflows(strtoul(*ident, &end, 10)))
+       if (date_overflows(strtoul(p, &end, 10)))
                return report(options, obj, FSCK_MSG_BAD_DATE_OVERFLOW, "invalid author/committer line - date causes integer overflow");
-       if (end == *ident || *end != ' ')
+       if ((end == p || *end != ' '))
                return report(options, obj, FSCK_MSG_BAD_DATE, "invalid author/committer line - bad date");
-       *ident = end + 1;
-       if ((**ident != '+' && **ident != '-') ||
-           !isdigit((*ident)[1]) ||
-           !isdigit((*ident)[2]) ||
-           !isdigit((*ident)[3]) ||
-           !isdigit((*ident)[4]) ||
-           ((*ident)[5] != '\n'))
+       p = end + 1;
+       if ((*p != '+' && *p != '-') ||
+           !isdigit(p[1]) ||
+           !isdigit(p[2]) ||
+           !isdigit(p[3]) ||
+           !isdigit(p[4]) ||
+           (p[5] != '\n'))
                return report(options, obj, FSCK_MSG_BAD_TIMEZONE, "invalid author/committer line - bad time zone");
-       (*ident) += 6;
+       p += 6;
        return 0;
 }
 
@@ -399,20 +607,26 @@ static int fsck_commit_buffer(struct commit *commit, const char *buffer,
 {
        unsigned char tree_sha1[20], sha1[20];
        struct commit_graft *graft;
-       unsigned parent_count, parent_line_count = 0;
+       unsigned parent_count, parent_line_count = 0, author_count;
        int err;
 
-       if (require_end_of_header(buffer, size, &commit->object, options))
+       if (verify_headers(buffer, size, &commit->object, options))
                return -1;
 
        if (!skip_prefix(buffer, "tree ", &buffer))
                return report(options, &commit->object, FSCK_MSG_MISSING_TREE, "invalid format - expected 'tree' line");
-       if (get_sha1_hex(buffer, tree_sha1) || buffer[40] != '\n')
-               return report(options, &commit->object, FSCK_MSG_BAD_TREE_SHA1, "invalid 'tree' line format - bad sha1");
+       if (get_sha1_hex(buffer, tree_sha1) || buffer[40] != '\n') {
+               err = report(options, &commit->object, FSCK_MSG_BAD_TREE_SHA1, "invalid 'tree' line format - bad sha1");
+               if (err)
+                       return err;
+       }
        buffer += 41;
        while (skip_prefix(buffer, "parent ", &buffer)) {
-               if (get_sha1_hex(buffer, sha1) || buffer[40] != '\n')
-                       return report(options, &commit->object, FSCK_MSG_BAD_PARENT_SHA1, "invalid 'parent' line format - bad sha1");
+               if (get_sha1_hex(buffer, sha1) || buffer[40] != '\n') {
+                       err = report(options, &commit->object, FSCK_MSG_BAD_PARENT_SHA1, "invalid 'parent' line format - bad sha1");
+                       if (err)
+                               return err;
+               }
                buffer += 41;
                parent_line_count++;
        }
@@ -421,15 +635,29 @@ static int fsck_commit_buffer(struct commit *commit, const char *buffer,
        if (graft) {
                if (graft->nr_parent == -1 && !parent_count)
                        ; /* shallow commit */
-               else if (graft->nr_parent != parent_count)
-                       return report(options, &commit->object, FSCK_MSG_MISSING_GRAFT, "graft objects missing");
+               else if (graft->nr_parent != parent_count) {
+                       err = report(options, &commit->object, FSCK_MSG_MISSING_GRAFT, "graft objects missing");
+                       if (err)
+                               return err;
+               }
        } else {
-               if (parent_count != parent_line_count)
-                       return report(options, &commit->object, FSCK_MSG_MISSING_PARENT, "parent objects missing");
+               if (parent_count != parent_line_count) {
+                       err = report(options, &commit->object, FSCK_MSG_MISSING_PARENT, "parent objects missing");
+                       if (err)
+                               return err;
+               }
        }
-       if (!skip_prefix(buffer, "author ", &buffer))
-               return report(options, &commit->object, FSCK_MSG_MISSING_AUTHOR, "invalid format - expected 'author' line");
-       err = fsck_ident(&buffer, &commit->object, options);
+       author_count = 0;
+       while (skip_prefix(buffer, "author ", &buffer)) {
+               author_count++;
+               err = fsck_ident(&buffer, &commit->object, options);
+               if (err)
+                       return err;
+       }
+       if (author_count < 1)
+               err = report(options, &commit->object, FSCK_MSG_MISSING_AUTHOR, "invalid format - expected 'author' line");
+       else if (author_count > 1)
+               err = report(options, &commit->object, FSCK_MSG_MULTIPLE_AUTHORS, "invalid format - multiple 'author' lines");
        if (err)
                return err;
        if (!skip_prefix(buffer, "committer ", &buffer))
@@ -483,7 +711,7 @@ static int fsck_tag_buffer(struct tag *tag, const char *data,
                }
        }
 
-       if (require_end_of_header(buffer, size, &tag->object, options))
+       if (verify_headers(buffer, size, &tag->object, options))
                goto done;
 
        if (!skip_prefix(buffer, "object ", &buffer)) {
@@ -492,7 +720,8 @@ static int fsck_tag_buffer(struct tag *tag, const char *data,
        }
        if (get_sha1_hex(buffer, sha1) || buffer[40] != '\n') {
                ret = report(options, &tag->object, FSCK_MSG_BAD_OBJECT_SHA1, "invalid 'object' line format - bad sha1");
-               goto done;
+               if (ret)
+                       goto done;
        }
        buffer += 41;
 
@@ -521,15 +750,21 @@ static int fsck_tag_buffer(struct tag *tag, const char *data,
                goto done;
        }
        strbuf_addf(&sb, "refs/tags/%.*s", (int)(eol - buffer), buffer);
-       if (check_refname_format(sb.buf, 0))
-               report(options, &tag->object, FSCK_MSG_BAD_TAG_NAME,
+       if (check_refname_format(sb.buf, 0)) {
+               ret = report(options, &tag->object, FSCK_MSG_BAD_TAG_NAME,
                           "invalid 'tag' name: %.*s",
                           (int)(eol - buffer), buffer);
+               if (ret)
+                       goto done;
+       }
        buffer = eol + 1;
 
-       if (!skip_prefix(buffer, "tagger ", &buffer))
+       if (!skip_prefix(buffer, "tagger ", &buffer)) {
                /* early tags do not contain 'tagger' lines; warn only */
-               report(options, &tag->object, FSCK_MSG_MISSING_TAGGER_ENTRY, "invalid format - expected 'tagger' line");
+               ret = report(options, &tag->object, FSCK_MSG_MISSING_TAGGER_ENTRY, "invalid format - expected 'tagger' line");
+               if (ret)
+                       goto done;
+       }
        else
                ret = fsck_ident(&buffer, &tag->object, options);
 
@@ -573,6 +808,10 @@ int fsck_object(struct object *obj, void *data, unsigned long size,
 
 int fsck_error_function(struct object *obj, int msg_type, const char *message)
 {
+       if (msg_type == FSCK_WARN) {
+               warning("object %s: %s", sha1_to_hex(obj->sha1), message);
+               return 0;
+       }
        error("object %s: %s", sha1_to_hex(obj->sha1), message);
        return 1;
 }