Merge branch 'rj/submodule-fsck-skip'
authorJunio C Hamano <gitster@pobox.com>
Tue, 24 Jul 2018 21:50:42 +0000 (14:50 -0700)
committerJunio C Hamano <gitster@pobox.com>
Tue, 24 Jul 2018 21:50:42 +0000 (14:50 -0700)
"fsck.skipList" did not prevent a blob object listed there from
being inspected for is contents (e.g. we recently started to
inspect the contents of ".gitmodules" for certain malicious
patterns), which has been corrected.

* rj/submodule-fsck-skip:
fsck: check skiplist for object in fsck_blob()

1  2 
fsck.c
diff --combined fsck.c
index 4dfe65f715467cb31dab418af658968e491a9645,e91cbf6d44d46d7c6c3e98514d3d1e52bf361df6..ae4b1f3c09710eff4cfeb4be6e9b9d0488a2d249
--- 1/fsck.c
--- 2/fsck.c
+++ b/fsck.c
@@@ -1,5 -1,4 +1,5 @@@
  #include "cache.h"
 +#include "object-store.h"
  #include "object.h"
  #include "blob.h"
  #include "tree.h"
@@@ -15,7 -14,6 +15,7 @@@
  #include "packfile.h"
  #include "submodule-config.h"
  #include "config.h"
 +#include "help.h"
  
  static struct oidset gitmodules_found = OIDSET_INIT;
  static struct oidset gitmodules_done = OIDSET_INIT;
@@@ -88,60 -86,37 +88,60 @@@ enum fsck_msg_id 
  #undef MSG_ID
  
  #define STR(x) #x
 -#define MSG_ID(id, msg_type) { STR(id), NULL, FSCK_##msg_type },
 +#define MSG_ID(id, msg_type) { STR(id), NULL, NULL, FSCK_##msg_type },
  static struct {
        const char *id_string;
        const char *downcased;
 +      const char *camelcased;
        int msg_type;
  } msg_id_info[FSCK_MSG_MAX + 1] = {
        FOREACH_MSG_ID(MSG_ID)
 -      { NULL, NULL, -1 }
 +      { NULL, NULL, NULL, -1 }
  };
  #undef MSG_ID
  
 -static int parse_msg_id(const char *text)
 +static void prepare_msg_ids(void)
  {
        int i;
  
 -      if (!msg_id_info[0].downcased) {
 -              /* convert id_string to lower case, without underscores. */
 -              for (i = 0; i < FSCK_MSG_MAX; i++) {
 -                      const char *p = msg_id_info[i].id_string;
 -                      int len = strlen(p);
 -                      char *q = xmalloc(len);
 -
 -                      msg_id_info[i].downcased = q;
 -                      while (*p)
 -                              if (*p == '_')
 -                                      p++;
 -                              else
 -                                      *(q)++ = tolower(*(p)++);
 -                      *q = '\0';
 +      if (msg_id_info[0].downcased)
 +              return;
 +
 +      /* convert id_string to lower case, without underscores. */
 +      for (i = 0; i < FSCK_MSG_MAX; i++) {
 +              const char *p = msg_id_info[i].id_string;
 +              int len = strlen(p);
 +              char *q = xmalloc(len);
 +
 +              msg_id_info[i].downcased = q;
 +              while (*p)
 +                      if (*p == '_')
 +                              p++;
 +                      else
 +                              *(q)++ = tolower(*(p)++);
 +              *q = '\0';
 +
 +              p = msg_id_info[i].id_string;
 +              q = xmalloc(len);
 +              msg_id_info[i].camelcased = q;
 +              while (*p) {
 +                      if (*p == '_') {
 +                              p++;
 +                              if (*p)
 +                                      *q++ = *p++;
 +                      } else {
 +                              *q++ = tolower(*p++);
 +                      }
                }
 +              *q = '\0';
        }
 +}
 +
 +static int parse_msg_id(const char *text)
 +{
 +      int i;
 +
 +      prepare_msg_ids();
  
        for (i = 0; i < FSCK_MSG_MAX; i++)
                if (!strcmp(text, msg_id_info[i].downcased))
        return -1;
  }
  
 +void list_config_fsck_msg_ids(struct string_list *list, const char *prefix)
 +{
 +      int i;
 +
 +      prepare_msg_ids();
 +
 +      for (i = 0; i < FSCK_MSG_MAX; i++)
 +              list_config_item(list, prefix, msg_id_info[i].camelcased);
 +}
 +
  static int fsck_msg_type(enum fsck_msg_id msg_id,
        struct fsck_options *options)
  {
@@@ -316,6 -281,13 +316,13 @@@ static void append_msg_id(struct strbu
        strbuf_addstr(sb, ": ");
  }
  
+ static int object_on_skiplist(struct fsck_options *opts, struct object *obj)
+ {
+       if (opts && opts->skiplist && obj)
+               return oid_array_lookup(opts->skiplist, &obj->oid) >= 0;
+       return 0;
+ }
  __attribute__((format (printf, 4, 5)))
  static int report(struct fsck_options *options, struct object *object,
        enum fsck_msg_id id, const char *fmt, ...)
        if (msg_type == FSCK_IGNORE)
                return 0;
  
-       if (options->skiplist && object &&
-                       oid_array_lookup(options->skiplist, &object->oid) >= 0)
+       if (object_on_skiplist(options, object))
                return 0;
  
        if (msg_type == FSCK_FATAL)
@@@ -444,11 -415,9 +450,11 @@@ static int fsck_walk_commit(struct comm
  
        name = get_object_name(options, &commit->object);
        if (name)
 -              put_object_name(options, &commit->tree->object, "%s:", name);
 +              put_object_name(options, &get_commit_tree(commit)->object,
 +                              "%s:", name);
  
 -      result = options->walk((struct object *)commit->tree, OBJ_TREE, data, options);
 +      result = options->walk((struct object *)get_commit_tree(commit),
 +                             OBJ_TREE, data, options);
        if (result < 0)
                return result;
        res = result;
@@@ -769,34 -738,33 +775,34 @@@ static int fsck_ident(const char **iden
  static int fsck_commit_buffer(struct commit *commit, const char *buffer,
        unsigned long size, struct fsck_options *options)
  {
 -      unsigned char tree_sha1[20], sha1[20];
 +      struct object_id tree_oid, oid;
        struct commit_graft *graft;
        unsigned parent_count, parent_line_count = 0, author_count;
        int err;
        const char *buffer_begin = buffer;
 +      const char *p;
  
        if (verify_headers(buffer, size, &commit->object, options))
                return -1;
  
        if (!skip_prefix(buffer, "tree ", &buffer))
                return report(options, &commit->object, FSCK_MSG_MISSING_TREE, "invalid format - expected 'tree' line");
 -      if (get_sha1_hex(buffer, tree_sha1) || buffer[40] != '\n') {
 +      if (parse_oid_hex(buffer, &tree_oid, &p) || *p != '\n') {
                err = report(options, &commit->object, FSCK_MSG_BAD_TREE_SHA1, "invalid 'tree' line format - bad sha1");
                if (err)
                        return err;
        }
 -      buffer += 41;
 +      buffer = p + 1;
        while (skip_prefix(buffer, "parent ", &buffer)) {
 -              if (get_sha1_hex(buffer, sha1) || buffer[40] != '\n') {
 +              if (parse_oid_hex(buffer, &oid, &p) || *p != '\n') {
                        err = report(options, &commit->object, FSCK_MSG_BAD_PARENT_SHA1, "invalid 'parent' line format - bad sha1");
                        if (err)
                                return err;
                }
 -              buffer += 41;
 +              buffer = p + 1;
                parent_line_count++;
        }
 -      graft = lookup_commit_graft(&commit->object.oid);
 +      graft = lookup_commit_graft(the_repository, &commit->object.oid);
        parent_count = commit_list_count(commit->parents);
        if (graft) {
                if (graft->nr_parent == -1 && !parent_count)
        err = fsck_ident(&buffer, &commit->object, options);
        if (err)
                return err;
 -      if (!commit->tree) {
 -              err = report(options, &commit->object, FSCK_MSG_BAD_TREE, "could not load commit's tree %s", sha1_to_hex(tree_sha1));
 +      if (!get_commit_tree(commit)) {
 +              err = report(options, &commit->object, FSCK_MSG_BAD_TREE, "could not load commit's tree %s", oid_to_hex(&tree_oid));
                if (err)
                        return err;
        }
@@@ -858,12 -826,11 +864,12 @@@ static int fsck_commit(struct commit *c
  static int fsck_tag_buffer(struct tag *tag, const char *data,
        unsigned long size, struct fsck_options *options)
  {
 -      unsigned char sha1[20];
 +      struct object_id oid;
        int ret = 0;
        const char *buffer;
        char *to_free = NULL, *eol;
        struct strbuf sb = STRBUF_INIT;
 +      const char *p;
  
        if (data)
                buffer = data;
                enum object_type type;
  
                buffer = to_free =
 -                      read_sha1_file(tag->object.oid.hash, &type, &size);
 +                      read_object_file(&tag->object.oid, &type, &size);
                if (!buffer)
                        return report(options, &tag->object,
                                FSCK_MSG_MISSING_TAG_OBJECT,
                ret = report(options, &tag->object, FSCK_MSG_MISSING_OBJECT, "invalid format - expected 'object' line");
                goto done;
        }
 -      if (get_sha1_hex(buffer, sha1) || buffer[40] != '\n') {
 +      if (parse_oid_hex(buffer, &oid, &p) || *p != '\n') {
                ret = report(options, &tag->object, FSCK_MSG_BAD_OBJECT_SHA1, "invalid 'object' line format - bad sha1");
                if (ret)
                        goto done;
        }
 -      buffer += 41;
 +      buffer = p + 1;
  
        if (!skip_prefix(buffer, "type ", &buffer)) {
                ret = report(options, &tag->object, FSCK_MSG_MISSING_TYPE_ENTRY, "invalid format - expected 'type' line");
@@@ -998,6 -965,9 +1004,9 @@@ static int fsck_blob(struct blob *blob
                return 0;
        oidset_insert(&gitmodules_done, &blob->object.oid);
  
+       if (object_on_skiplist(options, &blob->object))
+               return 0;
        if (!buf) {
                /*
                 * A missing buffer here is a sign that the caller found the
@@@ -1078,7 -1048,7 +1087,7 @@@ int fsck_finish(struct fsck_options *op
                        continue;
                }
  
 -              buf = read_sha1_file(oid->hash, &type, &size);
 +              buf = read_object_file(oid, &type, &size);
                if (!buf) {
                        if (is_promisor_object(&blob->object.oid))
                                continue;