/* reachable.c, as of commit "fsck: introduce `git fsck --connectivity-only`" (02976bf) */
   1#include "cache.h"
   2#include "refs.h"
   3#include "tag.h"
   4#include "commit.h"
   5#include "blob.h"
   6#include "diff.h"
   7#include "revision.h"
   8#include "reachable.h"
   9#include "cache-tree.h"
  10#include "progress.h"
  11#include "list-objects.h"
  12
  13struct connectivity_progress {
  14        struct progress *progress;
  15        unsigned long count;
  16};
  17
  18static void update_progress(struct connectivity_progress *cp)
  19{
  20        cp->count++;
  21        if ((cp->count & 1023) == 0)
  22                display_progress(cp->progress, cp->count);
  23}
  24
  25static int add_one_ref(const char *path, const struct object_id *oid,
  26                       int flag, void *cb_data)
  27{
  28        struct object *object = parse_object_or_die(oid->hash, path);
  29        struct rev_info *revs = (struct rev_info *)cb_data;
  30
  31        add_pending_object(revs, object, "");
  32
  33        return 0;
  34}
  35
  36/*
  37 * The traversal will have already marked us as SEEN, so we
  38 * only need to handle any progress reporting here.
  39 */
  40static void mark_object(struct object *obj, const struct name_path *path,
  41                        const char *name, void *data)
  42{
  43        update_progress(data);
  44}
  45
  46static void mark_commit(struct commit *c, void *data)
  47{
  48        mark_object(&c->object, NULL, NULL, data);
  49}
  50
  51struct recent_data {
  52        struct rev_info *revs;
  53        unsigned long timestamp;
  54};
  55
  56static void add_recent_object(const unsigned char *sha1,
  57                              unsigned long mtime,
  58                              struct recent_data *data)
  59{
  60        struct object *obj;
  61        enum object_type type;
  62
  63        if (mtime <= data->timestamp)
  64                return;
  65
  66        /*
  67         * We do not want to call parse_object here, because
  68         * inflating blobs and trees could be very expensive.
  69         * However, we do need to know the correct type for
  70         * later processing, and the revision machinery expects
  71         * commits and tags to have been parsed.
  72         */
  73        type = sha1_object_info(sha1, NULL);
  74        if (type < 0)
  75                die("unable to get object info for %s", sha1_to_hex(sha1));
  76
  77        switch (type) {
  78        case OBJ_TAG:
  79        case OBJ_COMMIT:
  80                obj = parse_object_or_die(sha1, NULL);
  81                break;
  82        case OBJ_TREE:
  83                obj = (struct object *)lookup_tree(sha1);
  84                break;
  85        case OBJ_BLOB:
  86                obj = (struct object *)lookup_blob(sha1);
  87                break;
  88        default:
  89                die("unknown object type for %s: %s",
  90                    sha1_to_hex(sha1), typename(type));
  91        }
  92
  93        if (!obj)
  94                die("unable to lookup %s", sha1_to_hex(sha1));
  95
  96        add_pending_object(data->revs, obj, "");
  97}
  98
  99static int add_recent_loose(const unsigned char *sha1,
 100                            const char *path, void *data)
 101{
 102        struct stat st;
 103        struct object *obj = lookup_object(sha1);
 104
 105        if (obj && obj->flags & SEEN)
 106                return 0;
 107
 108        if (stat(path, &st) < 0) {
 109                /*
 110                 * It's OK if an object went away during our iteration; this
 111                 * could be due to a simultaneous repack. But anything else
 112                 * we should abort, since we might then fail to mark objects
 113                 * which should not be pruned.
 114                 */
 115                if (errno == ENOENT)
 116                        return 0;
 117                return error("unable to stat %s: %s",
 118                             sha1_to_hex(sha1), strerror(errno));
 119        }
 120
 121        add_recent_object(sha1, st.st_mtime, data);
 122        return 0;
 123}
 124
 125static int add_recent_packed(const unsigned char *sha1,
 126                             struct packed_git *p, uint32_t pos,
 127                             void *data)
 128{
 129        struct object *obj = lookup_object(sha1);
 130
 131        if (obj && obj->flags & SEEN)
 132                return 0;
 133        add_recent_object(sha1, p->mtime, data);
 134        return 0;
 135}
 136
 137int add_unseen_recent_objects_to_traversal(struct rev_info *revs,
 138                                           unsigned long timestamp)
 139{
 140        struct recent_data data;
 141        int r;
 142
 143        data.revs = revs;
 144        data.timestamp = timestamp;
 145
 146        r = for_each_loose_object(add_recent_loose, &data,
 147                                  FOR_EACH_OBJECT_LOCAL_ONLY);
 148        if (r)
 149                return r;
 150        return for_each_packed_object(add_recent_packed, &data,
 151                                      FOR_EACH_OBJECT_LOCAL_ONLY);
 152}
 153
 154void mark_reachable_objects(struct rev_info *revs, int mark_reflog,
 155                            unsigned long mark_recent,
 156                            struct progress *progress)
 157{
 158        struct connectivity_progress cp;
 159
 160        /*
 161         * Set up revision parsing, and mark us as being interested
 162         * in all object types, not just commits.
 163         */
 164        revs->tag_objects = 1;
 165        revs->blob_objects = 1;
 166        revs->tree_objects = 1;
 167
 168        /* Add all refs from the index file */
 169        add_index_objects_to_pending(revs, 0);
 170
 171        /* Add all external refs */
 172        for_each_ref(add_one_ref, revs);
 173
 174        /* detached HEAD is not included in the list above */
 175        head_ref(add_one_ref, revs);
 176
 177        /* Add all reflog info */
 178        if (mark_reflog)
 179                add_reflogs_to_pending(revs, 0);
 180
 181        cp.progress = progress;
 182        cp.count = 0;
 183
 184        /*
 185         * Set up the revision walk - this will move all commits
 186         * from the pending list to the commit walking list.
 187         */
 188        if (prepare_revision_walk(revs))
 189                die("revision walk setup failed");
 190        traverse_commit_list(revs, mark_commit, mark_object, &cp);
 191
 192        if (mark_recent) {
 193                revs->ignore_missing_links = 1;
 194                if (add_unseen_recent_objects_to_traversal(revs, mark_recent))
 195                        die("unable to mark recent objects");
 196                if (prepare_revision_walk(revs))
 197                        die("revision walk setup failed");
 198                traverse_commit_list(revs, mark_commit, mark_object, &cp);
 199        }
 200
 201        display_progress(cp.progress, cp.count);
 202}