object.c on commit shallow: migrate shallow information into the object parser (eee4502)
   1#include "cache.h"
   2#include "object.h"
   3#include "replace-object.h"
   4#include "object-store.h"
   5#include "blob.h"
   6#include "tree.h"
   7#include "commit.h"
   8#include "tag.h"
   9#include "alloc.h"
  10#include "object-store.h"
  11#include "packfile.h"
  12
  13unsigned int get_max_object_index(void)
  14{
  15        return the_repository->parsed_objects->obj_hash_size;
  16}
  17
  18struct object *get_indexed_object(unsigned int idx)
  19{
  20        return the_repository->parsed_objects->obj_hash[idx];
  21}
  22
  23static const char *object_type_strings[] = {
  24        NULL,           /* OBJ_NONE = 0 */
  25        "commit",       /* OBJ_COMMIT = 1 */
  26        "tree",         /* OBJ_TREE = 2 */
  27        "blob",         /* OBJ_BLOB = 3 */
  28        "tag",          /* OBJ_TAG = 4 */
  29};
  30
  31const char *type_name(unsigned int type)
  32{
  33        if (type >= ARRAY_SIZE(object_type_strings))
  34                return NULL;
  35        return object_type_strings[type];
  36}
  37
  38int type_from_string_gently(const char *str, ssize_t len, int gentle)
  39{
  40        int i;
  41
  42        if (len < 0)
  43                len = strlen(str);
  44
  45        for (i = 1; i < ARRAY_SIZE(object_type_strings); i++)
  46                if (!strncmp(str, object_type_strings[i], len) &&
  47                    object_type_strings[i][len] == '\0')
  48                        return i;
  49
  50        if (gentle)
  51                return -1;
  52
  53        die("invalid object type \"%s\"", str);
  54}
  55
  56/*
  57 * Return a numerical hash value between 0 and n-1 for the object with
  58 * the specified sha1.  n must be a power of 2.  Please note that the
  59 * return value is *not* consistent across computer architectures.
  60 */
  61static unsigned int hash_obj(const unsigned char *sha1, unsigned int n)
  62{
  63        return sha1hash(sha1) & (n - 1);
  64}
  65
  66/*
  67 * Insert obj into the hash table hash, which has length size (which
  68 * must be a power of 2).  On collisions, simply overflow to the next
  69 * empty bucket.
  70 */
  71static void insert_obj_hash(struct object *obj, struct object **hash, unsigned int size)
  72{
  73        unsigned int j = hash_obj(obj->oid.hash, size);
  74
  75        while (hash[j]) {
  76                j++;
  77                if (j >= size)
  78                        j = 0;
  79        }
  80        hash[j] = obj;
  81}
  82
  83/*
  84 * Look up the record for the given sha1 in the hash map stored in
  85 * obj_hash.  Return NULL if it was not found.
  86 */
  87struct object *lookup_object(const unsigned char *sha1)
  88{
  89        unsigned int i, first;
  90        struct object *obj;
  91
  92        if (!the_repository->parsed_objects->obj_hash)
  93                return NULL;
  94
  95        first = i = hash_obj(sha1,
  96                             the_repository->parsed_objects->obj_hash_size);
  97        while ((obj = the_repository->parsed_objects->obj_hash[i]) != NULL) {
  98                if (!hashcmp(sha1, obj->oid.hash))
  99                        break;
 100                i++;
 101                if (i == the_repository->parsed_objects->obj_hash_size)
 102                        i = 0;
 103        }
 104        if (obj && i != first) {
 105                /*
 106                 * Move object to where we started to look for it so
 107                 * that we do not need to walk the hash table the next
 108                 * time we look for it.
 109                 */
 110                SWAP(the_repository->parsed_objects->obj_hash[i],
 111                     the_repository->parsed_objects->obj_hash[first]);
 112        }
 113        return obj;
 114}
 115
 116/*
 117 * Increase the size of the hash map stored in obj_hash to the next
 118 * power of 2 (but at least 32).  Copy the existing values to the new
 119 * hash map.
 120 */
 121static void grow_object_hash(struct repository *r)
 122{
 123        int i;
 124        /*
 125         * Note that this size must always be power-of-2 to match hash_obj
 126         * above.
 127         */
 128        int new_hash_size = r->parsed_objects->obj_hash_size < 32 ? 32 : 2 * r->parsed_objects->obj_hash_size;
 129        struct object **new_hash;
 130
 131        new_hash = xcalloc(new_hash_size, sizeof(struct object *));
 132        for (i = 0; i < r->parsed_objects->obj_hash_size; i++) {
 133                struct object *obj = r->parsed_objects->obj_hash[i];
 134
 135                if (!obj)
 136                        continue;
 137                insert_obj_hash(obj, new_hash, new_hash_size);
 138        }
 139        free(r->parsed_objects->obj_hash);
 140        r->parsed_objects->obj_hash = new_hash;
 141        r->parsed_objects->obj_hash_size = new_hash_size;
 142}
 143
 144void *create_object(struct repository *r, const unsigned char *sha1, void *o)
 145{
 146        struct object *obj = o;
 147
 148        obj->parsed = 0;
 149        obj->flags = 0;
 150        hashcpy(obj->oid.hash, sha1);
 151
 152        if (r->parsed_objects->obj_hash_size - 1 <= r->parsed_objects->nr_objs * 2)
 153                grow_object_hash(r);
 154
 155        insert_obj_hash(obj, r->parsed_objects->obj_hash,
 156                        r->parsed_objects->obj_hash_size);
 157        r->parsed_objects->nr_objs++;
 158        return obj;
 159}
 160
 161void *object_as_type(struct object *obj, enum object_type type, int quiet)
 162{
 163        if (obj->type == type)
 164                return obj;
 165        else if (obj->type == OBJ_NONE) {
 166                if (type == OBJ_COMMIT)
 167                        ((struct commit *)obj)->index = alloc_commit_index(the_repository);
 168                obj->type = type;
 169                return obj;
 170        }
 171        else {
 172                if (!quiet)
 173                        error("object %s is a %s, not a %s",
 174                              oid_to_hex(&obj->oid),
 175                              type_name(obj->type), type_name(type));
 176                return NULL;
 177        }
 178}
 179
 180struct object *lookup_unknown_object(const unsigned char *sha1)
 181{
 182        struct object *obj = lookup_object(sha1);
 183        if (!obj)
 184                obj = create_object(the_repository, sha1,
 185                                    alloc_object_node(the_repository));
 186        return obj;
 187}
 188
 189struct object *parse_object_buffer(const struct object_id *oid, enum object_type type, unsigned long size, void *buffer, int *eaten_p)
 190{
 191        struct object *obj;
 192        *eaten_p = 0;
 193
 194        obj = NULL;
 195        if (type == OBJ_BLOB) {
 196                struct blob *blob = lookup_blob(oid);
 197                if (blob) {
 198                        if (parse_blob_buffer(blob, buffer, size))
 199                                return NULL;
 200                        obj = &blob->object;
 201                }
 202        } else if (type == OBJ_TREE) {
 203                struct tree *tree = lookup_tree(oid);
 204                if (tree) {
 205                        obj = &tree->object;
 206                        if (!tree->buffer)
 207                                tree->object.parsed = 0;
 208                        if (!tree->object.parsed) {
 209                                if (parse_tree_buffer(tree, buffer, size))
 210                                        return NULL;
 211                                *eaten_p = 1;
 212                        }
 213                }
 214        } else if (type == OBJ_COMMIT) {
 215                struct commit *commit = lookup_commit(oid);
 216                if (commit) {
 217                        if (parse_commit_buffer(commit, buffer, size))
 218                                return NULL;
 219                        if (!get_cached_commit_buffer(commit, NULL)) {
 220                                set_commit_buffer(commit, buffer, size);
 221                                *eaten_p = 1;
 222                        }
 223                        obj = &commit->object;
 224                }
 225        } else if (type == OBJ_TAG) {
 226                struct tag *tag = lookup_tag(oid);
 227                if (tag) {
 228                        if (parse_tag_buffer(tag, buffer, size))
 229                               return NULL;
 230                        obj = &tag->object;
 231                }
 232        } else {
 233                warning("object %s has unknown type id %d", oid_to_hex(oid), type);
 234                obj = NULL;
 235        }
 236        return obj;
 237}
 238
 239struct object *parse_object_or_die(const struct object_id *oid,
 240                                   const char *name)
 241{
 242        struct object *o = parse_object(oid);
 243        if (o)
 244                return o;
 245
 246        die(_("unable to parse object: %s"), name ? name : oid_to_hex(oid));
 247}
 248
 249struct object *parse_object(const struct object_id *oid)
 250{
 251        unsigned long size;
 252        enum object_type type;
 253        int eaten;
 254        const struct object_id *repl = lookup_replace_object(the_repository, oid);
 255        void *buffer;
 256        struct object *obj;
 257
 258        obj = lookup_object(oid->hash);
 259        if (obj && obj->parsed)
 260                return obj;
 261
 262        if ((obj && obj->type == OBJ_BLOB && has_object_file(oid)) ||
 263            (!obj && has_object_file(oid) &&
 264             oid_object_info(the_repository, oid, NULL) == OBJ_BLOB)) {
 265                if (check_object_signature(repl, NULL, 0, NULL) < 0) {
 266                        error("sha1 mismatch %s", oid_to_hex(oid));
 267                        return NULL;
 268                }
 269                parse_blob_buffer(lookup_blob(oid), NULL, 0);
 270                return lookup_object(oid->hash);
 271        }
 272
 273        buffer = read_object_file(oid, &type, &size);
 274        if (buffer) {
 275                if (check_object_signature(repl, buffer, size, type_name(type)) < 0) {
 276                        free(buffer);
 277                        error("sha1 mismatch %s", oid_to_hex(repl));
 278                        return NULL;
 279                }
 280
 281                obj = parse_object_buffer(oid, type, size, buffer, &eaten);
 282                if (!eaten)
 283                        free(buffer);
 284                return obj;
 285        }
 286        return NULL;
 287}
 288
 289struct object_list *object_list_insert(struct object *item,
 290                                       struct object_list **list_p)
 291{
 292        struct object_list *new_list = xmalloc(sizeof(struct object_list));
 293        new_list->item = item;
 294        new_list->next = *list_p;
 295        *list_p = new_list;
 296        return new_list;
 297}
 298
 299int object_list_contains(struct object_list *list, struct object *obj)
 300{
 301        while (list) {
 302                if (list->item == obj)
 303                        return 1;
 304                list = list->next;
 305        }
 306        return 0;
 307}
 308
 309/*
 310 * A zero-length string to which object_array_entry::name can be
 311 * initialized without requiring a malloc/free.
 312 */
 313static char object_array_slopbuf[1];
 314
 315void add_object_array_with_path(struct object *obj, const char *name,
 316                                struct object_array *array,
 317                                unsigned mode, const char *path)
 318{
 319        unsigned nr = array->nr;
 320        unsigned alloc = array->alloc;
 321        struct object_array_entry *objects = array->objects;
 322        struct object_array_entry *entry;
 323
 324        if (nr >= alloc) {
 325                alloc = (alloc + 32) * 2;
 326                REALLOC_ARRAY(objects, alloc);
 327                array->alloc = alloc;
 328                array->objects = objects;
 329        }
 330        entry = &objects[nr];
 331        entry->item = obj;
 332        if (!name)
 333                entry->name = NULL;
 334        else if (!*name)
 335                /* Use our own empty string instead of allocating one: */
 336                entry->name = object_array_slopbuf;
 337        else
 338                entry->name = xstrdup(name);
 339        entry->mode = mode;
 340        if (path)
 341                entry->path = xstrdup(path);
 342        else
 343                entry->path = NULL;
 344        array->nr = ++nr;
 345}
 346
 347void add_object_array(struct object *obj, const char *name, struct object_array *array)
 348{
 349        add_object_array_with_path(obj, name, array, S_IFINVALID, NULL);
 350}
 351
 352/*
 353 * Free all memory associated with an entry; the result is
 354 * in an unspecified state and should not be examined.
 355 */
 356static void object_array_release_entry(struct object_array_entry *ent)
 357{
 358        if (ent->name != object_array_slopbuf)
 359                free(ent->name);
 360        free(ent->path);
 361}
 362
 363struct object *object_array_pop(struct object_array *array)
 364{
 365        struct object *ret;
 366
 367        if (!array->nr)
 368                return NULL;
 369
 370        ret = array->objects[array->nr - 1].item;
 371        object_array_release_entry(&array->objects[array->nr - 1]);
 372        array->nr--;
 373        return ret;
 374}
 375
 376void object_array_filter(struct object_array *array,
 377                         object_array_each_func_t want, void *cb_data)
 378{
 379        unsigned nr = array->nr, src, dst;
 380        struct object_array_entry *objects = array->objects;
 381
 382        for (src = dst = 0; src < nr; src++) {
 383                if (want(&objects[src], cb_data)) {
 384                        if (src != dst)
 385                                objects[dst] = objects[src];
 386                        dst++;
 387                } else {
 388                        object_array_release_entry(&objects[src]);
 389                }
 390        }
 391        array->nr = dst;
 392}
 393
 394void object_array_clear(struct object_array *array)
 395{
 396        int i;
 397        for (i = 0; i < array->nr; i++)
 398                object_array_release_entry(&array->objects[i]);
 399        FREE_AND_NULL(array->objects);
 400        array->nr = array->alloc = 0;
 401}
 402
 403/*
 404 * Return true iff array already contains an entry with name.
 405 */
 406static int contains_name(struct object_array *array, const char *name)
 407{
 408        unsigned nr = array->nr, i;
 409        struct object_array_entry *object = array->objects;
 410
 411        for (i = 0; i < nr; i++, object++)
 412                if (!strcmp(object->name, name))
 413                        return 1;
 414        return 0;
 415}
 416
 417void object_array_remove_duplicates(struct object_array *array)
 418{
 419        unsigned nr = array->nr, src;
 420        struct object_array_entry *objects = array->objects;
 421
 422        array->nr = 0;
 423        for (src = 0; src < nr; src++) {
 424                if (!contains_name(array, objects[src].name)) {
 425                        if (src != array->nr)
 426                                objects[array->nr] = objects[src];
 427                        array->nr++;
 428                } else {
 429                        object_array_release_entry(&objects[src]);
 430                }
 431        }
 432}
 433
 434void clear_object_flags(unsigned flags)
 435{
 436        int i;
 437
 438        for (i=0; i < the_repository->parsed_objects->obj_hash_size; i++) {
 439                struct object *obj = the_repository->parsed_objects->obj_hash[i];
 440                if (obj)
 441                        obj->flags &= ~flags;
 442        }
 443}
 444
 445void clear_commit_marks_all(unsigned int flags)
 446{
 447        int i;
 448
 449        for (i = 0; i < the_repository->parsed_objects->obj_hash_size; i++) {
 450                struct object *obj = the_repository->parsed_objects->obj_hash[i];
 451                if (obj && obj->type == OBJ_COMMIT)
 452                        obj->flags &= ~flags;
 453        }
 454}
 455
 456struct parsed_object_pool *parsed_object_pool_new(void)
 457{
 458        struct parsed_object_pool *o = xmalloc(sizeof(*o));
 459        memset(o, 0, sizeof(*o));
 460
 461        o->blob_state = allocate_alloc_state();
 462        o->tree_state = allocate_alloc_state();
 463        o->commit_state = allocate_alloc_state();
 464        o->tag_state = allocate_alloc_state();
 465        o->object_state = allocate_alloc_state();
 466
 467        o->is_shallow = -1;
 468        o->shallow_stat = xcalloc(1, sizeof(*o->shallow_stat));
 469
 470        return o;
 471}
 472
 473struct raw_object_store *raw_object_store_new(void)
 474{
 475        struct raw_object_store *o = xmalloc(sizeof(*o));
 476
 477        memset(o, 0, sizeof(*o));
 478        INIT_LIST_HEAD(&o->packed_git_mru);
 479        return o;
 480}
 481
 482static void free_alt_odb(struct alternate_object_database *alt)
 483{
 484        strbuf_release(&alt->scratch);
 485        oid_array_clear(&alt->loose_objects_cache);
 486        free(alt);
 487}
 488
 489static void free_alt_odbs(struct raw_object_store *o)
 490{
 491        while (o->alt_odb_list) {
 492                struct alternate_object_database *next;
 493
 494                next = o->alt_odb_list->next;
 495                free_alt_odb(o->alt_odb_list);
 496                o->alt_odb_list = next;
 497        }
 498}
 499
 500void raw_object_store_clear(struct raw_object_store *o)
 501{
 502        FREE_AND_NULL(o->objectdir);
 503        FREE_AND_NULL(o->alternate_db);
 504
 505        free_alt_odbs(o);
 506        o->alt_odb_tail = NULL;
 507
 508        INIT_LIST_HEAD(&o->packed_git_mru);
 509        close_all_packs(o);
 510        o->packed_git = NULL;
 511}
 512
 513void parsed_object_pool_clear(struct parsed_object_pool *o)
 514{
 515        /*
 516         * As objects are allocated in slabs (see alloc.c), we do
 517         * not need to free each object, but each slab instead.
 518         *
 519         * Before doing so, we need to free any additional memory
 520         * the objects may hold.
 521         */
 522        unsigned i;
 523
 524        for (i = 0; i < o->obj_hash_size; i++) {
 525                struct object *obj = o->obj_hash[i];
 526
 527                if (!obj)
 528                        continue;
 529
 530                if (obj->type == OBJ_TREE)
 531                        free_tree_buffer((struct tree*)obj);
 532                else if (obj->type == OBJ_COMMIT)
 533                        release_commit_memory((struct commit*)obj);
 534                else if (obj->type == OBJ_TAG)
 535                        release_tag_memory((struct tag*)obj);
 536        }
 537
 538        FREE_AND_NULL(o->obj_hash);
 539        o->obj_hash_size = 0;
 540
 541        clear_alloc_state(o->blob_state);
 542        clear_alloc_state(o->tree_state);
 543        clear_alloc_state(o->commit_state);
 544        clear_alloc_state(o->tag_state);
 545        clear_alloc_state(o->object_state);
 546        FREE_AND_NULL(o->blob_state);
 547        FREE_AND_NULL(o->tree_state);
 548        FREE_AND_NULL(o->commit_state);
 549        FREE_AND_NULL(o->tag_state);
 550        FREE_AND_NULL(o->object_state);
 551}