/* builtin/repack.c on commit "general improvements" (43abf13) */
   1#include "builtin.h"
   2#include "cache.h"
   3#include "config.h"
   4#include "dir.h"
   5#include "parse-options.h"
   6#include "run-command.h"
   7#include "sigchain.h"
   8#include "strbuf.h"
   9#include "string-list.h"
  10#include "argv-array.h"
  11#include "midx.h"
  12#include "packfile.h"
  13#include "object-store.h"
  14#include "promisor-remote.h"
  15
  16static int delta_base_offset = 1;
  17static int pack_kept_objects = -1;
  18static int write_bitmaps = -1;
  19static int use_delta_islands;
  20static char *packdir, *packtmp;
  21
  22static const char *const git_repack_usage[] = {
  23        N_("git repack [<options>]"),
  24        NULL
  25};
  26
  27static const char incremental_bitmap_conflict_error[] = N_(
  28"Incremental repacks are incompatible with bitmap indexes.  Use\n"
  29"--no-write-bitmap-index or disable the pack.writebitmaps configuration."
  30);
  31
  32
  33static int repack_config(const char *var, const char *value, void *cb)
  34{
  35        if (!strcmp(var, "repack.usedeltabaseoffset")) {
  36                delta_base_offset = git_config_bool(var, value);
  37                return 0;
  38        }
  39        if (!strcmp(var, "repack.packkeptobjects")) {
  40                pack_kept_objects = git_config_bool(var, value);
  41                return 0;
  42        }
  43        if (!strcmp(var, "repack.writebitmaps") ||
  44            !strcmp(var, "pack.writebitmaps")) {
  45                write_bitmaps = git_config_bool(var, value);
  46                return 0;
  47        }
  48        if (!strcmp(var, "repack.usedeltaislands")) {
  49                use_delta_islands = git_config_bool(var, value);
  50                return 0;
  51        }
  52        return git_default_config(var, value, cb);
  53}
  54
  55/*
  56 * Remove temporary $GIT_OBJECT_DIRECTORY/pack/.tmp-$$-pack-* files.
  57 */
  58static void remove_temporary_files(void)
  59{
  60        struct strbuf buf = STRBUF_INIT;
  61        size_t dirlen, prefixlen;
  62        DIR *dir;
  63        struct dirent *e;
  64
  65        dir = opendir(packdir);
  66        if (!dir)
  67                return;
  68
  69        /* Point at the slash at the end of ".../objects/pack/" */
  70        dirlen = strlen(packdir) + 1;
  71        strbuf_addstr(&buf, packtmp);
  72        /* Hold the length of  ".tmp-%d-pack-" */
  73        prefixlen = buf.len - dirlen;
  74
  75        while ((e = readdir(dir))) {
  76                if (strncmp(e->d_name, buf.buf + dirlen, prefixlen))
  77                        continue;
  78                strbuf_setlen(&buf, dirlen);
  79                strbuf_addstr(&buf, e->d_name);
  80                unlink(buf.buf);
  81        }
  82        closedir(dir);
  83        strbuf_release(&buf);
  84}
  85
  86static void remove_pack_on_signal(int signo)
  87{
  88        remove_temporary_files();
  89        sigchain_pop(signo);
  90        raise(signo);
  91}
  92
  93/*
  94 * Adds all packs hex strings to the fname list, which do not
  95 * have a corresponding .keep file. These packs are not to
  96 * be kept if we are going to pack everything into one file.
  97 */
  98static void get_non_kept_pack_filenames(struct string_list *fname_list,
  99                                        const struct string_list *extra_keep)
 100{
 101        DIR *dir;
 102        struct dirent *e;
 103        char *fname;
 104
 105        if (!(dir = opendir(packdir)))
 106                return;
 107
 108        while ((e = readdir(dir)) != NULL) {
 109                size_t len;
 110                int i;
 111
 112                for (i = 0; i < extra_keep->nr; i++)
 113                        if (!fspathcmp(e->d_name, extra_keep->items[i].string))
 114                                break;
 115                if (extra_keep->nr > 0 && i < extra_keep->nr)
 116                        continue;
 117
 118                if (!strip_suffix(e->d_name, ".pack", &len))
 119                        continue;
 120
 121                fname = xmemdupz(e->d_name, len);
 122
 123                if (!file_exists(mkpath("%s/%s.keep", packdir, fname)))
 124                        string_list_append_nodup(fname_list, fname);
 125                else
 126                        free(fname);
 127        }
 128        closedir(dir);
 129}
 130
 131static void remove_redundant_pack(const char *dir_name, const char *base_name)
 132{
 133        struct strbuf buf = STRBUF_INIT;
 134        strbuf_addf(&buf, "%s/%s.pack", dir_name, base_name);
 135        unlink_pack_path(buf.buf, 1);
 136        strbuf_release(&buf);
 137}
 138
 139struct pack_objects_args {
 140        const char *window;
 141        const char *window_memory;
 142        const char *depth;
 143        const char *threads;
 144        const char *max_pack_size;
 145        int no_reuse_delta;
 146        int no_reuse_object;
 147        int quiet;
 148        int local;
 149};
 150
 151static void prepare_pack_objects(struct child_process *cmd,
 152                                 const struct pack_objects_args *args)
 153{
 154        argv_array_push(&cmd->args, "pack-objects");
 155        if (args->window)
 156                argv_array_pushf(&cmd->args, "--window=%s", args->window);
 157        if (args->window_memory)
 158                argv_array_pushf(&cmd->args, "--window-memory=%s", args->window_memory);
 159        if (args->depth)
 160                argv_array_pushf(&cmd->args, "--depth=%s", args->depth);
 161        if (args->threads)
 162                argv_array_pushf(&cmd->args, "--threads=%s", args->threads);
 163        if (args->max_pack_size)
 164                argv_array_pushf(&cmd->args, "--max-pack-size=%s", args->max_pack_size);
 165        if (args->no_reuse_delta)
 166                argv_array_pushf(&cmd->args, "--no-reuse-delta");
 167        if (args->no_reuse_object)
 168                argv_array_pushf(&cmd->args, "--no-reuse-object");
 169        if (args->local)
 170                argv_array_push(&cmd->args,  "--local");
 171        if (args->quiet)
 172                argv_array_push(&cmd->args,  "--quiet");
 173        if (delta_base_offset)
 174                argv_array_push(&cmd->args,  "--delta-base-offset");
 175        argv_array_push(&cmd->args, packtmp);
 176        cmd->git_cmd = 1;
 177        cmd->out = -1;
 178}
 179
 180/*
 181 * Write oid to the given struct child_process's stdin, starting it first if
 182 * necessary.
 183 */
 184static int write_oid(const struct object_id *oid, struct packed_git *pack,
 185                     uint32_t pos, void *data)
 186{
 187        struct child_process *cmd = data;
 188
 189        if (cmd->in == -1) {
 190                if (start_command(cmd))
 191                        die(_("could not start pack-objects to repack promisor objects"));
 192        }
 193
 194        xwrite(cmd->in, oid_to_hex(oid), GIT_SHA1_HEXSZ);
 195        xwrite(cmd->in, "\n", 1);
 196        return 0;
 197}
 198
 199static void repack_promisor_objects(const struct pack_objects_args *args,
 200                                    struct string_list *names)
 201{
 202        struct child_process cmd = CHILD_PROCESS_INIT;
 203        FILE *out;
 204        struct strbuf line = STRBUF_INIT;
 205
 206        prepare_pack_objects(&cmd, args);
 207        cmd.in = -1;
 208
 209        /*
 210         * NEEDSWORK: Giving pack-objects only the OIDs without any ordering
 211         * hints may result in suboptimal deltas in the resulting pack. See if
 212         * the OIDs can be sent with fake paths such that pack-objects can use a
 213         * {type -> existing pack order} ordering when computing deltas instead
 214         * of a {type -> size} ordering, which may produce better deltas.
 215         */
 216        for_each_packed_object(write_oid, &cmd,
 217                               FOR_EACH_OBJECT_PROMISOR_ONLY);
 218
 219        if (cmd.in == -1)
 220                /* No packed objects; cmd was never started */
 221                return;
 222
 223        close(cmd.in);
 224
 225        out = xfdopen(cmd.out, "r");
 226        while (strbuf_getline_lf(&line, out) != EOF) {
 227                char *promisor_name;
 228                int fd;
 229                if (line.len != the_hash_algo->hexsz)
 230                        die(_("repack: Expecting full hex object ID lines only from pack-objects."));
 231                string_list_append(names, line.buf);
 232
 233                /*
 234                 * pack-objects creates the .pack and .idx files, but not the
 235                 * .promisor file. Create the .promisor file, which is empty.
 236                 */
 237                promisor_name = mkpathdup("%s-%s.promisor", packtmp,
 238                                          line.buf);
 239                fd = open(promisor_name, O_CREAT|O_EXCL|O_WRONLY, 0600);
 240                if (fd < 0)
 241                        die_errno(_("unable to create '%s'"), promisor_name);
 242                close(fd);
 243                free(promisor_name);
 244        }
 245        fclose(out);
 246        if (finish_command(&cmd))
 247                die(_("could not finish pack-objects to repack promisor objects"));
 248}
 249
 250#define ALL_INTO_ONE 1
 251#define LOOSEN_UNREACHABLE 2
 252
 253int cmd_repack(int argc, const char **argv, const char *prefix)
 254{
 255        struct {
 256                const char *name;
 257                unsigned optional:1;
 258        } exts[] = {
 259                {".pack"},
 260                {".idx"},
 261                {".bitmap", 1},
 262                {".promisor", 1},
 263        };
 264        struct child_process cmd = CHILD_PROCESS_INIT;
 265        struct string_list_item *item;
 266        struct string_list names = STRING_LIST_INIT_DUP;
 267        struct string_list rollback = STRING_LIST_INIT_NODUP;
 268        struct string_list existing_packs = STRING_LIST_INIT_DUP;
 269        struct strbuf line = STRBUF_INIT;
 270        int i, ext, ret, failed;
 271        FILE *out;
 272
 273        /* variables to be filled by option parsing */
 274        int pack_everything = 0;
 275        int delete_redundant = 0;
 276        const char *unpack_unreachable = NULL;
 277        int keep_unreachable = 0;
 278        struct string_list keep_pack_list = STRING_LIST_INIT_NODUP;
 279        int no_update_server_info = 0;
 280        int midx_cleared = 0;
 281        struct pack_objects_args po_args = {NULL};
 282
 283        struct option builtin_repack_options[] = {
 284                OPT_BIT('a', NULL, &pack_everything,
 285                                N_("pack everything in a single pack"), ALL_INTO_ONE),
 286                OPT_BIT('A', NULL, &pack_everything,
 287                                N_("same as -a, and turn unreachable objects loose"),
 288                                   LOOSEN_UNREACHABLE | ALL_INTO_ONE),
 289                OPT_BOOL('d', NULL, &delete_redundant,
 290                                N_("remove redundant packs, and run git-prune-packed")),
 291                OPT_BOOL('f', NULL, &po_args.no_reuse_delta,
 292                                N_("pass --no-reuse-delta to git-pack-objects")),
 293                OPT_BOOL('F', NULL, &po_args.no_reuse_object,
 294                                N_("pass --no-reuse-object to git-pack-objects")),
 295                OPT_BOOL('n', NULL, &no_update_server_info,
 296                                N_("do not run git-update-server-info")),
 297                OPT__QUIET(&po_args.quiet, N_("be quiet")),
 298                OPT_BOOL('l', "local", &po_args.local,
 299                                N_("pass --local to git-pack-objects")),
 300                OPT_BOOL('b', "write-bitmap-index", &write_bitmaps,
 301                                N_("write bitmap index")),
 302                OPT_BOOL('i', "delta-islands", &use_delta_islands,
 303                                N_("pass --delta-islands to git-pack-objects")),
 304                OPT_STRING(0, "unpack-unreachable", &unpack_unreachable, N_("approxidate"),
 305                                N_("with -A, do not loosen objects older than this")),
 306                OPT_BOOL('k', "keep-unreachable", &keep_unreachable,
 307                                N_("with -a, repack unreachable objects")),
 308                OPT_STRING(0, "window", &po_args.window, N_("n"),
 309                                N_("size of the window used for delta compression")),
 310                OPT_STRING(0, "window-memory", &po_args.window_memory, N_("bytes"),
 311                                N_("same as the above, but limit memory size instead of entries count")),
 312                OPT_STRING(0, "depth", &po_args.depth, N_("n"),
 313                                N_("limits the maximum delta depth")),
 314                OPT_STRING(0, "threads", &po_args.threads, N_("n"),
 315                                N_("limits the maximum number of threads")),
 316                OPT_STRING(0, "max-pack-size", &po_args.max_pack_size, N_("bytes"),
 317                                N_("maximum size of each packfile")),
 318                OPT_BOOL(0, "pack-kept-objects", &pack_kept_objects,
 319                                N_("repack objects in packs marked with .keep")),
 320                OPT_STRING_LIST(0, "keep-pack", &keep_pack_list, N_("name"),
 321                                N_("do not repack this pack")),
 322                OPT_END()
 323        };
 324
 325        git_config(repack_config, NULL);
 326
 327        argc = parse_options(argc, argv, prefix, builtin_repack_options,
 328                                git_repack_usage, 0);
 329
 330        if (delete_redundant && repository_format_precious_objects)
 331                die(_("cannot delete packs in a precious-objects repo"));
 332
 333        if (keep_unreachable &&
 334            (unpack_unreachable || (pack_everything & LOOSEN_UNREACHABLE)))
 335                die(_("--keep-unreachable and -A are incompatible"));
 336
 337        if (write_bitmaps < 0) {
 338                if (!(pack_everything & ALL_INTO_ONE) ||
 339                    !is_bare_repository())
 340                        write_bitmaps = 0;
 341        }
 342        if (pack_kept_objects < 0)
 343                pack_kept_objects = write_bitmaps > 0;
 344
 345        if (write_bitmaps && !(pack_everything & ALL_INTO_ONE))
 346                die(_(incremental_bitmap_conflict_error));
 347
 348        packdir = mkpathdup("%s/pack", get_object_directory());
 349        packtmp = mkpathdup("%s/.tmp-%d-pack", packdir, (int)getpid());
 350
 351        sigchain_push_common(remove_pack_on_signal);
 352
 353        prepare_pack_objects(&cmd, &po_args);
 354
 355        argv_array_push(&cmd.args, "--keep-true-parents");
 356        if (!pack_kept_objects)
 357                argv_array_push(&cmd.args, "--honor-pack-keep");
 358        for (i = 0; i < keep_pack_list.nr; i++)
 359                argv_array_pushf(&cmd.args, "--keep-pack=%s",
 360                                 keep_pack_list.items[i].string);
 361        argv_array_push(&cmd.args, "--non-empty");
 362        argv_array_push(&cmd.args, "--all");
 363        argv_array_push(&cmd.args, "--reflog");
 364        argv_array_push(&cmd.args, "--indexed-objects");
 365        if (has_promisor_remote())
 366                argv_array_push(&cmd.args, "--exclude-promisor-objects");
 367        if (write_bitmaps > 0)
 368                argv_array_push(&cmd.args, "--write-bitmap-index");
 369        else if (write_bitmaps < 0)
 370                argv_array_push(&cmd.args, "--write-bitmap-index-quiet");
 371        if (use_delta_islands)
 372                argv_array_push(&cmd.args, "--delta-islands");
 373
 374        if (pack_everything & ALL_INTO_ONE) {
 375                get_non_kept_pack_filenames(&existing_packs, &keep_pack_list);
 376
 377                repack_promisor_objects(&po_args, &names);
 378
 379                if (existing_packs.nr && delete_redundant) {
 380                        if (unpack_unreachable) {
 381                                argv_array_pushf(&cmd.args,
 382                                                "--unpack-unreachable=%s",
 383                                                unpack_unreachable);
 384                                argv_array_push(&cmd.env_array, "GIT_REF_PARANOIA=1");
 385                        } else if (pack_everything & LOOSEN_UNREACHABLE) {
 386                                argv_array_push(&cmd.args,
 387                                                "--unpack-unreachable");
 388                        } else if (keep_unreachable) {
 389                                argv_array_push(&cmd.args, "--keep-unreachable");
 390                                argv_array_push(&cmd.args, "--pack-loose-unreachable");
 391                        } else {
 392                                argv_array_push(&cmd.env_array, "GIT_REF_PARANOIA=1");
 393                        }
 394                }
 395        } else {
 396                argv_array_push(&cmd.args, "--unpacked");
 397                argv_array_push(&cmd.args, "--incremental");
 398        }
 399
 400        cmd.no_stdin = 1;
 401
 402        ret = start_command(&cmd);
 403        if (ret)
 404                return ret;
 405
 406        out = xfdopen(cmd.out, "r");
 407        while (strbuf_getline_lf(&line, out) != EOF) {
 408                if (line.len != the_hash_algo->hexsz)
 409                        die(_("repack: Expecting full hex object ID lines only from pack-objects."));
 410                string_list_append(&names, line.buf);
 411        }
 412        fclose(out);
 413        ret = finish_command(&cmd);
 414        if (ret)
 415                return ret;
 416
 417        if (!names.nr && !po_args.quiet)
 418                printf_ln(_("Nothing new to pack."));
 419
 420        close_object_store(the_repository->objects);
 421
 422        /*
 423         * Ok we have prepared all new packfiles.
 424         * First see if there are packs of the same name and if so
 425         * if we can move them out of the way (this can happen if we
 426         * repacked immediately after packing fully.
 427         */
 428        failed = 0;
 429        for_each_string_list_item(item, &names) {
 430                for (ext = 0; ext < ARRAY_SIZE(exts); ext++) {
 431                        char *fname, *fname_old;
 432
 433                        if (!midx_cleared) {
 434                                clear_midx_file(the_repository);
 435                                midx_cleared = 1;
 436                        }
 437
 438                        fname = mkpathdup("%s/pack-%s%s", packdir,
 439                                                item->string, exts[ext].name);
 440                        if (!file_exists(fname)) {
 441                                free(fname);
 442                                continue;
 443                        }
 444
 445                        fname_old = mkpathdup("%s/old-%s%s", packdir,
 446                                                item->string, exts[ext].name);
 447                        if (file_exists(fname_old))
 448                                if (unlink(fname_old))
 449                                        failed = 1;
 450
 451                        if (!failed && rename(fname, fname_old)) {
 452                                free(fname);
 453                                free(fname_old);
 454                                failed = 1;
 455                                break;
 456                        } else {
 457                                string_list_append(&rollback, fname);
 458                                free(fname_old);
 459                        }
 460                }
 461                if (failed)
 462                        break;
 463        }
 464        if (failed) {
 465                struct string_list rollback_failure = STRING_LIST_INIT_DUP;
 466                for_each_string_list_item(item, &rollback) {
 467                        char *fname, *fname_old;
 468                        fname = mkpathdup("%s/%s", packdir, item->string);
 469                        fname_old = mkpathdup("%s/old-%s", packdir, item->string);
 470                        if (rename(fname_old, fname))
 471                                string_list_append(&rollback_failure, fname);
 472                        free(fname);
 473                        free(fname_old);
 474                }
 475
 476                if (rollback_failure.nr) {
 477                        int i;
 478                        fprintf(stderr,
 479                                _("WARNING: Some packs in use have been renamed by\n"
 480                                  "WARNING: prefixing old- to their name, in order to\n"
 481                                  "WARNING: replace them with the new version of the\n"
 482                                  "WARNING: file.  But the operation failed, and the\n"
 483                                  "WARNING: attempt to rename them back to their\n"
 484                                  "WARNING: original names also failed.\n"
 485                                  "WARNING: Please rename them in %s manually:\n"), packdir);
 486                        for (i = 0; i < rollback_failure.nr; i++)
 487                                fprintf(stderr, "WARNING:   old-%s -> %s\n",
 488                                        rollback_failure.items[i].string,
 489                                        rollback_failure.items[i].string);
 490                }
 491                exit(1);
 492        }
 493
 494        /* Now the ones with the same name are out of the way... */
 495        for_each_string_list_item(item, &names) {
 496                for (ext = 0; ext < ARRAY_SIZE(exts); ext++) {
 497                        char *fname, *fname_old;
 498                        struct stat statbuffer;
 499                        int exists = 0;
 500                        fname = mkpathdup("%s/pack-%s%s",
 501                                        packdir, item->string, exts[ext].name);
 502                        fname_old = mkpathdup("%s-%s%s",
 503                                        packtmp, item->string, exts[ext].name);
 504                        if (!stat(fname_old, &statbuffer)) {
 505                                statbuffer.st_mode &= ~(S_IWUSR | S_IWGRP | S_IWOTH);
 506                                chmod(fname_old, statbuffer.st_mode);
 507                                exists = 1;
 508                        }
 509                        if (exists || !exts[ext].optional) {
 510                                if (rename(fname_old, fname))
 511                                        die_errno(_("renaming '%s' failed"), fname_old);
 512                        }
 513                        free(fname);
 514                        free(fname_old);
 515                }
 516        }
 517
 518        /* Remove the "old-" files */
 519        for_each_string_list_item(item, &names) {
 520                for (ext = 0; ext < ARRAY_SIZE(exts); ext++) {
 521                        char *fname;
 522                        fname = mkpathdup("%s/old-%s%s",
 523                                          packdir,
 524                                          item->string,
 525                                          exts[ext].name);
 526                        if (remove_path(fname))
 527                                warning(_("failed to remove '%s'"), fname);
 528                        free(fname);
 529                }
 530        }
 531
 532        /* End of pack replacement. */
 533
 534        reprepare_packed_git(the_repository);
 535
 536        if (delete_redundant) {
 537                const int hexsz = the_hash_algo->hexsz;
 538                int opts = 0;
 539                string_list_sort(&names);
 540                for_each_string_list_item(item, &existing_packs) {
 541                        char *sha1;
 542                        size_t len = strlen(item->string);
 543                        if (len < hexsz)
 544                                continue;
 545                        sha1 = item->string + len - hexsz;
 546                        if (!string_list_has_string(&names, sha1))
 547                                remove_redundant_pack(packdir, item->string);
 548                }
 549                if (!po_args.quiet && isatty(2))
 550                        opts |= PRUNE_PACKED_VERBOSE;
 551                prune_packed_objects(opts);
 552
 553                if (!keep_unreachable &&
 554                    (!(pack_everything & LOOSEN_UNREACHABLE) ||
 555                     unpack_unreachable) &&
 556                    is_repository_shallow(the_repository))
 557                        prune_shallow(PRUNE_QUICK);
 558        }
 559
 560        if (!no_update_server_info)
 561                update_server_info(0);
 562        remove_temporary_files();
 563
 564        if (git_env_bool(GIT_TEST_MULTI_PACK_INDEX, 0))
 565                write_midx_file(get_object_directory());
 566
 567        string_list_clear(&names, 0);
 568        string_list_clear(&rollback, 0);
 569        string_list_clear(&existing_packs, 0);
 570        strbuf_release(&line);
 571
 572        return 0;
 573}