entry.c on commit streaming: convert open_istream to use struct object_id (ef7b519)
   1#include "cache.h"
   2#include "blob.h"
   3#include "dir.h"
   4#include "streaming.h"
   5#include "submodule.h"
   6#include "progress.h"
   7#include "fsmonitor.h"
   8
   9static void create_directories(const char *path, int path_len,
  10                               const struct checkout *state)
  11{
  12        char *buf = xmallocz(path_len);
  13        int len = 0;
  14
  15        while (len < path_len) {
  16                do {
  17                        buf[len] = path[len];
  18                        len++;
  19                } while (len < path_len && path[len] != '/');
  20                if (len >= path_len)
  21                        break;
  22                buf[len] = 0;
  23
  24                /*
  25                 * For 'checkout-index --prefix=<dir>', <dir> is
  26                 * allowed to be a symlink to an existing directory,
  27                 * and we set 'state->base_dir_len' below, such that
  28                 * we test the path components of the prefix with the
  29                 * stat() function instead of the lstat() function.
  30                 */
  31                if (has_dirs_only_path(buf, len, state->base_dir_len))
  32                        continue; /* ok, it is already a directory. */
  33
  34                /*
  35                 * If this mkdir() would fail, it could be that there
  36                 * is already a symlink or something else exists
  37                 * there, therefore we then try to unlink it and try
  38                 * one more time to create the directory.
  39                 */
  40                if (mkdir(buf, 0777)) {
  41                        if (errno == EEXIST && state->force &&
  42                            !unlink_or_warn(buf) && !mkdir(buf, 0777))
  43                                continue;
  44                        die_errno("cannot create directory at '%s'", buf);
  45                }
  46        }
  47        free(buf);
  48}
  49
  50static void remove_subtree(struct strbuf *path)
  51{
  52        DIR *dir = opendir(path->buf);
  53        struct dirent *de;
  54        int origlen = path->len;
  55
  56        if (!dir)
  57                die_errno("cannot opendir '%s'", path->buf);
  58        while ((de = readdir(dir)) != NULL) {
  59                struct stat st;
  60
  61                if (is_dot_or_dotdot(de->d_name))
  62                        continue;
  63
  64                strbuf_addch(path, '/');
  65                strbuf_addstr(path, de->d_name);
  66                if (lstat(path->buf, &st))
  67                        die_errno("cannot lstat '%s'", path->buf);
  68                if (S_ISDIR(st.st_mode))
  69                        remove_subtree(path);
  70                else if (unlink(path->buf))
  71                        die_errno("cannot unlink '%s'", path->buf);
  72                strbuf_setlen(path, origlen);
  73        }
  74        closedir(dir);
  75        if (rmdir(path->buf))
  76                die_errno("cannot rmdir '%s'", path->buf);
  77}
  78
  79static int create_file(const char *path, unsigned int mode)
  80{
  81        mode = (mode & 0100) ? 0777 : 0666;
  82        return open(path, O_WRONLY | O_CREAT | O_EXCL, mode);
  83}
  84
  85static void *read_blob_entry(const struct cache_entry *ce, unsigned long *size)
  86{
  87        enum object_type type;
  88        void *blob_data = read_sha1_file(ce->oid.hash, &type, size);
  89
  90        if (blob_data) {
  91                if (type == OBJ_BLOB)
  92                        return blob_data;
  93                free(blob_data);
  94        }
  95        return NULL;
  96}
  97
  98static int open_output_fd(char *path, const struct cache_entry *ce, int to_tempfile)
  99{
 100        int symlink = (ce->ce_mode & S_IFMT) != S_IFREG;
 101        if (to_tempfile) {
 102                xsnprintf(path, TEMPORARY_FILENAME_LENGTH, "%s",
 103                          symlink ? ".merge_link_XXXXXX" : ".merge_file_XXXXXX");
 104                return mkstemp(path);
 105        } else {
 106                return create_file(path, !symlink ? ce->ce_mode : 0666);
 107        }
 108}
 109
 110static int fstat_output(int fd, const struct checkout *state, struct stat *st)
 111{
 112        /* use fstat() only when path == ce->name */
 113        if (fstat_is_reliable() &&
 114            state->refresh_cache && !state->base_dir_len) {
 115                fstat(fd, st);
 116                return 1;
 117        }
 118        return 0;
 119}
 120
 121static int streaming_write_entry(const struct cache_entry *ce, char *path,
 122                                 struct stream_filter *filter,
 123                                 const struct checkout *state, int to_tempfile,
 124                                 int *fstat_done, struct stat *statbuf)
 125{
 126        int result = 0;
 127        int fd;
 128
 129        fd = open_output_fd(path, ce, to_tempfile);
 130        if (fd < 0)
 131                return -1;
 132
 133        result |= stream_blob_to_fd(fd, &ce->oid, filter, 1);
 134        *fstat_done = fstat_output(fd, state, statbuf);
 135        result |= close(fd);
 136
 137        if (result)
 138                unlink(path);
 139        return result;
 140}
 141
 142void enable_delayed_checkout(struct checkout *state)
 143{
 144        if (!state->delayed_checkout) {
 145                state->delayed_checkout = xmalloc(sizeof(*state->delayed_checkout));
 146                state->delayed_checkout->state = CE_CAN_DELAY;
 147                string_list_init(&state->delayed_checkout->filters, 0);
 148                string_list_init(&state->delayed_checkout->paths, 0);
 149        }
 150}
 151
 152static int remove_available_paths(struct string_list_item *item, void *cb_data)
 153{
 154        struct string_list *available_paths = cb_data;
 155        struct string_list_item *available;
 156
 157        available = string_list_lookup(available_paths, item->string);
 158        if (available)
 159                available->util = (void *)item->string;
 160        return !available;
 161}
 162
 163int finish_delayed_checkout(struct checkout *state)
 164{
 165        int errs = 0;
 166        unsigned delayed_object_count;
 167        off_t filtered_bytes = 0;
 168        struct string_list_item *filter, *path;
 169        struct progress *progress;
 170        struct delayed_checkout *dco = state->delayed_checkout;
 171
 172        if (!state->delayed_checkout)
 173                return errs;
 174
 175        dco->state = CE_RETRY;
 176        delayed_object_count = dco->paths.nr;
 177        progress = start_delayed_progress(_("Filtering content"), delayed_object_count);
 178        while (dco->filters.nr > 0) {
 179                for_each_string_list_item(filter, &dco->filters) {
 180                        struct string_list available_paths = STRING_LIST_INIT_NODUP;
 181                        display_progress(progress, delayed_object_count - dco->paths.nr);
 182
 183                        if (!async_query_available_blobs(filter->string, &available_paths)) {
 184                                /* Filter reported an error */
 185                                errs = 1;
 186                                filter->string = "";
 187                                continue;
 188                        }
 189                        if (available_paths.nr <= 0) {
 190                                /*
 191                                 * Filter responded with no entries. That means
 192                                 * the filter is done and we can remove the
 193                                 * filter from the list (see
 194                                 * "string_list_remove_empty_items" call below).
 195                                 */
 196                                filter->string = "";
 197                                continue;
 198                        }
 199
 200                        /*
 201                         * In dco->paths we store a list of all delayed paths.
 202                         * The filter just send us a list of available paths.
 203                         * Remove them from the list.
 204                         */
 205                        filter_string_list(&dco->paths, 0,
 206                                &remove_available_paths, &available_paths);
 207
 208                        for_each_string_list_item(path, &available_paths) {
 209                                struct cache_entry* ce;
 210
 211                                if (!path->util) {
 212                                        error("external filter '%s' signaled that '%s' "
 213                                              "is now available although it has not been "
 214                                              "delayed earlier",
 215                                              filter->string, path->string);
 216                                        errs |= 1;
 217
 218                                        /*
 219                                         * Do not ask the filter for available blobs,
 220                                         * again, as the filter is likely buggy.
 221                                         */
 222                                        filter->string = "";
 223                                        continue;
 224                                }
 225                                ce = index_file_exists(state->istate, path->string,
 226                                                       strlen(path->string), 0);
 227                                if (ce) {
 228                                        errs |= checkout_entry(ce, state, NULL);
 229                                        filtered_bytes += ce->ce_stat_data.sd_size;
 230                                        display_throughput(progress, filtered_bytes);
 231                                } else
 232                                        errs = 1;
 233                        }
 234                }
 235                string_list_remove_empty_items(&dco->filters, 0);
 236        }
 237        stop_progress(&progress);
 238        string_list_clear(&dco->filters, 0);
 239
 240        /* At this point we should not have any delayed paths anymore. */
 241        errs |= dco->paths.nr;
 242        for_each_string_list_item(path, &dco->paths) {
 243                error("'%s' was not filtered properly", path->string);
 244        }
 245        string_list_clear(&dco->paths, 0);
 246
 247        free(dco);
 248        state->delayed_checkout = NULL;
 249
 250        return errs;
 251}
 252
 253static int write_entry(struct cache_entry *ce,
 254                       char *path, const struct checkout *state, int to_tempfile)
 255{
 256        unsigned int ce_mode_s_ifmt = ce->ce_mode & S_IFMT;
 257        struct delayed_checkout *dco = state->delayed_checkout;
 258        int fd, ret, fstat_done = 0;
 259        char *new_blob;
 260        struct strbuf buf = STRBUF_INIT;
 261        unsigned long size;
 262        ssize_t wrote;
 263        size_t newsize = 0;
 264        struct stat st;
 265        const struct submodule *sub;
 266
 267        if (ce_mode_s_ifmt == S_IFREG) {
 268                struct stream_filter *filter = get_stream_filter(ce->name,
 269                                                                 ce->oid.hash);
 270                if (filter &&
 271                    !streaming_write_entry(ce, path, filter,
 272                                           state, to_tempfile,
 273                                           &fstat_done, &st))
 274                        goto finish;
 275        }
 276
 277        switch (ce_mode_s_ifmt) {
 278        case S_IFLNK:
 279                new_blob = read_blob_entry(ce, &size);
 280                if (!new_blob)
 281                        return error("unable to read sha1 file of %s (%s)",
 282                                     path, oid_to_hex(&ce->oid));
 283
 284                /*
 285                 * We can't make a real symlink; write out a regular file entry
 286                 * with the symlink destination as its contents.
 287                 */
 288                if (!has_symlinks || to_tempfile)
 289                        goto write_file_entry;
 290
 291                ret = symlink(new_blob, path);
 292                free(new_blob);
 293                if (ret)
 294                        return error_errno("unable to create symlink %s", path);
 295                break;
 296
 297        case S_IFREG:
 298                /*
 299                 * We do not send the blob in case of a retry, so do not
 300                 * bother reading it at all.
 301                 */
 302                if (dco && dco->state == CE_RETRY) {
 303                        new_blob = NULL;
 304                        size = 0;
 305                } else {
 306                        new_blob = read_blob_entry(ce, &size);
 307                        if (!new_blob)
 308                                return error("unable to read sha1 file of %s (%s)",
 309                                             path, oid_to_hex(&ce->oid));
 310                }
 311
 312                /*
 313                 * Convert from git internal format to working tree format
 314                 */
 315                if (dco && dco->state != CE_NO_DELAY) {
 316                        ret = async_convert_to_working_tree(ce->name, new_blob,
 317                                                            size, &buf, dco);
 318                        if (ret && string_list_has_string(&dco->paths, ce->name)) {
 319                                free(new_blob);
 320                                goto delayed;
 321                        }
 322                } else
 323                        ret = convert_to_working_tree(ce->name, new_blob, size, &buf);
 324
 325                if (ret) {
 326                        free(new_blob);
 327                        new_blob = strbuf_detach(&buf, &newsize);
 328                        size = newsize;
 329                }
 330                /*
 331                 * No "else" here as errors from convert are OK at this
 332                 * point. If the error would have been fatal (e.g.
 333                 * filter is required), then we would have died already.
 334                 */
 335
 336        write_file_entry:
 337                fd = open_output_fd(path, ce, to_tempfile);
 338                if (fd < 0) {
 339                        free(new_blob);
 340                        return error_errno("unable to create file %s", path);
 341                }
 342
 343                wrote = write_in_full(fd, new_blob, size);
 344                if (!to_tempfile)
 345                        fstat_done = fstat_output(fd, state, &st);
 346                close(fd);
 347                free(new_blob);
 348                if (wrote < 0)
 349                        return error("unable to write file %s", path);
 350                break;
 351
 352        case S_IFGITLINK:
 353                if (to_tempfile)
 354                        return error("cannot create temporary submodule %s", path);
 355                if (mkdir(path, 0777) < 0)
 356                        return error("cannot create submodule directory %s", path);
 357                sub = submodule_from_ce(ce);
 358                if (sub)
 359                        return submodule_move_head(ce->name,
 360                                NULL, oid_to_hex(&ce->oid),
 361                                state->force ? SUBMODULE_MOVE_HEAD_FORCE : 0);
 362                break;
 363
 364        default:
 365                return error("unknown file mode for %s in index", path);
 366        }
 367
 368finish:
 369        if (state->refresh_cache) {
 370                assert(state->istate);
 371                if (!fstat_done)
 372                        if (lstat(ce->name, &st) < 0)
 373                                return error_errno("unable to stat just-written file %s",
 374                                                   ce->name);
 375                fill_stat_cache_info(ce, &st);
 376                ce->ce_flags |= CE_UPDATE_IN_BASE;
 377                mark_fsmonitor_invalid(state->istate, ce);
 378                state->istate->cache_changed |= CE_ENTRY_CHANGED;
 379        }
 380delayed:
 381        return 0;
 382}
 383
 384/*
 385 * This is like 'lstat()', except it refuses to follow symlinks
 386 * in the path, after skipping "skiplen".
 387 */
 388static int check_path(const char *path, int len, struct stat *st, int skiplen)
 389{
 390        const char *slash = path + len;
 391
 392        while (path < slash && *slash != '/')
 393                slash--;
 394        if (!has_dirs_only_path(path, slash - path, skiplen)) {
 395                errno = ENOENT;
 396                return -1;
 397        }
 398        return lstat(path, st);
 399}
 400
 401/*
 402 * Write the contents from ce out to the working tree.
 403 *
 404 * When topath[] is not NULL, instead of writing to the working tree
 405 * file named by ce, a temporary file is created by this function and
 406 * its name is returned in topath[], which must be able to hold at
 407 * least TEMPORARY_FILENAME_LENGTH bytes long.
 408 */
 409int checkout_entry(struct cache_entry *ce,
 410                   const struct checkout *state, char *topath)
 411{
 412        static struct strbuf path = STRBUF_INIT;
 413        struct stat st;
 414
 415        if (topath)
 416                return write_entry(ce, topath, state, 1);
 417
 418        strbuf_reset(&path);
 419        strbuf_add(&path, state->base_dir, state->base_dir_len);
 420        strbuf_add(&path, ce->name, ce_namelen(ce));
 421
 422        if (!check_path(path.buf, path.len, &st, state->base_dir_len)) {
 423                const struct submodule *sub;
 424                unsigned changed = ce_match_stat(ce, &st, CE_MATCH_IGNORE_VALID|CE_MATCH_IGNORE_SKIP_WORKTREE);
 425                /*
 426                 * Needs to be checked before !changed returns early,
 427                 * as the possibly empty directory was not changed
 428                 */
 429                sub = submodule_from_ce(ce);
 430                if (sub) {
 431                        int err;
 432                        if (!is_submodule_populated_gently(ce->name, &err)) {
 433                                struct stat sb;
 434                                if (lstat(ce->name, &sb))
 435                                        die(_("could not stat file '%s'"), ce->name);
 436                                if (!(st.st_mode & S_IFDIR))
 437                                        unlink_or_warn(ce->name);
 438
 439                                return submodule_move_head(ce->name,
 440                                        NULL, oid_to_hex(&ce->oid), 0);
 441                        } else
 442                                return submodule_move_head(ce->name,
 443                                        "HEAD", oid_to_hex(&ce->oid),
 444                                        state->force ? SUBMODULE_MOVE_HEAD_FORCE : 0);
 445                }
 446
 447                if (!changed)
 448                        return 0;
 449                if (!state->force) {
 450                        if (!state->quiet)
 451                                fprintf(stderr,
 452                                        "%s already exists, no checkout\n",
 453                                        path.buf);
 454                        return -1;
 455                }
 456
 457                /*
 458                 * We unlink the old file, to get the new one with the
 459                 * right permissions (including umask, which is nasty
 460                 * to emulate by hand - much easier to let the system
 461                 * just do the right thing)
 462                 */
 463                if (S_ISDIR(st.st_mode)) {
 464                        /* If it is a gitlink, leave it alone! */
 465                        if (S_ISGITLINK(ce->ce_mode))
 466                                return 0;
 467                        if (!state->force)
 468                                return error("%s is a directory", path.buf);
 469                        remove_subtree(&path);
 470                } else if (unlink(path.buf))
 471                        return error_errno("unable to unlink old '%s'", path.buf);
 472        } else if (state->not_new)
 473                return 0;
 474
 475        create_directories(path.buf, path.len, state);
 476        return write_entry(ce, path.buf, state, 0);
 477}