submodule.c on commit "push, fetch: error out for submodule entries not pointing to commits" (3c96aa9)
   1#include "cache.h"
   2#include "repository.h"
   3#include "config.h"
   4#include "submodule-config.h"
   5#include "submodule.h"
   6#include "dir.h"
   7#include "diff.h"
   8#include "commit.h"
   9#include "revision.h"
  10#include "run-command.h"
  11#include "diffcore.h"
  12#include "refs.h"
  13#include "string-list.h"
  14#include "sha1-array.h"
  15#include "argv-array.h"
  16#include "blob.h"
  17#include "thread-utils.h"
  18#include "quote.h"
  19#include "remote.h"
  20#include "worktree.h"
  21#include "parse-options.h"
  22
/*
 * Recursion mode for commands that update the working tree. Written by
 * git_default_submodule_config() ("submodule.recurse") and by
 * option_parse_recurse_submodules_worktree_updater(); read by
 * should_update_submodules().
 */
static int config_update_recurse_submodules = RECURSE_SUBMODULES_OFF;
/*
 * NOTE(review): the users of the following four variables are not part of
 * this section of the file; presumably they are bookkeeping for recursive
 * fetch (changed submodule paths and ref tips before/after) -- confirm.
 */
static struct string_list changed_submodule_paths = STRING_LIST_INIT_DUP;
static int initialized_fetch_ref_tips;
static struct oid_array ref_tips_before_fetch;
static struct oid_array ref_tips_after_fetch;
  28
  29/*
  30 * Check if the .gitmodules file is unmerged. Parsing of the .gitmodules file
  31 * will be disabled because we can't guess what might be configured in
  32 * .gitmodules unless the user resolves the conflict.
  33 */
  34int is_gitmodules_unmerged(const struct index_state *istate)
  35{
  36        int pos = index_name_pos(istate, GITMODULES_FILE, strlen(GITMODULES_FILE));
  37        if (pos < 0) { /* .gitmodules not found or isn't merged */
  38                pos = -1 - pos;
  39                if (istate->cache_nr > pos) {  /* there is a .gitmodules */
  40                        const struct cache_entry *ce = istate->cache[pos];
  41                        if (ce_namelen(ce) == strlen(GITMODULES_FILE) &&
  42                            !strcmp(ce->name, GITMODULES_FILE))
  43                                return 1;
  44                }
  45        }
  46
  47        return 0;
  48}
  49
  50/*
  51 * Check if the .gitmodules file has unstaged modifications.  This must be
  52 * checked before allowing modifications to the .gitmodules file with the
  53 * intention to stage them later, because when continuing we would stage the
  54 * modifications the user didn't stage herself too. That might change in a
  55 * future version when we learn to stage the changes we do ourselves without
  56 * staging any previous modifications.
  57 */
  58int is_staging_gitmodules_ok(const struct index_state *istate)
  59{
  60        int pos = index_name_pos(istate, GITMODULES_FILE, strlen(GITMODULES_FILE));
  61
  62        if ((pos >= 0) && (pos < istate->cache_nr)) {
  63                struct stat st;
  64                if (lstat(GITMODULES_FILE, &st) == 0 &&
  65                    ce_match_stat(istate->cache[pos], &st, 0) & DATA_CHANGED)
  66                        return 0;
  67        }
  68
  69        return 1;
  70}
  71
  72/*
  73 * Try to update the "path" entry in the "submodule.<name>" section of the
  74 * .gitmodules file. Return 0 only if a .gitmodules file was found, a section
  75 * with the correct path=<oldpath> setting was found and we could update it.
  76 */
  77int update_path_in_gitmodules(const char *oldpath, const char *newpath)
  78{
  79        struct strbuf entry = STRBUF_INIT;
  80        const struct submodule *submodule;
  81
  82        if (!file_exists(GITMODULES_FILE)) /* Do nothing without .gitmodules */
  83                return -1;
  84
  85        if (is_gitmodules_unmerged(&the_index))
  86                die(_("Cannot change unmerged .gitmodules, resolve merge conflicts first"));
  87
  88        submodule = submodule_from_path(&null_oid, oldpath);
  89        if (!submodule || !submodule->name) {
  90                warning(_("Could not find section in .gitmodules where path=%s"), oldpath);
  91                return -1;
  92        }
  93        strbuf_addstr(&entry, "submodule.");
  94        strbuf_addstr(&entry, submodule->name);
  95        strbuf_addstr(&entry, ".path");
  96        if (git_config_set_in_file_gently(GITMODULES_FILE, entry.buf, newpath) < 0) {
  97                /* Maybe the user already did that, don't error out here */
  98                warning(_("Could not update .gitmodules entry %s"), entry.buf);
  99                strbuf_release(&entry);
 100                return -1;
 101        }
 102        strbuf_release(&entry);
 103        return 0;
 104}
 105
 106/*
 107 * Try to remove the "submodule.<name>" section from .gitmodules where the given
 108 * path is configured. Return 0 only if a .gitmodules file was found, a section
 109 * with the correct path=<path> setting was found and we could remove it.
 110 */
 111int remove_path_from_gitmodules(const char *path)
 112{
 113        struct strbuf sect = STRBUF_INIT;
 114        const struct submodule *submodule;
 115
 116        if (!file_exists(GITMODULES_FILE)) /* Do nothing without .gitmodules */
 117                return -1;
 118
 119        if (is_gitmodules_unmerged(&the_index))
 120                die(_("Cannot change unmerged .gitmodules, resolve merge conflicts first"));
 121
 122        submodule = submodule_from_path(&null_oid, path);
 123        if (!submodule || !submodule->name) {
 124                warning(_("Could not find section in .gitmodules where path=%s"), path);
 125                return -1;
 126        }
 127        strbuf_addstr(&sect, "submodule.");
 128        strbuf_addstr(&sect, submodule->name);
 129        if (git_config_rename_section_in_file(GITMODULES_FILE, sect.buf, NULL) < 0) {
 130                /* Maybe the user already did that, don't error out here */
 131                warning(_("Could not remove .gitmodules entry for %s"), path);
 132                strbuf_release(&sect);
 133                return -1;
 134        }
 135        strbuf_release(&sect);
 136        return 0;
 137}
 138
 139void stage_updated_gitmodules(void)
 140{
 141        if (add_file_to_cache(GITMODULES_FILE, 0))
 142                die(_("staging updated .gitmodules failed"));
 143}
 144
 145static int add_submodule_odb(const char *path)
 146{
 147        struct strbuf objects_directory = STRBUF_INIT;
 148        int ret = 0;
 149
 150        ret = strbuf_git_path_submodule(&objects_directory, path, "objects/");
 151        if (ret)
 152                goto done;
 153        if (!is_directory(objects_directory.buf)) {
 154                ret = -1;
 155                goto done;
 156        }
 157        add_to_alternates_memory(objects_directory.buf);
 158done:
 159        strbuf_release(&objects_directory);
 160        return ret;
 161}
 162
 163void set_diffopt_flags_from_submodule_config(struct diff_options *diffopt,
 164                                             const char *path)
 165{
 166        const struct submodule *submodule = submodule_from_path(&null_oid, path);
 167        if (submodule) {
 168                const char *ignore;
 169                char *key;
 170
 171                key = xstrfmt("submodule.%s.ignore", submodule->name);
 172                if (repo_config_get_string_const(the_repository, key, &ignore))
 173                        ignore = submodule->ignore;
 174                free(key);
 175
 176                if (ignore)
 177                        handle_ignore_submodules_arg(diffopt, ignore);
 178                else if (is_gitmodules_unmerged(&the_index))
 179                        DIFF_OPT_SET(diffopt, IGNORE_SUBMODULES);
 180        }
 181}
 182
 183/* Cheap function that only determines if we're interested in submodules at all */
 184int git_default_submodule_config(const char *var, const char *value, void *cb)
 185{
 186        if (!strcmp(var, "submodule.recurse")) {
 187                int v = git_config_bool(var, value) ?
 188                        RECURSE_SUBMODULES_ON : RECURSE_SUBMODULES_OFF;
 189                config_update_recurse_submodules = v;
 190        }
 191        return 0;
 192}
 193
 194int option_parse_recurse_submodules_worktree_updater(const struct option *opt,
 195                                                     const char *arg, int unset)
 196{
 197        if (unset) {
 198                config_update_recurse_submodules = RECURSE_SUBMODULES_OFF;
 199                return 0;
 200        }
 201        if (arg)
 202                config_update_recurse_submodules =
 203                        parse_update_recurse_submodules_arg(opt->long_name,
 204                                                            arg);
 205        else
 206                config_update_recurse_submodules = RECURSE_SUBMODULES_ON;
 207
 208        return 0;
 209}
 210
 211/*
 212 * Determine if a submodule has been initialized at a given 'path'
 213 */
 214int is_submodule_active(struct repository *repo, const char *path)
 215{
 216        int ret = 0;
 217        char *key = NULL;
 218        char *value = NULL;
 219        const struct string_list *sl;
 220        const struct submodule *module;
 221
 222        module = submodule_from_cache(repo, &null_oid, path);
 223
 224        /* early return if there isn't a path->module mapping */
 225        if (!module)
 226                return 0;
 227
 228        /* submodule.<name>.active is set */
 229        key = xstrfmt("submodule.%s.active", module->name);
 230        if (!repo_config_get_bool(repo, key, &ret)) {
 231                free(key);
 232                return ret;
 233        }
 234        free(key);
 235
 236        /* submodule.active is set */
 237        sl = repo_config_get_value_multi(repo, "submodule.active");
 238        if (sl) {
 239                struct pathspec ps;
 240                struct argv_array args = ARGV_ARRAY_INIT;
 241                const struct string_list_item *item;
 242
 243                for_each_string_list_item(item, sl) {
 244                        argv_array_push(&args, item->string);
 245                }
 246
 247                parse_pathspec(&ps, 0, 0, NULL, args.argv);
 248                ret = match_pathspec(&ps, path, strlen(path), 0, NULL, 1);
 249
 250                argv_array_clear(&args);
 251                clear_pathspec(&ps);
 252                return ret;
 253        }
 254
 255        /* fallback to checking if the URL is set */
 256        key = xstrfmt("submodule.%s.url", module->name);
 257        ret = !repo_config_get_string(repo, key, &value);
 258
 259        free(value);
 260        free(key);
 261        return ret;
 262}
 263
 264int is_submodule_populated_gently(const char *path, int *return_error_code)
 265{
 266        int ret = 0;
 267        char *gitdir = xstrfmt("%s/.git", path);
 268
 269        if (resolve_gitdir_gently(gitdir, return_error_code))
 270                ret = 1;
 271
 272        free(gitdir);
 273        return ret;
 274}
 275
 276/*
 277 * Dies if the provided 'prefix' corresponds to an unpopulated submodule
 278 */
 279void die_in_unpopulated_submodule(const struct index_state *istate,
 280                                  const char *prefix)
 281{
 282        int i, prefixlen;
 283
 284        if (!prefix)
 285                return;
 286
 287        prefixlen = strlen(prefix);
 288
 289        for (i = 0; i < istate->cache_nr; i++) {
 290                struct cache_entry *ce = istate->cache[i];
 291                int ce_len = ce_namelen(ce);
 292
 293                if (!S_ISGITLINK(ce->ce_mode))
 294                        continue;
 295                if (prefixlen <= ce_len)
 296                        continue;
 297                if (strncmp(ce->name, prefix, ce_len))
 298                        continue;
 299                if (prefix[ce_len] != '/')
 300                        continue;
 301
 302                die(_("in unpopulated submodule '%s'"), ce->name);
 303        }
 304}
 305
 306/*
 307 * Dies if any paths in the provided pathspec descends into a submodule
 308 */
 309void die_path_inside_submodule(const struct index_state *istate,
 310                               const struct pathspec *ps)
 311{
 312        int i, j;
 313
 314        for (i = 0; i < istate->cache_nr; i++) {
 315                struct cache_entry *ce = istate->cache[i];
 316                int ce_len = ce_namelen(ce);
 317
 318                if (!S_ISGITLINK(ce->ce_mode))
 319                        continue;
 320
 321                for (j = 0; j < ps->nr ; j++) {
 322                        const struct pathspec_item *item = &ps->items[j];
 323
 324                        if (item->len <= ce_len)
 325                                continue;
 326                        if (item->match[ce_len] != '/')
 327                                continue;
 328                        if (strncmp(ce->name, item->match, ce_len))
 329                                continue;
 330                        if (item->len == ce_len + 1)
 331                                continue;
 332
 333                        die(_("Pathspec '%s' is in submodule '%.*s'"),
 334                            item->original, ce_len, ce->name);
 335                }
 336        }
 337}
 338
 339enum submodule_update_type parse_submodule_update_type(const char *value)
 340{
 341        if (!strcmp(value, "none"))
 342                return SM_UPDATE_NONE;
 343        else if (!strcmp(value, "checkout"))
 344                return SM_UPDATE_CHECKOUT;
 345        else if (!strcmp(value, "rebase"))
 346                return SM_UPDATE_REBASE;
 347        else if (!strcmp(value, "merge"))
 348                return SM_UPDATE_MERGE;
 349        else if (*value == '!')
 350                return SM_UPDATE_COMMAND;
 351        else
 352                return SM_UPDATE_UNSPECIFIED;
 353}
 354
 355int parse_submodule_update_strategy(const char *value,
 356                struct submodule_update_strategy *dst)
 357{
 358        enum submodule_update_type type;
 359
 360        free((void*)dst->command);
 361        dst->command = NULL;
 362
 363        type = parse_submodule_update_type(value);
 364        if (type == SM_UPDATE_UNSPECIFIED)
 365                return -1;
 366
 367        dst->type = type;
 368        if (type == SM_UPDATE_COMMAND)
 369                dst->command = xstrdup(value + 1);
 370
 371        return 0;
 372}
 373
 374const char *submodule_strategy_to_string(const struct submodule_update_strategy *s)
 375{
 376        struct strbuf sb = STRBUF_INIT;
 377        switch (s->type) {
 378        case SM_UPDATE_CHECKOUT:
 379                return "checkout";
 380        case SM_UPDATE_MERGE:
 381                return "merge";
 382        case SM_UPDATE_REBASE:
 383                return "rebase";
 384        case SM_UPDATE_NONE:
 385                return "none";
 386        case SM_UPDATE_UNSPECIFIED:
 387                return NULL;
 388        case SM_UPDATE_COMMAND:
 389                strbuf_addf(&sb, "!%s", s->command);
 390                return strbuf_detach(&sb, NULL);
 391        }
 392        return NULL;
 393}
 394
 395void handle_ignore_submodules_arg(struct diff_options *diffopt,
 396                                  const char *arg)
 397{
 398        DIFF_OPT_CLR(diffopt, IGNORE_SUBMODULES);
 399        DIFF_OPT_CLR(diffopt, IGNORE_UNTRACKED_IN_SUBMODULES);
 400        DIFF_OPT_CLR(diffopt, IGNORE_DIRTY_SUBMODULES);
 401
 402        if (!strcmp(arg, "all"))
 403                DIFF_OPT_SET(diffopt, IGNORE_SUBMODULES);
 404        else if (!strcmp(arg, "untracked"))
 405                DIFF_OPT_SET(diffopt, IGNORE_UNTRACKED_IN_SUBMODULES);
 406        else if (!strcmp(arg, "dirty"))
 407                DIFF_OPT_SET(diffopt, IGNORE_DIRTY_SUBMODULES);
 408        else if (strcmp(arg, "none"))
 409                die("bad --ignore-submodules argument: %s", arg);
 410}
 411
 412static int prepare_submodule_summary(struct rev_info *rev, const char *path,
 413                struct commit *left, struct commit *right,
 414                struct commit_list *merge_bases)
 415{
 416        struct commit_list *list;
 417
 418        init_revisions(rev, NULL);
 419        setup_revisions(0, NULL, rev, NULL);
 420        rev->left_right = 1;
 421        rev->first_parent_only = 1;
 422        left->object.flags |= SYMMETRIC_LEFT;
 423        add_pending_object(rev, &left->object, path);
 424        add_pending_object(rev, &right->object, path);
 425        for (list = merge_bases; list; list = list->next) {
 426                list->item->object.flags |= UNINTERESTING;
 427                add_pending_object(rev, &list->item->object,
 428                        oid_to_hex(&list->item->object.oid));
 429        }
 430        return prepare_revision_walk(rev);
 431}
 432
 433static void print_submodule_summary(struct rev_info *rev, struct diff_options *o)
 434{
 435        static const char format[] = "  %m %s";
 436        struct strbuf sb = STRBUF_INIT;
 437        struct commit *commit;
 438
 439        while ((commit = get_revision(rev))) {
 440                struct pretty_print_context ctx = {0};
 441                ctx.date_mode = rev->date_mode;
 442                ctx.output_encoding = get_log_output_encoding();
 443                strbuf_setlen(&sb, 0);
 444                format_commit_message(commit, format, &sb, &ctx);
 445                strbuf_addch(&sb, '\n');
 446                if (commit->object.flags & SYMMETRIC_LEFT)
 447                        diff_emit_submodule_del(o, sb.buf);
 448                else
 449                        diff_emit_submodule_add(o, sb.buf);
 450        }
 451        strbuf_release(&sb);
 452}
 453
 454static void prepare_submodule_repo_env_no_git_dir(struct argv_array *out)
 455{
 456        const char * const *var;
 457
 458        for (var = local_repo_env; *var; var++) {
 459                if (strcmp(*var, CONFIG_DATA_ENVIRONMENT))
 460                        argv_array_push(out, *var);
 461        }
 462}
 463
 464void prepare_submodule_repo_env(struct argv_array *out)
 465{
 466        prepare_submodule_repo_env_no_git_dir(out);
 467        argv_array_pushf(out, "%s=%s", GIT_DIR_ENVIRONMENT,
 468                         DEFAULT_GIT_DIR_ENVIRONMENT);
 469}
 470
 471/* Helper function to display the submodule header line prior to the full
 472 * summary output. If it can locate the submodule objects directory it will
 473 * attempt to lookup both the left and right commits and put them into the
 474 * left and right pointers.
 475 */
 476static void show_submodule_header(struct diff_options *o, const char *path,
 477                struct object_id *one, struct object_id *two,
 478                unsigned dirty_submodule,
 479                struct commit **left, struct commit **right,
 480                struct commit_list **merge_bases)
 481{
 482        const char *message = NULL;
 483        struct strbuf sb = STRBUF_INIT;
 484        int fast_forward = 0, fast_backward = 0;
 485
 486        if (dirty_submodule & DIRTY_SUBMODULE_UNTRACKED)
 487                diff_emit_submodule_untracked(o, path);
 488
 489        if (dirty_submodule & DIRTY_SUBMODULE_MODIFIED)
 490                diff_emit_submodule_modified(o, path);
 491
 492        if (is_null_oid(one))
 493                message = "(new submodule)";
 494        else if (is_null_oid(two))
 495                message = "(submodule deleted)";
 496
 497        if (add_submodule_odb(path)) {
 498                if (!message)
 499                        message = "(not initialized)";
 500                goto output_header;
 501        }
 502
 503        /*
 504         * Attempt to lookup the commit references, and determine if this is
 505         * a fast forward or fast backwards update.
 506         */
 507        *left = lookup_commit_reference(one);
 508        *right = lookup_commit_reference(two);
 509
 510        /*
 511         * Warn about missing commits in the submodule project, but only if
 512         * they aren't null.
 513         */
 514        if ((!is_null_oid(one) && !*left) ||
 515             (!is_null_oid(two) && !*right))
 516                message = "(commits not present)";
 517
 518        *merge_bases = get_merge_bases(*left, *right);
 519        if (*merge_bases) {
 520                if ((*merge_bases)->item == *left)
 521                        fast_forward = 1;
 522                else if ((*merge_bases)->item == *right)
 523                        fast_backward = 1;
 524        }
 525
 526        if (!oidcmp(one, two)) {
 527                strbuf_release(&sb);
 528                return;
 529        }
 530
 531output_header:
 532        strbuf_addf(&sb, "Submodule %s ", path);
 533        strbuf_add_unique_abbrev(&sb, one->hash, DEFAULT_ABBREV);
 534        strbuf_addstr(&sb, (fast_backward || fast_forward) ? ".." : "...");
 535        strbuf_add_unique_abbrev(&sb, two->hash, DEFAULT_ABBREV);
 536        if (message)
 537                strbuf_addf(&sb, " %s\n", message);
 538        else
 539                strbuf_addf(&sb, "%s:\n", fast_backward ? " (rewind)" : "");
 540        diff_emit_submodule_header(o, sb.buf);
 541
 542        strbuf_release(&sb);
 543}
 544
 545void show_submodule_summary(struct diff_options *o, const char *path,
 546                struct object_id *one, struct object_id *two,
 547                unsigned dirty_submodule)
 548{
 549        struct rev_info rev;
 550        struct commit *left = NULL, *right = NULL;
 551        struct commit_list *merge_bases = NULL;
 552
 553        show_submodule_header(o, path, one, two, dirty_submodule,
 554                              &left, &right, &merge_bases);
 555
 556        /*
 557         * If we don't have both a left and a right pointer, there is no
 558         * reason to try and display a summary. The header line should contain
 559         * all the information the user needs.
 560         */
 561        if (!left || !right)
 562                goto out;
 563
 564        /* Treat revision walker failure the same as missing commits */
 565        if (prepare_submodule_summary(&rev, path, left, right, merge_bases)) {
 566                diff_emit_submodule_error(o, "(revision walker failed)\n");
 567                goto out;
 568        }
 569
 570        print_submodule_summary(&rev, o);
 571
 572out:
 573        if (merge_bases)
 574                free_commit_list(merge_bases);
 575        clear_commit_marks(left, ~0);
 576        clear_commit_marks(right, ~0);
 577}
 578
 579void show_submodule_inline_diff(struct diff_options *o, const char *path,
 580                struct object_id *one, struct object_id *two,
 581                unsigned dirty_submodule)
 582{
 583        const struct object_id *old = &empty_tree_oid, *new = &empty_tree_oid;
 584        struct commit *left = NULL, *right = NULL;
 585        struct commit_list *merge_bases = NULL;
 586        struct child_process cp = CHILD_PROCESS_INIT;
 587        struct strbuf sb = STRBUF_INIT;
 588
 589        show_submodule_header(o, path, one, two, dirty_submodule,
 590                              &left, &right, &merge_bases);
 591
 592        /* We need a valid left and right commit to display a difference */
 593        if (!(left || is_null_oid(one)) ||
 594            !(right || is_null_oid(two)))
 595                goto done;
 596
 597        if (left)
 598                old = one;
 599        if (right)
 600                new = two;
 601
 602        cp.git_cmd = 1;
 603        cp.dir = path;
 604        cp.out = -1;
 605        cp.no_stdin = 1;
 606
 607        /* TODO: other options may need to be passed here. */
 608        argv_array_pushl(&cp.args, "diff", "--submodule=diff", NULL);
 609        argv_array_pushf(&cp.args, "--color=%s", want_color(o->use_color) ?
 610                         "always" : "never");
 611
 612        if (DIFF_OPT_TST(o, REVERSE_DIFF)) {
 613                argv_array_pushf(&cp.args, "--src-prefix=%s%s/",
 614                                 o->b_prefix, path);
 615                argv_array_pushf(&cp.args, "--dst-prefix=%s%s/",
 616                                 o->a_prefix, path);
 617        } else {
 618                argv_array_pushf(&cp.args, "--src-prefix=%s%s/",
 619                                 o->a_prefix, path);
 620                argv_array_pushf(&cp.args, "--dst-prefix=%s%s/",
 621                                 o->b_prefix, path);
 622        }
 623        argv_array_push(&cp.args, oid_to_hex(old));
 624        /*
 625         * If the submodule has modified content, we will diff against the
 626         * work tree, under the assumption that the user has asked for the
 627         * diff format and wishes to actually see all differences even if they
 628         * haven't yet been committed to the submodule yet.
 629         */
 630        if (!(dirty_submodule & DIRTY_SUBMODULE_MODIFIED))
 631                argv_array_push(&cp.args, oid_to_hex(new));
 632
 633        prepare_submodule_repo_env(&cp.env_array);
 634        if (start_command(&cp))
 635                diff_emit_submodule_error(o, "(diff failed)\n");
 636
 637        while (strbuf_getwholeline_fd(&sb, cp.out, '\n') != EOF)
 638                diff_emit_submodule_pipethrough(o, sb.buf, sb.len);
 639
 640        if (finish_command(&cp))
 641                diff_emit_submodule_error(o, "(diff failed)\n");
 642
 643done:
 644        strbuf_release(&sb);
 645        if (merge_bases)
 646                free_commit_list(merge_bases);
 647        if (left)
 648                clear_commit_marks(left, ~0);
 649        if (right)
 650                clear_commit_marks(right, ~0);
 651}
 652
 653int should_update_submodules(void)
 654{
 655        return config_update_recurse_submodules == RECURSE_SUBMODULES_ON;
 656}
 657
 658const struct submodule *submodule_from_ce(const struct cache_entry *ce)
 659{
 660        if (!S_ISGITLINK(ce->ce_mode))
 661                return NULL;
 662
 663        if (!should_update_submodules())
 664                return NULL;
 665
 666        return submodule_from_path(&null_oid, ce->name);
 667}
 668
 669static struct oid_array *submodule_commits(struct string_list *submodules,
 670                                           const char *path)
 671{
 672        struct string_list_item *item;
 673
 674        item = string_list_insert(submodules, path);
 675        if (item->util)
 676                return (struct oid_array *) item->util;
 677
 678        /* NEEDSWORK: should we have oid_array_init()? */
 679        item->util = xcalloc(1, sizeof(struct oid_array));
 680        return (struct oid_array *) item->util;
 681}
 682
 683static void collect_changed_submodules_cb(struct diff_queue_struct *q,
 684                                          struct diff_options *options,
 685                                          void *data)
 686{
 687        int i;
 688        struct string_list *changed = data;
 689
 690        for (i = 0; i < q->nr; i++) {
 691                struct diff_filepair *p = q->queue[i];
 692                struct oid_array *commits;
 693                if (!S_ISGITLINK(p->two->mode))
 694                        continue;
 695
 696                if (S_ISGITLINK(p->one->mode)) {
 697                        /*
 698                         * NEEDSWORK: We should honor the name configured in
 699                         * the .gitmodules file of the commit we are examining
 700                         * here to be able to correctly follow submodules
 701                         * being moved around.
 702                         */
 703                        commits = submodule_commits(changed, p->two->path);
 704                        oid_array_append(commits, &p->two->oid);
 705                } else {
 706                        /* Submodule is new or was moved here */
 707                        /*
 708                         * NEEDSWORK: When the .git directories of submodules
 709                         * live inside the superprojects .git directory some
 710                         * day we should fetch new submodules directly into
 711                         * that location too when config or options request
 712                         * that so they can be checked out from there.
 713                         */
 714                        continue;
 715                }
 716        }
 717}
 718
 719/*
 720 * Collect the paths of submodules in 'changed' which have changed based on
 721 * the revisions as specified in 'argv'.  Each entry in 'changed' will also
 722 * have a corresponding 'struct oid_array' (in the 'util' field) which lists
 723 * what the submodule pointers were updated to during the change.
 724 */
 725static void collect_changed_submodules(struct string_list *changed,
 726                                       struct argv_array *argv)
 727{
 728        struct rev_info rev;
 729        const struct commit *commit;
 730
 731        init_revisions(&rev, NULL);
 732        setup_revisions(argv->argc, argv->argv, &rev, NULL);
 733        if (prepare_revision_walk(&rev))
 734                die("revision walk setup failed");
 735
 736        while ((commit = get_revision(&rev))) {
 737                struct rev_info diff_rev;
 738
 739                init_revisions(&diff_rev, NULL);
 740                diff_rev.diffopt.output_format |= DIFF_FORMAT_CALLBACK;
 741                diff_rev.diffopt.format_callback = collect_changed_submodules_cb;
 742                diff_rev.diffopt.format_callback_data = changed;
 743                diff_tree_combined_merge(commit, 1, &diff_rev);
 744        }
 745
 746        reset_revision_walk();
 747}
 748
 749static void free_submodules_oids(struct string_list *submodules)
 750{
 751        struct string_list_item *item;
 752        for_each_string_list_item(item, submodules)
 753                oid_array_clear((struct oid_array *) item->util);
 754        string_list_clear(submodules, 1);
 755}
 756
 757static int has_remote(const char *refname, const struct object_id *oid,
 758                      int flags, void *cb_data)
 759{
 760        return 1;
 761}
 762
 763static int append_oid_to_argv(const struct object_id *oid, void *data)
 764{
 765        struct argv_array *argv = data;
 766        argv_array_push(argv, oid_to_hex(oid));
 767        return 0;
 768}
 769
/*
 * State shared between submodule_has_commits() and its per-object callback
 * check_has_commit().
 */
struct has_commit_data {
        /* starts out as 1; set to 0 once an object is missing or invalid */
        int result;
        /* path of the submodule being checked; only used in error messages */
        const char *path;
};
 774
 775static int check_has_commit(const struct object_id *oid, void *data)
 776{
 777        struct has_commit_data *cb = data;
 778
 779        enum object_type type = sha1_object_info(oid->hash, NULL);
 780
 781        switch (type) {
 782        case OBJ_COMMIT:
 783                return 0;
 784        case OBJ_BAD:
 785                /*
 786                 * Object is missing or invalid. If invalid, an error message
 787                 * has already been printed.
 788                 */
 789                cb->result = 0;
 790                return 0;
 791        default:
 792                die(_("submodule entry '%s' (%s) is a %s, not a commit"),
 793                    cb->path, oid_to_hex(oid), typename(type));
 794        }
 795}
 796
 797static int submodule_has_commits(const char *path, struct oid_array *commits)
 798{
 799        struct has_commit_data has_commit = { 1, path };
 800
 801        /*
 802         * Perform a cheap, but incorrect check for the existence of 'commits'.
 803         * This is done by adding the submodule's object store to the in-core
 804         * object store, and then querying for each commit's existence.  If we
 805         * do not have the commit object anywhere, there is no chance we have
 806         * it in the object store of the correct submodule and have it
 807         * reachable from a ref, so we can fail early without spawning rev-list
 808         * which is expensive.
 809         */
 810        if (add_submodule_odb(path))
 811                return 0;
 812
 813        oid_array_for_each_unique(commits, check_has_commit, &has_commit);
 814
 815        if (has_commit.result) {
 816                /*
 817                 * Even if the submodule is checked out and the commit is
 818                 * present, make sure it exists in the submodule's object store
 819                 * and that it is reachable from a ref.
 820                 */
 821                struct child_process cp = CHILD_PROCESS_INIT;
 822                struct strbuf out = STRBUF_INIT;
 823
 824                argv_array_pushl(&cp.args, "rev-list", "-n", "1", NULL);
 825                oid_array_for_each_unique(commits, append_oid_to_argv, &cp.args);
 826                argv_array_pushl(&cp.args, "--not", "--all", NULL);
 827
 828                prepare_submodule_repo_env(&cp.env_array);
 829                cp.git_cmd = 1;
 830                cp.no_stdin = 1;
 831                cp.dir = path;
 832
 833                if (capture_command(&cp, &out, GIT_MAX_HEXSZ + 1) || out.len)
 834                        has_commit.result = 0;
 835
 836                strbuf_release(&out);
 837        }
 838
 839        return has_commit.result;
 840}
 841
 842static int submodule_needs_pushing(const char *path, struct oid_array *commits)
 843{
 844        if (!submodule_has_commits(path, commits))
 845                /*
 846                 * NOTE: We do consider it safe to return "no" here. The
 847                 * correct answer would be "We do not know" instead of
 848                 * "No push needed", but it is quite hard to change
 849                 * the submodule pointer without having the submodule
 850                 * around. If a user did however change the submodules
 851                 * without having the submodule around, this indicates
 852                 * an expert who knows what they are doing or a
 853                 * maintainer integrating work from other people. In
 854                 * both cases it should be safe to skip this check.
 855                 */
 856                return 0;
 857
 858        if (for_each_remote_ref_submodule(path, has_remote, NULL) > 0) {
 859                struct child_process cp = CHILD_PROCESS_INIT;
 860                struct strbuf buf = STRBUF_INIT;
 861                int needs_pushing = 0;
 862
 863                argv_array_push(&cp.args, "rev-list");
 864                oid_array_for_each_unique(commits, append_oid_to_argv, &cp.args);
 865                argv_array_pushl(&cp.args, "--not", "--remotes", "-n", "1" , NULL);
 866
 867                prepare_submodule_repo_env(&cp.env_array);
 868                cp.git_cmd = 1;
 869                cp.no_stdin = 1;
 870                cp.out = -1;
 871                cp.dir = path;
 872                if (start_command(&cp))
 873                        die("Could not run 'git rev-list <commits> --not --remotes -n 1' command in submodule %s",
 874                                        path);
 875                if (strbuf_read(&buf, cp.out, 41))
 876                        needs_pushing = 1;
 877                finish_command(&cp);
 878                close(cp.out);
 879                strbuf_release(&buf);
 880                return needs_pushing;
 881        }
 882
 883        return 0;
 884}
 885
 886int find_unpushed_submodules(struct oid_array *commits,
 887                const char *remotes_name, struct string_list *needs_pushing)
 888{
 889        struct string_list submodules = STRING_LIST_INIT_DUP;
 890        struct string_list_item *submodule;
 891        struct argv_array argv = ARGV_ARRAY_INIT;
 892
 893        /* argv.argv[0] will be ignored by setup_revisions */
 894        argv_array_push(&argv, "find_unpushed_submodules");
 895        oid_array_for_each_unique(commits, append_oid_to_argv, &argv);
 896        argv_array_push(&argv, "--not");
 897        argv_array_pushf(&argv, "--remotes=%s", remotes_name);
 898
 899        collect_changed_submodules(&submodules, &argv);
 900
 901        for_each_string_list_item(submodule, &submodules) {
 902                struct oid_array *commits = submodule->util;
 903                const char *path = submodule->string;
 904
 905                if (submodule_needs_pushing(path, commits))
 906                        string_list_insert(needs_pushing, path);
 907        }
 908
 909        free_submodules_oids(&submodules);
 910        argv_array_clear(&argv);
 911
 912        return needs_pushing->nr;
 913}
 914
 915static int push_submodule(const char *path,
 916                          const struct remote *remote,
 917                          const char **refspec, int refspec_nr,
 918                          const struct string_list *push_options,
 919                          int dry_run)
 920{
 921        if (add_submodule_odb(path))
 922                return 1;
 923
 924        if (for_each_remote_ref_submodule(path, has_remote, NULL) > 0) {
 925                struct child_process cp = CHILD_PROCESS_INIT;
 926                argv_array_push(&cp.args, "push");
 927                if (dry_run)
 928                        argv_array_push(&cp.args, "--dry-run");
 929
 930                if (push_options && push_options->nr) {
 931                        const struct string_list_item *item;
 932                        for_each_string_list_item(item, push_options)
 933                                argv_array_pushf(&cp.args, "--push-option=%s",
 934                                                 item->string);
 935                }
 936
 937                if (remote->origin != REMOTE_UNCONFIGURED) {
 938                        int i;
 939                        argv_array_push(&cp.args, remote->name);
 940                        for (i = 0; i < refspec_nr; i++)
 941                                argv_array_push(&cp.args, refspec[i]);
 942                }
 943
 944                prepare_submodule_repo_env(&cp.env_array);
 945                cp.git_cmd = 1;
 946                cp.no_stdin = 1;
 947                cp.dir = path;
 948                if (run_command(&cp))
 949                        return 0;
 950                close(cp.out);
 951        }
 952
 953        return 1;
 954}
 955
 956/*
 957 * Perform a check in the submodule to see if the remote and refspec work.
 958 * Die if the submodule can't be pushed.
 959 */
 960static void submodule_push_check(const char *path, const char *head,
 961                                 const struct remote *remote,
 962                                 const char **refspec, int refspec_nr)
 963{
 964        struct child_process cp = CHILD_PROCESS_INIT;
 965        int i;
 966
 967        argv_array_push(&cp.args, "submodule--helper");
 968        argv_array_push(&cp.args, "push-check");
 969        argv_array_push(&cp.args, head);
 970        argv_array_push(&cp.args, remote->name);
 971
 972        for (i = 0; i < refspec_nr; i++)
 973                argv_array_push(&cp.args, refspec[i]);
 974
 975        prepare_submodule_repo_env(&cp.env_array);
 976        cp.git_cmd = 1;
 977        cp.no_stdin = 1;
 978        cp.no_stdout = 1;
 979        cp.dir = path;
 980
 981        /*
 982         * Simply indicate if 'submodule--helper push-check' failed.
 983         * More detailed error information will be provided by the
 984         * child process.
 985         */
 986        if (run_command(&cp))
 987                die("process for submodule '%s' failed", path);
 988}
 989
 990int push_unpushed_submodules(struct oid_array *commits,
 991                             const struct remote *remote,
 992                             const char **refspec, int refspec_nr,
 993                             const struct string_list *push_options,
 994                             int dry_run)
 995{
 996        int i, ret = 1;
 997        struct string_list needs_pushing = STRING_LIST_INIT_DUP;
 998
 999        if (!find_unpushed_submodules(commits, remote->name, &needs_pushing))
1000                return 1;
1001
1002        /*
1003         * Verify that the remote and refspec can be propagated to all
1004         * submodules.  This check can be skipped if the remote and refspec
1005         * won't be propagated due to the remote being unconfigured (e.g. a URL
1006         * instead of a remote name).
1007         */
1008        if (remote->origin != REMOTE_UNCONFIGURED) {
1009                char *head;
1010                struct object_id head_oid;
1011
1012                head = resolve_refdup("HEAD", 0, head_oid.hash, NULL);
1013                if (!head)
1014                        die(_("Failed to resolve HEAD as a valid ref."));
1015
1016                for (i = 0; i < needs_pushing.nr; i++)
1017                        submodule_push_check(needs_pushing.items[i].string,
1018                                             head, remote,
1019                                             refspec, refspec_nr);
1020                free(head);
1021        }
1022
1023        /* Actually push the submodules */
1024        for (i = 0; i < needs_pushing.nr; i++) {
1025                const char *path = needs_pushing.items[i].string;
1026                fprintf(stderr, "Pushing submodule '%s'\n", path);
1027                if (!push_submodule(path, remote, refspec, refspec_nr,
1028                                    push_options, dry_run)) {
1029                        fprintf(stderr, "Unable to push submodule '%s'\n", path);
1030                        ret = 0;
1031                }
1032        }
1033
1034        string_list_clear(&needs_pushing, 0);
1035
1036        return ret;
1037}
1038
/*
 * for_each_ref() callback: append 'oid' to the struct oid_array passed in
 * 'data'.  The ref name and flags are not used.  Always returns 0.
 */
static int append_oid_to_array(const char *ref, const struct object_id *oid,
                               int flags, void *data)
{
        struct oid_array *tips = data;

        oid_array_append(tips, oid);

        return 0;
}
1046
1047void check_for_new_submodule_commits(struct object_id *oid)
1048{
1049        if (!initialized_fetch_ref_tips) {
1050                for_each_ref(append_oid_to_array, &ref_tips_before_fetch);
1051                initialized_fetch_ref_tips = 1;
1052        }
1053
1054        oid_array_append(&ref_tips_after_fetch, oid);
1055}
1056
1057static void calculate_changed_submodule_paths(void)
1058{
1059        struct argv_array argv = ARGV_ARRAY_INIT;
1060        struct string_list changed_submodules = STRING_LIST_INIT_DUP;
1061        const struct string_list_item *item;
1062
1063        /* No need to check if there are no submodules configured */
1064        if (!submodule_from_path(NULL, NULL))
1065                return;
1066
1067        argv_array_push(&argv, "--"); /* argv[0] program name */
1068        oid_array_for_each_unique(&ref_tips_after_fetch,
1069                                   append_oid_to_argv, &argv);
1070        argv_array_push(&argv, "--not");
1071        oid_array_for_each_unique(&ref_tips_before_fetch,
1072                                   append_oid_to_argv, &argv);
1073
1074        /*
1075         * Collect all submodules (whether checked out or not) for which new
1076         * commits have been recorded upstream in "changed_submodule_paths".
1077         */
1078        collect_changed_submodules(&changed_submodules, &argv);
1079
1080        for_each_string_list_item(item, &changed_submodules) {
1081                struct oid_array *commits = item->util;
1082                const char *path = item->string;
1083
1084                if (!submodule_has_commits(path, commits))
1085                        string_list_append(&changed_submodule_paths, path);
1086        }
1087
1088        free_submodules_oids(&changed_submodules);
1089        argv_array_clear(&argv);
1090        oid_array_clear(&ref_tips_before_fetch);
1091        oid_array_clear(&ref_tips_after_fetch);
1092        initialized_fetch_ref_tips = 0;
1093}
1094
1095int submodule_touches_in_range(struct object_id *excl_oid,
1096                               struct object_id *incl_oid)
1097{
1098        struct string_list subs = STRING_LIST_INIT_DUP;
1099        struct argv_array args = ARGV_ARRAY_INIT;
1100        int ret;
1101
1102        /* No need to check if there are no submodules configured */
1103        if (!submodule_from_path(NULL, NULL))
1104                return 0;
1105
1106        argv_array_push(&args, "--"); /* args[0] program name */
1107        argv_array_push(&args, oid_to_hex(incl_oid));
1108        argv_array_push(&args, "--not");
1109        argv_array_push(&args, oid_to_hex(excl_oid));
1110
1111        collect_changed_submodules(&subs, &args);
1112        ret = subs.nr;
1113
1114        argv_array_clear(&args);
1115
1116        free_submodules_oids(&subs);
1117        return ret;
1118}
1119
1120struct submodule_parallel_fetch {
1121        int count;
1122        struct argv_array args;
1123        const char *work_tree;
1124        const char *prefix;
1125        int command_line_option;
1126        int default_option;
1127        int quiet;
1128        int result;
1129};
1130#define SPF_INIT {0, ARGV_ARRAY_INIT, NULL, NULL, 0, 0, 0, 0}
1131
1132static int get_next_submodule(struct child_process *cp,
1133                              struct strbuf *err, void *data, void **task_cb)
1134{
1135        int ret = 0;
1136        struct submodule_parallel_fetch *spf = data;
1137
1138        for (; spf->count < active_nr; spf->count++) {
1139                struct strbuf submodule_path = STRBUF_INIT;
1140                struct strbuf submodule_git_dir = STRBUF_INIT;
1141                struct strbuf submodule_prefix = STRBUF_INIT;
1142                const struct cache_entry *ce = active_cache[spf->count];
1143                const char *git_dir, *default_argv;
1144                const struct submodule *submodule;
1145
1146                if (!S_ISGITLINK(ce->ce_mode))
1147                        continue;
1148
1149                submodule = submodule_from_path(&null_oid, ce->name);
1150
1151                default_argv = "yes";
1152                if (spf->command_line_option == RECURSE_SUBMODULES_DEFAULT) {
1153                        int fetch_recurse = RECURSE_SUBMODULES_NONE;
1154
1155                        if (submodule) {
1156                                char *key;
1157                                const char *value;
1158
1159                                fetch_recurse = submodule->fetch_recurse;
1160                                key = xstrfmt("submodule.%s.fetchRecurseSubmodules", submodule->name);
1161                                if (!repo_config_get_string_const(the_repository, key, &value)) {
1162                                        fetch_recurse = parse_fetch_recurse_submodules_arg(key, value);
1163                                }
1164                                free(key);
1165                        }
1166
1167                        if (fetch_recurse != RECURSE_SUBMODULES_NONE) {
1168                                if (fetch_recurse == RECURSE_SUBMODULES_OFF)
1169                                        continue;
1170                                if (fetch_recurse == RECURSE_SUBMODULES_ON_DEMAND) {
1171                                        if (!unsorted_string_list_lookup(&changed_submodule_paths, ce->name))
1172                                                continue;
1173                                        default_argv = "on-demand";
1174                                }
1175                        } else {
1176                                if (spf->default_option == RECURSE_SUBMODULES_OFF)
1177                                        continue;
1178                                if (spf->default_option == RECURSE_SUBMODULES_ON_DEMAND) {
1179                                        if (!unsorted_string_list_lookup(&changed_submodule_paths, ce->name))
1180                                                continue;
1181                                        default_argv = "on-demand";
1182                                }
1183                        }
1184                } else if (spf->command_line_option == RECURSE_SUBMODULES_ON_DEMAND) {
1185                        if (!unsorted_string_list_lookup(&changed_submodule_paths, ce->name))
1186                                continue;
1187                        default_argv = "on-demand";
1188                }
1189
1190                strbuf_addf(&submodule_path, "%s/%s", spf->work_tree, ce->name);
1191                strbuf_addf(&submodule_git_dir, "%s/.git", submodule_path.buf);
1192                strbuf_addf(&submodule_prefix, "%s%s/", spf->prefix, ce->name);
1193                git_dir = read_gitfile(submodule_git_dir.buf);
1194                if (!git_dir)
1195                        git_dir = submodule_git_dir.buf;
1196                if (is_directory(git_dir)) {
1197                        child_process_init(cp);
1198                        cp->dir = strbuf_detach(&submodule_path, NULL);
1199                        prepare_submodule_repo_env(&cp->env_array);
1200                        cp->git_cmd = 1;
1201                        if (!spf->quiet)
1202                                strbuf_addf(err, "Fetching submodule %s%s\n",
1203                                            spf->prefix, ce->name);
1204                        argv_array_init(&cp->args);
1205                        argv_array_pushv(&cp->args, spf->args.argv);
1206                        argv_array_push(&cp->args, default_argv);
1207                        argv_array_push(&cp->args, "--submodule-prefix");
1208                        argv_array_push(&cp->args, submodule_prefix.buf);
1209                        ret = 1;
1210                }
1211                strbuf_release(&submodule_path);
1212                strbuf_release(&submodule_git_dir);
1213                strbuf_release(&submodule_prefix);
1214                if (ret) {
1215                        spf->count++;
1216                        return 1;
1217                }
1218        }
1219        return 0;
1220}
1221
1222static int fetch_start_failure(struct strbuf *err,
1223                               void *cb, void *task_cb)
1224{
1225        struct submodule_parallel_fetch *spf = cb;
1226
1227        spf->result = 1;
1228
1229        return 0;
1230}
1231
1232static int fetch_finish(int retvalue, struct strbuf *err,
1233                        void *cb, void *task_cb)
1234{
1235        struct submodule_parallel_fetch *spf = cb;
1236
1237        if (retvalue)
1238                spf->result = 1;
1239
1240        return 0;
1241}
1242
1243int fetch_populated_submodules(const struct argv_array *options,
1244                               const char *prefix, int command_line_option,
1245                               int default_option,
1246                               int quiet, int max_parallel_jobs)
1247{
1248        int i;
1249        struct submodule_parallel_fetch spf = SPF_INIT;
1250
1251        spf.work_tree = get_git_work_tree();
1252        spf.command_line_option = command_line_option;
1253        spf.default_option = default_option;
1254        spf.quiet = quiet;
1255        spf.prefix = prefix;
1256
1257        if (!spf.work_tree)
1258                goto out;
1259
1260        if (read_cache() < 0)
1261                die("index file corrupt");
1262
1263        argv_array_push(&spf.args, "fetch");
1264        for (i = 0; i < options->argc; i++)
1265                argv_array_push(&spf.args, options->argv[i]);
1266        argv_array_push(&spf.args, "--recurse-submodules-default");
1267        /* default value, "--submodule-prefix" and its value are added later */
1268
1269        calculate_changed_submodule_paths();
1270        run_processes_parallel(max_parallel_jobs,
1271                               get_next_submodule,
1272                               fetch_start_failure,
1273                               fetch_finish,
1274                               &spf);
1275
1276        argv_array_clear(&spf.args);
1277out:
1278        string_list_clear(&changed_submodule_paths, 1);
1279        return spf.result;
1280}
1281
1282unsigned is_submodule_modified(const char *path, int ignore_untracked)
1283{
1284        struct child_process cp = CHILD_PROCESS_INIT;
1285        struct strbuf buf = STRBUF_INIT;
1286        FILE *fp;
1287        unsigned dirty_submodule = 0;
1288        const char *git_dir;
1289        int ignore_cp_exit_code = 0;
1290
1291        strbuf_addf(&buf, "%s/.git", path);
1292        git_dir = read_gitfile(buf.buf);
1293        if (!git_dir)
1294                git_dir = buf.buf;
1295        if (!is_git_directory(git_dir)) {
1296                if (is_directory(git_dir))
1297                        die(_("'%s' not recognized as a git repository"), git_dir);
1298                strbuf_release(&buf);
1299                /* The submodule is not checked out, so it is not modified */
1300                return 0;
1301        }
1302        strbuf_reset(&buf);
1303
1304        argv_array_pushl(&cp.args, "status", "--porcelain=2", NULL);
1305        if (ignore_untracked)
1306                argv_array_push(&cp.args, "-uno");
1307
1308        prepare_submodule_repo_env(&cp.env_array);
1309        cp.git_cmd = 1;
1310        cp.no_stdin = 1;
1311        cp.out = -1;
1312        cp.dir = path;
1313        if (start_command(&cp))
1314                die("Could not run 'git status --porcelain=2' in submodule %s", path);
1315
1316        fp = xfdopen(cp.out, "r");
1317        while (strbuf_getwholeline(&buf, fp, '\n') != EOF) {
1318                /* regular untracked files */
1319                if (buf.buf[0] == '?')
1320                        dirty_submodule |= DIRTY_SUBMODULE_UNTRACKED;
1321
1322                if (buf.buf[0] == 'u' ||
1323                    buf.buf[0] == '1' ||
1324                    buf.buf[0] == '2') {
1325                        /* T = line type, XY = status, SSSS = submodule state */
1326                        if (buf.len < strlen("T XY SSSS"))
1327                                die("BUG: invalid status --porcelain=2 line %s",
1328                                    buf.buf);
1329
1330                        if (buf.buf[5] == 'S' && buf.buf[8] == 'U')
1331                                /* nested untracked file */
1332                                dirty_submodule |= DIRTY_SUBMODULE_UNTRACKED;
1333
1334                        if (buf.buf[0] == 'u' ||
1335                            buf.buf[0] == '2' ||
1336                            memcmp(buf.buf + 5, "S..U", 4))
1337                                /* other change */
1338                                dirty_submodule |= DIRTY_SUBMODULE_MODIFIED;
1339                }
1340
1341                if ((dirty_submodule & DIRTY_SUBMODULE_MODIFIED) &&
1342                    ((dirty_submodule & DIRTY_SUBMODULE_UNTRACKED) ||
1343                     ignore_untracked)) {
1344                        /*
1345                         * We're not interested in any further information from
1346                         * the child any more, neither output nor its exit code.
1347                         */
1348                        ignore_cp_exit_code = 1;
1349                        break;
1350                }
1351        }
1352        fclose(fp);
1353
1354        if (finish_command(&cp) && !ignore_cp_exit_code)
1355                die("'git status --porcelain=2' failed in submodule %s", path);
1356
1357        strbuf_release(&buf);
1358        return dirty_submodule;
1359}
1360
1361int submodule_uses_gitfile(const char *path)
1362{
1363        struct child_process cp = CHILD_PROCESS_INIT;
1364        const char *argv[] = {
1365                "submodule",
1366                "foreach",
1367                "--quiet",
1368                "--recursive",
1369                "test -f .git",
1370                NULL,
1371        };
1372        struct strbuf buf = STRBUF_INIT;
1373        const char *git_dir;
1374
1375        strbuf_addf(&buf, "%s/.git", path);
1376        git_dir = read_gitfile(buf.buf);
1377        if (!git_dir) {
1378                strbuf_release(&buf);
1379                return 0;
1380        }
1381        strbuf_release(&buf);
1382
1383        /* Now test that all nested submodules use a gitfile too */
1384        cp.argv = argv;
1385        prepare_submodule_repo_env(&cp.env_array);
1386        cp.git_cmd = 1;
1387        cp.no_stdin = 1;
1388        cp.no_stderr = 1;
1389        cp.no_stdout = 1;
1390        cp.dir = path;
1391        if (run_command(&cp))
1392                return 0;
1393
1394        return 1;
1395}
1396
1397/*
1398 * Check if it is a bad idea to remove a submodule, i.e. if we'd lose data
1399 * when doing so.
1400 *
1401 * Return 1 if we'd lose data, return 0 if the removal is fine,
1402 * and negative values for errors.
1403 */
1404int bad_to_remove_submodule(const char *path, unsigned flags)
1405{
1406        ssize_t len;
1407        struct child_process cp = CHILD_PROCESS_INIT;
1408        struct strbuf buf = STRBUF_INIT;
1409        int ret = 0;
1410
1411        if (!file_exists(path) || is_empty_dir(path))
1412                return 0;
1413
1414        if (!submodule_uses_gitfile(path))
1415                return 1;
1416
1417        argv_array_pushl(&cp.args, "status", "--porcelain",
1418                                   "--ignore-submodules=none", NULL);
1419
1420        if (flags & SUBMODULE_REMOVAL_IGNORE_UNTRACKED)
1421                argv_array_push(&cp.args, "-uno");
1422        else
1423                argv_array_push(&cp.args, "-uall");
1424
1425        if (!(flags & SUBMODULE_REMOVAL_IGNORE_IGNORED_UNTRACKED))
1426                argv_array_push(&cp.args, "--ignored");
1427
1428        prepare_submodule_repo_env(&cp.env_array);
1429        cp.git_cmd = 1;
1430        cp.no_stdin = 1;
1431        cp.out = -1;
1432        cp.dir = path;
1433        if (start_command(&cp)) {
1434                if (flags & SUBMODULE_REMOVAL_DIE_ON_ERROR)
1435                        die(_("could not start 'git status' in submodule '%s'"),
1436                                path);
1437                ret = -1;
1438                goto out;
1439        }
1440
1441        len = strbuf_read(&buf, cp.out, 1024);
1442        if (len > 2)
1443                ret = 1;
1444        close(cp.out);
1445
1446        if (finish_command(&cp)) {
1447                if (flags & SUBMODULE_REMOVAL_DIE_ON_ERROR)
1448                        die(_("could not run 'git status' in submodule '%s'"),
1449                                path);
1450                ret = -1;
1451        }
1452out:
1453        strbuf_release(&buf);
1454        return ret;
1455}
1456
/*
 * Like get_super_prefix(), but returns "" instead of NULL so the result
 * can be used directly as a "%s" argument.
 */
static const char *get_super_prefix_or_empty(void)
{
        const char *prefix = get_super_prefix();

        return prefix ? prefix : "";
}
1464
1465static int submodule_has_dirty_index(const struct submodule *sub)
1466{
1467        struct child_process cp = CHILD_PROCESS_INIT;
1468
1469        prepare_submodule_repo_env(&cp.env_array);
1470
1471        cp.git_cmd = 1;
1472        argv_array_pushl(&cp.args, "diff-index", "--quiet",
1473                                   "--cached", "HEAD", NULL);
1474        cp.no_stdin = 1;
1475        cp.no_stdout = 1;
1476        cp.dir = sub->path;
1477        if (start_command(&cp))
1478                die("could not recurse into submodule '%s'", sub->path);
1479
1480        return finish_command(&cp);
1481}
1482
1483static void submodule_reset_index(const char *path)
1484{
1485        struct child_process cp = CHILD_PROCESS_INIT;
1486        prepare_submodule_repo_env(&cp.env_array);
1487
1488        cp.git_cmd = 1;
1489        cp.no_stdin = 1;
1490        cp.dir = path;
1491
1492        argv_array_pushf(&cp.args, "--super-prefix=%s%s/",
1493                                   get_super_prefix_or_empty(), path);
1494        argv_array_pushl(&cp.args, "read-tree", "-u", "--reset", NULL);
1495
1496        argv_array_push(&cp.args, EMPTY_TREE_SHA1_HEX);
1497
1498        if (run_command(&cp))
1499                die("could not reset submodule index");
1500}
1501
1502/**
1503 * Moves a submodule at a given path from a given head to another new head.
1504 * For edge cases (a submodule coming into existence or removing a submodule)
1505 * pass NULL for old or new respectively.
1506 */
1507int submodule_move_head(const char *path,
1508                         const char *old,
1509                         const char *new,
1510                         unsigned flags)
1511{
1512        int ret = 0;
1513        struct child_process cp = CHILD_PROCESS_INIT;
1514        const struct submodule *sub;
1515        int *error_code_ptr, error_code;
1516
1517        if (!is_submodule_active(the_repository, path))
1518                return 0;
1519
1520        if (flags & SUBMODULE_MOVE_HEAD_FORCE)
1521                /*
1522                 * Pass non NULL pointer to is_submodule_populated_gently
1523                 * to prevent die()-ing. We'll use connect_work_tree_and_git_dir
1524                 * to fixup the submodule in the force case later.
1525                 */
1526                error_code_ptr = &error_code;
1527        else
1528                error_code_ptr = NULL;
1529
1530        if (old && !is_submodule_populated_gently(path, error_code_ptr))
1531                return 0;
1532
1533        sub = submodule_from_path(&null_oid, path);
1534
1535        if (!sub)
1536                die("BUG: could not get submodule information for '%s'", path);
1537
1538        if (old && !(flags & SUBMODULE_MOVE_HEAD_FORCE)) {
1539                /* Check if the submodule has a dirty index. */
1540                if (submodule_has_dirty_index(sub))
1541                        return error(_("submodule '%s' has dirty index"), path);
1542        }
1543
1544        if (!(flags & SUBMODULE_MOVE_HEAD_DRY_RUN)) {
1545                if (old) {
1546                        if (!submodule_uses_gitfile(path))
1547                                absorb_git_dir_into_superproject("", path,
1548                                        ABSORB_GITDIR_RECURSE_SUBMODULES);
1549                } else {
1550                        char *gitdir = xstrfmt("%s/modules/%s",
1551                                    get_git_common_dir(), sub->name);
1552                        connect_work_tree_and_git_dir(path, gitdir);
1553                        free(gitdir);
1554
1555                        /* make sure the index is clean as well */
1556                        submodule_reset_index(path);
1557                }
1558
1559                if (old && (flags & SUBMODULE_MOVE_HEAD_FORCE)) {
1560                        char *gitdir = xstrfmt("%s/modules/%s",
1561                                    get_git_common_dir(), sub->name);
1562                        connect_work_tree_and_git_dir(path, gitdir);
1563                        free(gitdir);
1564                }
1565        }
1566
1567        prepare_submodule_repo_env(&cp.env_array);
1568
1569        cp.git_cmd = 1;
1570        cp.no_stdin = 1;
1571        cp.dir = path;
1572
1573        argv_array_pushf(&cp.args, "--super-prefix=%s%s/",
1574                        get_super_prefix_or_empty(), path);
1575        argv_array_pushl(&cp.args, "read-tree", "--recurse-submodules", NULL);
1576
1577        if (flags & SUBMODULE_MOVE_HEAD_DRY_RUN)
1578                argv_array_push(&cp.args, "-n");
1579        else
1580                argv_array_push(&cp.args, "-u");
1581
1582        if (flags & SUBMODULE_MOVE_HEAD_FORCE)
1583                argv_array_push(&cp.args, "--reset");
1584        else
1585                argv_array_push(&cp.args, "-m");
1586
1587        argv_array_push(&cp.args, old ? old : EMPTY_TREE_SHA1_HEX);
1588        argv_array_push(&cp.args, new ? new : EMPTY_TREE_SHA1_HEX);
1589
1590        if (run_command(&cp)) {
1591                ret = -1;
1592                goto out;
1593        }
1594
1595        if (!(flags & SUBMODULE_MOVE_HEAD_DRY_RUN)) {
1596                if (new) {
1597                        child_process_init(&cp);
1598                        /* also set the HEAD accordingly */
1599                        cp.git_cmd = 1;
1600                        cp.no_stdin = 1;
1601                        cp.dir = path;
1602
1603                        prepare_submodule_repo_env(&cp.env_array);
1604                        argv_array_pushl(&cp.args, "update-ref", "HEAD", new, NULL);
1605
1606                        if (run_command(&cp)) {
1607                                ret = -1;
1608                                goto out;
1609                        }
1610                } else {
1611                        struct strbuf sb = STRBUF_INIT;
1612
1613                        strbuf_addf(&sb, "%s/.git", path);
1614                        unlink_or_warn(sb.buf);
1615                        strbuf_release(&sb);
1616
1617                        if (is_empty_dir(path))
1618                                rmdir_or_warn(path);
1619                }
1620        }
1621out:
1622        return ret;
1623}
1624
1625static int find_first_merges(struct object_array *result, const char *path,
1626                struct commit *a, struct commit *b)
1627{
1628        int i, j;
1629        struct object_array merges = OBJECT_ARRAY_INIT;
1630        struct commit *commit;
1631        int contains_another;
1632
1633        char merged_revision[42];
1634        const char *rev_args[] = { "rev-list", "--merges", "--ancestry-path",
1635                                   "--all", merged_revision, NULL };
1636        struct rev_info revs;
1637        struct setup_revision_opt rev_opts;
1638
1639        memset(result, 0, sizeof(struct object_array));
1640        memset(&rev_opts, 0, sizeof(rev_opts));
1641
1642        /* get all revisions that merge commit a */
1643        xsnprintf(merged_revision, sizeof(merged_revision), "^%s",
1644                        oid_to_hex(&a->object.oid));
1645        init_revisions(&revs, NULL);
1646        rev_opts.submodule = path;
1647        setup_revisions(ARRAY_SIZE(rev_args)-1, rev_args, &revs, &rev_opts);
1648
1649        /* save all revisions from the above list that contain b */
1650        if (prepare_revision_walk(&revs))
1651                die("revision walk setup failed");
1652        while ((commit = get_revision(&revs)) != NULL) {
1653                struct object *o = &(commit->object);
1654                if (in_merge_bases(b, commit))
1655                        add_object_array(o, NULL, &merges);
1656        }
1657        reset_revision_walk();
1658
1659        /* Now we've got all merges that contain a and b. Prune all
1660         * merges that contain another found merge and save them in
1661         * result.
1662         */
1663        for (i = 0; i < merges.nr; i++) {
1664                struct commit *m1 = (struct commit *) merges.objects[i].item;
1665
1666                contains_another = 0;
1667                for (j = 0; j < merges.nr; j++) {
1668                        struct commit *m2 = (struct commit *) merges.objects[j].item;
1669                        if (i != j && in_merge_bases(m2, m1)) {
1670                                contains_another = 1;
1671                                break;
1672                        }
1673                }
1674
1675                if (!contains_another)
1676                        add_object_array(merges.objects[i].item, NULL, result);
1677        }
1678
1679        free(merges.objects);
1680        return result->nr;
1681}
1682
1683static void print_commit(struct commit *commit)
1684{
1685        struct strbuf sb = STRBUF_INIT;
1686        struct pretty_print_context ctx = {0};
1687        ctx.date_mode.type = DATE_NORMAL;
1688        format_commit_message(commit, " %h: %m %s", &sb, &ctx);
1689        fprintf(stderr, "%s\n", sb.buf);
1690        strbuf_release(&sb);
1691}
1692
/*
 * Warn that merging the submodule at `path` failed; `msg` states the reason.
 *
 * Expands to a single expression with no trailing semicolon: the caller
 * writes the ';', which keeps the macro safe inside an unbraced if/else.
 */
#define MERGE_WARNING(path, msg) \
        warning("Failed to merge submodule %s (%s)", (path), (msg))
1695
1696int merge_submodule(struct object_id *result, const char *path,
1697                    const struct object_id *base, const struct object_id *a,
1698                    const struct object_id *b, int search)
1699{
1700        struct commit *commit_base, *commit_a, *commit_b;
1701        int parent_count;
1702        struct object_array merges;
1703
1704        int i;
1705
1706        /* store a in result in case we fail */
1707        oidcpy(result, a);
1708
1709        /* we can not handle deletion conflicts */
1710        if (is_null_oid(base))
1711                return 0;
1712        if (is_null_oid(a))
1713                return 0;
1714        if (is_null_oid(b))
1715                return 0;
1716
1717        if (add_submodule_odb(path)) {
1718                MERGE_WARNING(path, "not checked out");
1719                return 0;
1720        }
1721
1722        if (!(commit_base = lookup_commit_reference(base)) ||
1723            !(commit_a = lookup_commit_reference(a)) ||
1724            !(commit_b = lookup_commit_reference(b))) {
1725                MERGE_WARNING(path, "commits not present");
1726                return 0;
1727        }
1728
1729        /* check whether both changes are forward */
1730        if (!in_merge_bases(commit_base, commit_a) ||
1731            !in_merge_bases(commit_base, commit_b)) {
1732                MERGE_WARNING(path, "commits don't follow merge-base");
1733                return 0;
1734        }
1735
1736        /* Case #1: a is contained in b or vice versa */
1737        if (in_merge_bases(commit_a, commit_b)) {
1738                oidcpy(result, b);
1739                return 1;
1740        }
1741        if (in_merge_bases(commit_b, commit_a)) {
1742                oidcpy(result, a);
1743                return 1;
1744        }
1745
1746        /*
1747         * Case #2: There are one or more merges that contain a and b in
1748         * the submodule. If there is only one, then present it as a
1749         * suggestion to the user, but leave it marked unmerged so the
1750         * user needs to confirm the resolution.
1751         */
1752
1753        /* Skip the search if makes no sense to the calling context.  */
1754        if (!search)
1755                return 0;
1756
1757        /* find commit which merges them */
1758        parent_count = find_first_merges(&merges, path, commit_a, commit_b);
1759        switch (parent_count) {
1760        case 0:
1761                MERGE_WARNING(path, "merge following commits not found");
1762                break;
1763
1764        case 1:
1765                MERGE_WARNING(path, "not fast-forward");
1766                fprintf(stderr, "Found a possible merge resolution "
1767                                "for the submodule:\n");
1768                print_commit((struct commit *) merges.objects[0].item);
1769                fprintf(stderr,
1770                        "If this is correct simply add it to the index "
1771                        "for example\n"
1772                        "by using:\n\n"
1773                        "  git update-index --cacheinfo 160000 %s \"%s\"\n\n"
1774                        "which will accept this suggestion.\n",
1775                        oid_to_hex(&merges.objects[0].item->oid), path);
1776                break;
1777
1778        default:
1779                MERGE_WARNING(path, "multiple merges found");
1780                for (i = 0; i < merges.nr; i++)
1781                        print_commit((struct commit *) merges.objects[i].item);
1782        }
1783
1784        free(merges.objects);
1785        return 0;
1786}
1787
1788/*
1789 * Embeds a single submodules git directory into the superprojects git dir,
1790 * non recursively.
1791 */
1792static void relocate_single_git_dir_into_superproject(const char *prefix,
1793                                                      const char *path)
1794{
1795        char *old_git_dir = NULL, *real_old_git_dir = NULL, *real_new_git_dir = NULL;
1796        const char *new_git_dir;
1797        const struct submodule *sub;
1798
1799        if (submodule_uses_worktrees(path))
1800                die(_("relocate_gitdir for submodule '%s' with "
1801                      "more than one worktree not supported"), path);
1802
1803        old_git_dir = xstrfmt("%s/.git", path);
1804        if (read_gitfile(old_git_dir))
1805                /* If it is an actual gitfile, it doesn't need migration. */
1806                return;
1807
1808        real_old_git_dir = real_pathdup(old_git_dir, 1);
1809
1810        sub = submodule_from_path(&null_oid, path);
1811        if (!sub)
1812                die(_("could not lookup name for submodule '%s'"), path);
1813
1814        new_git_dir = git_path("modules/%s", sub->name);
1815        if (safe_create_leading_directories_const(new_git_dir) < 0)
1816                die(_("could not create directory '%s'"), new_git_dir);
1817        real_new_git_dir = real_pathdup(new_git_dir, 1);
1818
1819        fprintf(stderr, _("Migrating git directory of '%s%s' from\n'%s' to\n'%s'\n"),
1820                get_super_prefix_or_empty(), path,
1821                real_old_git_dir, real_new_git_dir);
1822
1823        relocate_gitdir(path, real_old_git_dir, real_new_git_dir);
1824
1825        free(old_git_dir);
1826        free(real_old_git_dir);
1827        free(real_new_git_dir);
1828}
1829
1830/*
1831 * Migrate the git directory of the submodule given by path from
1832 * having its git directory within the working tree to the git dir nested
1833 * in its superprojects git dir under modules/.
1834 */
1835void absorb_git_dir_into_superproject(const char *prefix,
1836                                      const char *path,
1837                                      unsigned flags)
1838{
1839        int err_code;
1840        const char *sub_git_dir;
1841        struct strbuf gitdir = STRBUF_INIT;
1842        strbuf_addf(&gitdir, "%s/.git", path);
1843        sub_git_dir = resolve_gitdir_gently(gitdir.buf, &err_code);
1844
1845        /* Not populated? */
1846        if (!sub_git_dir) {
1847                const struct submodule *sub;
1848
1849                if (err_code == READ_GITFILE_ERR_STAT_FAILED) {
1850                        /* unpopulated as expected */
1851                        strbuf_release(&gitdir);
1852                        return;
1853                }
1854
1855                if (err_code != READ_GITFILE_ERR_NOT_A_REPO)
1856                        /* We don't know what broke here. */
1857                        read_gitfile_error_die(err_code, path, NULL);
1858
1859                /*
1860                * Maybe populated, but no git directory was found?
1861                * This can happen if the superproject is a submodule
1862                * itself and was just absorbed. The absorption of the
1863                * superproject did not rewrite the git file links yet,
1864                * fix it now.
1865                */
1866                sub = submodule_from_path(&null_oid, path);
1867                if (!sub)
1868                        die(_("could not lookup name for submodule '%s'"), path);
1869                connect_work_tree_and_git_dir(path,
1870                        git_path("modules/%s", sub->name));
1871        } else {
1872                /* Is it already absorbed into the superprojects git dir? */
1873                char *real_sub_git_dir = real_pathdup(sub_git_dir, 1);
1874                char *real_common_git_dir = real_pathdup(get_git_common_dir(), 1);
1875
1876                if (!starts_with(real_sub_git_dir, real_common_git_dir))
1877                        relocate_single_git_dir_into_superproject(prefix, path);
1878
1879                free(real_sub_git_dir);
1880                free(real_common_git_dir);
1881        }
1882        strbuf_release(&gitdir);
1883
1884        if (flags & ABSORB_GITDIR_RECURSE_SUBMODULES) {
1885                struct child_process cp = CHILD_PROCESS_INIT;
1886                struct strbuf sb = STRBUF_INIT;
1887
1888                if (flags & ~ABSORB_GITDIR_RECURSE_SUBMODULES)
1889                        die("BUG: we don't know how to pass the flags down?");
1890
1891                strbuf_addstr(&sb, get_super_prefix_or_empty());
1892                strbuf_addstr(&sb, path);
1893                strbuf_addch(&sb, '/');
1894
1895                cp.dir = path;
1896                cp.git_cmd = 1;
1897                cp.no_stdin = 1;
1898                argv_array_pushl(&cp.args, "--super-prefix", sb.buf,
1899                                           "submodule--helper",
1900                                           "absorb-git-dirs", NULL);
1901                prepare_submodule_repo_env(&cp.env_array);
1902                if (run_command(&cp))
1903                        die(_("could not recurse into submodule '%s'"), path);
1904
1905                strbuf_release(&sb);
1906        }
1907}
1908
1909const char *get_superproject_working_tree(void)
1910{
1911        struct child_process cp = CHILD_PROCESS_INIT;
1912        struct strbuf sb = STRBUF_INIT;
1913        const char *one_up = real_path_if_valid("../");
1914        const char *cwd = xgetcwd();
1915        const char *ret = NULL;
1916        const char *subpath;
1917        int code;
1918        ssize_t len;
1919
1920        if (!is_inside_work_tree())
1921                /*
1922                 * FIXME:
1923                 * We might have a superproject, but it is harder
1924                 * to determine.
1925                 */
1926                return NULL;
1927
1928        if (!one_up)
1929                return NULL;
1930
1931        subpath = relative_path(cwd, one_up, &sb);
1932
1933        prepare_submodule_repo_env(&cp.env_array);
1934        argv_array_pop(&cp.env_array);
1935
1936        argv_array_pushl(&cp.args, "--literal-pathspecs", "-C", "..",
1937                        "ls-files", "-z", "--stage", "--full-name", "--",
1938                        subpath, NULL);
1939        strbuf_reset(&sb);
1940
1941        cp.no_stdin = 1;
1942        cp.no_stderr = 1;
1943        cp.out = -1;
1944        cp.git_cmd = 1;
1945
1946        if (start_command(&cp))
1947                die(_("could not start ls-files in .."));
1948
1949        len = strbuf_read(&sb, cp.out, PATH_MAX);
1950        close(cp.out);
1951
1952        if (starts_with(sb.buf, "160000")) {
1953                int super_sub_len;
1954                int cwd_len = strlen(cwd);
1955                char *super_sub, *super_wt;
1956
1957                /*
1958                 * There is a superproject having this repo as a submodule.
1959                 * The format is <mode> SP <hash> SP <stage> TAB <full name> \0,
1960                 * We're only interested in the name after the tab.
1961                 */
1962                super_sub = strchr(sb.buf, '\t') + 1;
1963                super_sub_len = sb.buf + sb.len - super_sub - 1;
1964
1965                if (super_sub_len > cwd_len ||
1966                    strcmp(&cwd[cwd_len - super_sub_len], super_sub))
1967                        die (_("BUG: returned path string doesn't match cwd?"));
1968
1969                super_wt = xstrdup(cwd);
1970                super_wt[cwd_len - super_sub_len] = '\0';
1971
1972                ret = real_path(super_wt);
1973                free(super_wt);
1974        }
1975        strbuf_release(&sb);
1976
1977        code = finish_command(&cp);
1978
1979        if (code == 128)
1980                /* '../' is not a git repository */
1981                return NULL;
1982        if (code == 0 && len == 0)
1983                /* There is an unrelated git repository at '../' */
1984                return NULL;
1985        if (code)
1986                die(_("ls-tree returned unexpected return code %d"), code);
1987
1988        return ret;
1989}
1990
1991int submodule_to_gitdir(struct strbuf *buf, const char *submodule)
1992{
1993        const struct submodule *sub;
1994        const char *git_dir;
1995        int ret = 0;
1996
1997        strbuf_reset(buf);
1998        strbuf_addstr(buf, submodule);
1999        strbuf_complete(buf, '/');
2000        strbuf_addstr(buf, ".git");
2001
2002        git_dir = read_gitfile(buf->buf);
2003        if (git_dir) {
2004                strbuf_reset(buf);
2005                strbuf_addstr(buf, git_dir);
2006        }
2007        if (!is_git_directory(buf->buf)) {
2008                sub = submodule_from_path(&null_oid, submodule);
2009                if (!sub) {
2010                        ret = -1;
2011                        goto cleanup;
2012                }
2013                strbuf_reset(buf);
2014                strbuf_git_path(buf, "%s/%s", "modules", sub->name);
2015        }
2016
2017cleanup:
2018        return ret;
2019}