8abff90d97133dff451d80a84c287071c1102d60
   1#!/usr/bin/env perl
   2# Copyright (C) 2006, Eric Wong <normalperson@yhbt.net>
   3# License: GPL v2 or later
   4use warnings;
   5use strict;
   6use vars qw/    $AUTHOR $VERSION
   7                $SVN_URL
   8                $GIT_SVN_INDEX $GIT_SVN
   9                $GIT_DIR $GIT_SVN_DIR $REVDB/;
  10$AUTHOR = 'Eric Wong <normalperson@yhbt.net>';
  11$VERSION = '@@GIT_VERSION@@';
  12
  13use Cwd qw/abs_path/;
  14$GIT_DIR = abs_path($ENV{GIT_DIR} || '.git');
  15$ENV{GIT_DIR} = $GIT_DIR;
  16
  17my $LC_ALL = $ENV{LC_ALL};
  18my $TZ = $ENV{TZ};
  19# make sure the svn binary gives consistent output between locales and TZs:
  20$ENV{TZ} = 'UTC';
  21$ENV{LC_ALL} = 'C';
  22$| = 1; # unbuffer STDOUT
  23
  24# properties that we do not log:
  25my %SKIP = ( 'svn:wc:ra_dav:version-url' => 1,
  26             'svn:special' => 1,
  27             'svn:executable' => 1,
  28             'svn:entry:committed-rev' => 1,
  29             'svn:entry:last-author' => 1,
  30             'svn:entry:uuid' => 1,
  31             'svn:entry:committed-date' => 1,
  32);
  33
  34sub fatal (@) { print STDERR @_; exit 1 }
  35require SVN::Core; # use()-ing this causes segfaults for me... *shrug*
  36require SVN::Ra;
  37require SVN::Delta;
  38if ($SVN::Core::VERSION lt '1.1.0') {
  39        fatal "Need SVN::Core 1.1.0 or better (got $SVN::Core::VERSION)\n";
  40}
  41push @Git::SVN::Ra::ISA, 'SVN::Ra';
  42push @SVN::Git::Editor::ISA, 'SVN::Delta::Editor';
  43push @SVN::Git::Fetcher::ISA, 'SVN::Delta::Editor';
  44use Carp qw/croak/;
  45use IO::File qw//;
  46use File::Basename qw/dirname basename/;
  47use File::Path qw/mkpath/;
  48use Getopt::Long qw/:config gnu_getopt no_ignore_case auto_abbrev pass_through/;
  49use POSIX qw/strftime/;
  50use IPC::Open3;
  51use Memoize;
  52use Git;
  53memoize('revisions_eq');
  54memoize('cmt_metadata');
  55memoize('get_commit_time');
  56
  57BEGIN {
  58        my $s;
  59        foreach (qw/command command_oneline command_noisy command_output_pipe
  60                    command_input_pipe command_close_pipe/) {
  61                $s .= "*SVN::Git::Editor::$_ = *SVN::Git::Fetcher::$_ = ".
  62                      "*$_ = *Git::$_; ";
  63        }
  64        eval $s;
  65}
  66
  67my ($SVN);
  68
  69my $_optimize_commits = 1 unless $ENV{GIT_SVN_NO_OPTIMIZE_COMMITS};
  70my $sha1 = qr/[a-f\d]{40}/;
  71my $sha1_short = qr/[a-f\d]{4,40}/;
  72my $_esc_color = qr/(?:\033\[(?:(?:\d+;)*\d*)?m)*/;
  73my ($_revision,$_stdin,$_help,$_rmdir,$_edit,
  74        $_find_copies_harder, $_l, $_cp_similarity, $_cp_remote,
  75        $_repack, $_repack_nr, $_repack_flags, $_q,
  76        $_message, $_file, $_no_metadata,
  77        $_template, $_shared, $_no_default_regex, $_no_graft_copy,
  78        $_limit, $_verbose, $_incremental, $_oneline, $_l_fmt, $_show_commit,
  79        $_version, $_upgrade, $_authors, $_branch_all_refs, @_opt_m,
  80        $_merge, $_strategy, $_dry_run, $_ignore_nodate, $_non_recursive,
  81        $_pager, $_color, $_prefix);
  82my (@_branch_from, %tree_map, %users, %rusers);
  83my @repo_path_split_cache;
  84use vars qw/$_follow_parent/;
  85
  86my %fc_opts = ( 'branch|b=s' => \@_branch_from,
  87                'follow-parent|follow' => \$_follow_parent,
  88                'branch-all-refs|B' => \$_branch_all_refs,
  89                'authors-file|A=s' => \$_authors,
  90                'repack:i' => \$_repack,
  91                'no-metadata' => \$_no_metadata,
  92                'quiet|q' => \$_q,
  93                'username=s' => \$Git::SVN::Prompt::_username,
  94                'config-dir=s' => \$Git::SVN::Ra::config_dir,
  95                'no-auth-cache' => \$Git::SVN::Prompt::_no_auth_cache,
  96                'ignore-nodate' => \$_ignore_nodate,
  97                'repack-flags|repack-args|repack-opts=s' => \$_repack_flags);
  98
  99my ($_trunk, $_tags, $_branches);
 100my %multi_opts = ( 'trunk|T=s' => \$_trunk,
 101                'tags|t=s' => \$_tags,
 102                'branches|b=s' => \$_branches );
 103my %init_opts = ( 'template=s' => \$_template, 'shared' => \$_shared );
 104my %cmt_opts = ( 'edit|e' => \$_edit,
 105                'rmdir' => \$_rmdir,
 106                'find-copies-harder' => \$_find_copies_harder,
 107                'l=i' => \$_l,
 108                'copy-similarity|C=i'=> \$_cp_similarity
 109);
 110
 111my %cmd = (
 112        fetch => [ \&cmd_fetch, "Download new revisions from SVN",
 113                        { 'revision|r=s' => \$_revision, %fc_opts } ],
 114        init => [ \&init, "Initialize a repo for tracking" .
 115                          " (requires URL argument)",
 116                          \%init_opts ],
 117        dcommit => [ \&dcommit, 'Commit several diffs to merge with upstream',
 118                        { 'merge|m|M' => \$_merge,
 119                          'strategy|s=s' => \$_strategy,
 120                          'dry-run|n' => \$_dry_run,
 121                        %cmt_opts, %fc_opts } ],
 122        'set-tree' => [ \&commit, "Set an SVN repository to a git tree-ish",
 123                        {       'stdin|' => \$_stdin, %cmt_opts, %fc_opts, } ],
 124        'show-ignore' => [ \&show_ignore, "Show svn:ignore listings",
 125                        { 'revision|r=i' => \$_revision } ],
 126        rebuild => [ \&rebuild, "Rebuild git-svn metadata (after git clone)",
 127                        { 'copy-remote|remote=s' => \$_cp_remote,
 128                          'upgrade' => \$_upgrade } ],
 129        'graft-branches' => [ \&graft_branches,
 130                        'Detect merges/branches from already imported history',
 131                        { 'merge-rx|m' => \@_opt_m,
 132                          'branch|b=s' => \@_branch_from,
 133                          'branch-all-refs|B' => \$_branch_all_refs,
 134                          'no-default-regex' => \$_no_default_regex,
 135                          'no-graft-copy' => \$_no_graft_copy } ],
 136        'multi-init' => [ \&multi_init,
 137                        'Initialize multiple trees (like git-svnimport)',
 138                        { %multi_opts, %init_opts,
 139                         'revision|r=i' => \$_revision,
 140                         'username=s' => \$Git::SVN::Prompt::_username,
 141                         'config-dir=s' => \$Git::SVN::Ra::config_dir,
 142                         'no-auth-cache' => \$Git::SVN::Prompt::_no_auth_cache,
 143                         'prefix=s' => \$_prefix,
 144                        } ],
 145        'multi-fetch' => [ \&multi_fetch,
 146                        'Fetch multiple trees (like git-svnimport)',
 147                        \%fc_opts ],
 148        'log' => [ \&show_log, 'Show commit logs',
 149                        { 'limit=i' => \$_limit,
 150                          'revision|r=s' => \$_revision,
 151                          'verbose|v' => \$_verbose,
 152                          'incremental' => \$_incremental,
 153                          'oneline' => \$_oneline,
 154                          'show-commit' => \$_show_commit,
 155                          'non-recursive' => \$_non_recursive,
 156                          'authors-file|A=s' => \$_authors,
 157                          'color' => \$_color,
 158                          'pager=s' => \$_pager,
 159                        } ],
 160        'commit-diff' => [ \&commit_diff, 'Commit a diff between two trees',
 161                        { 'message|m=s' => \$_message,
 162                          'file|F=s' => \$_file,
 163                          'revision|r=s' => \$_revision,
 164                        %cmt_opts } ],
 165);
 166
 167my $cmd;
 168for (my $i = 0; $i < @ARGV; $i++) {
 169        if (defined $cmd{$ARGV[$i]}) {
 170                $cmd = $ARGV[$i];
 171                splice @ARGV, $i, 1;
 172                last;
 173        }
 174};
 175
 176my %opts = %{$cmd{$cmd}->[2]} if (defined $cmd);
 177
 178read_repo_config(\%opts);
 179my $rv = GetOptions(%opts, 'help|H|h' => \$_help,
 180                                'version|V' => \$_version,
 181                                'id|i=s' => \$GIT_SVN);
 182exit 1 if (!$rv && $cmd ne 'log');
 183
 184set_default_vals();
 185usage(0) if $_help;
 186version() if $_version;
 187usage(1) unless defined $cmd;
 188init_vars();
 189load_authors() if $_authors;
 190load_all_refs() if $_branch_all_refs;
 191migration_check() unless $cmd =~ /^(?:init|rebuild|multi-init|commit-diff)$/;
 192$cmd{$cmd}->[0]->(@ARGV);
 193exit 0;
 194
 195####################### primary functions ######################
 196sub usage {
 197        my $exit = shift || 0;
 198        my $fd = $exit ? \*STDERR : \*STDOUT;
 199        print $fd <<"";
 200git-svn - bidirectional operations between a single Subversion tree and git
 201Usage: $0 <command> [options] [arguments]\n
 202
 203        print $fd "Available commands:\n" unless $cmd;
 204
 205        foreach (sort keys %cmd) {
 206                next if $cmd && $cmd ne $_;
 207                print $fd '  ',pack('A17',$_),$cmd{$_}->[1],"\n";
 208                foreach (keys %{$cmd{$_}->[2]}) {
 209                        # prints out arguments as they should be passed:
 210                        my $x = s#[:=]s$## ? '<arg>' : s#[:=]i$## ? '<num>' : '';
 211                        print $fd ' ' x 21, join(', ', map { length $_ > 1 ?
 212                                                        "--$_" : "-$_" }
 213                                                split /\|/,$_)," $x\n";
 214                }
 215        }
 216        print $fd <<"";
 217\nGIT_SVN_ID may be set in the environment or via the --id/-i switch to an
 218arbitrary identifier if you're tracking multiple SVN branches/repositories in
 219one git repository and want to keep them separate.  See git-svn(1) for more
 220information.
 221
 222        exit $exit;
 223}
 224
 225sub version {
 226        print "git-svn version $VERSION (svn $SVN::Core::VERSION)\n";
 227        exit 0;
 228}
 229
 230sub rebuild {
 231        if (!verify_ref("refs/remotes/$GIT_SVN^0")) {
 232                copy_remote_ref();
 233        }
 234        $SVN_URL = shift or undef;
 235        my $newest_rev = 0;
 236        if ($_upgrade) {
 237                command_noisy('update-ref',"refs/remotes/$GIT_SVN","
 238                              $GIT_SVN-HEAD");
 239        } else {
 240                check_upgrade_needed();
 241        }
 242
 243        my ($rev_list, $ctx) = command_output_pipe("rev-list",
 244                                                   "refs/remotes/$GIT_SVN");
 245        my $latest;
 246        my $svn_uuid;
 247        while (<$rev_list>) {
 248                chomp;
 249                my $c = $_;
 250                croak "Non-SHA1: $c\n" unless $c =~ /^$sha1$/o;
 251                my @commit = grep(/^git-svn-id: /,
 252                                  command(qw/cat-file commit/, $c));
 253                next if (!@commit); # skip merges
 254                my ($url, $rev, $uuid) = extract_metadata($commit[$#commit]);
 255                if (!defined $rev || !$uuid) {
 256                        croak "Unable to extract revision or UUID from ",
 257                                "$c, $commit[$#commit]\n";
 258                }
 259
 260                # if we merged or otherwise started elsewhere, this is
 261                # how we break out of it
 262                next if (defined $svn_uuid && ($uuid ne $svn_uuid));
 263                next if (defined $SVN_URL && defined $url && ($url ne $SVN_URL));
 264
 265                unless (defined $latest) {
 266                        if (!$SVN_URL && !$url) {
 267                                croak "SVN repository location required: $url\n";
 268                        }
 269                        $SVN_URL ||= $url;
 270                        $svn_uuid ||= $uuid;
 271                        setup_git_svn();
 272                        $latest = $rev;
 273                }
 274                revdb_set($REVDB, $rev, $c);
 275                print "r$rev = $c\n";
 276                $newest_rev = $rev if ($rev > $newest_rev);
 277        }
 278        command_close_pipe($rev_list, $ctx);
 279}
 280
 281sub init {
 282        my $url = shift or die "SVN repository location required " .
 283                                "as a command-line argument\n";
 284        $url =~ s!/+$!!; # strip trailing slash
 285
 286        if (my $repo_path = shift) {
 287                unless (-d $repo_path) {
 288                        mkpath([$repo_path]);
 289                }
 290                $GIT_DIR = $ENV{GIT_DIR} = $repo_path . "/.git";
 291                init_vars();
 292        }
 293
 294        $SVN_URL = $url;
 295        unless (-d $GIT_DIR) {
 296                my @init_db = ('init');
 297                push @init_db, "--template=$_template" if defined $_template;
 298                push @init_db, "--shared" if defined $_shared;
 299                command_noisy(@init_db);
 300        }
 301        setup_git_svn();
 302}
 303
 304sub cmd_fetch {
 305        fetch_child_id($GIT_SVN, @_);
 306}
 307
 308sub fetch {
 309        check_upgrade_needed();
 310        $SVN_URL ||= file_to_s("$GIT_SVN_DIR/info/url");
 311        my $ret = fetch_lib(@_);
 312        if ($ret->{commit} && !verify_ref('refs/heads/master^0')) {
 313                command_noisy(qw(update-ref refs/heads/master),$ret->{commit});
 314        }
 315        return $ret;
 316}
 317
 318sub fetch_lib {
 319        my (@parents) = @_;
 320        $SVN_URL ||= file_to_s("$GIT_SVN_DIR/info/url");
 321        $SVN ||= Git::SVN::Ra->new($SVN_URL);
 322        my ($last_rev, $last_commit) = svn_grab_base_rev();
 323        my ($base, $head) = libsvn_parse_revision($last_rev);
 324        if ($base > $head) {
 325                return { revision => $last_rev, commit => $last_commit }
 326        }
 327        my $index = set_index($GIT_SVN_INDEX);
 328
 329        # limit ourselves and also fork() since get_log won't release memory
 330        # after processing a revision and SVN stuff seems to leak
 331        my $inc = 1000;
 332        my ($min, $max) = ($base, $head < $base+$inc ? $head : $base+$inc);
 333        if (defined $last_commit) {
 334                unless (-e $GIT_SVN_INDEX) {
 335                        command_noisy('read-tree', $last_commit);
 336                }
 337                my $x = command_oneline('write-tree');
 338                my ($y) = (command(qw/cat-file commit/, $last_commit)
 339                                                        =~ /^tree ($sha1)/m);
 340                if ($y ne $x) {
 341                        unlink $GIT_SVN_INDEX or croak $!;
 342                        command_noisy('read-tree', $last_commit);
 343                }
 344                $x = command_oneline('write-tree');
 345                if ($y ne $x) {
 346                        print STDERR "trees ($last_commit) $y != $x\n",
 347                                 "Something is seriously wrong...\n";
 348                }
 349        }
 350        while (1) {
 351                # fork, because using SVN::Pool with get_log() still doesn't
 352                # seem to help enough to keep memory usage down.
 353                defined(my $pid = fork) or croak $!;
 354                if (!$pid) {
 355                        $SVN::Error::handler = \&libsvn_skip_unknown_revs;
 356
 357                        # Yes I'm perfectly aware that the fourth argument
 358                        # below is the limit revisions number.  Unfortunately
 359                        # performance sucks with it enabled, so it's much
 360                        # faster to fetch revision ranges instead of relying
 361                        # on the limiter.
 362                        $SVN->dup->get_log([''], $min, $max, 0, 1, 1,
 363                                sub {
 364                                        my $log_msg;
 365                                        if ($last_commit) {
 366                                                $log_msg = libsvn_fetch(
 367                                                        $last_commit, @_);
 368                                                $last_commit = git_commit(
 369                                                        $log_msg,
 370                                                        $last_commit,
 371                                                        @parents);
 372                                        } else {
 373                                                $log_msg = libsvn_new_tree(@_);
 374                                                $last_commit = git_commit(
 375                                                        $log_msg, @parents);
 376                                        }
 377                                });
 378                        exit 0;
 379                }
 380                waitpid $pid, 0;
 381                croak $? if $?;
 382                ($last_rev, $last_commit) = svn_grab_base_rev();
 383                last if ($max >= $head);
 384                $min = $max + 1;
 385                $max += $inc;
 386                $max = $head if ($max > $head);
 387                $SVN = Git::SVN::Ra->new($SVN_URL);
 388        }
 389        restore_index($index);
 390        return { revision => $last_rev, commit => $last_commit };
 391}
 392
 393sub commit {
 394        my (@commits) = @_;
 395        check_upgrade_needed();
 396        if ($_stdin || !@commits) {
 397                print "Reading from stdin...\n";
 398                @commits = ();
 399                while (<STDIN>) {
 400                        if (/\b($sha1_short)\b/o) {
 401                                unshift @commits, $1;
 402                        }
 403                }
 404        }
 405        my @revs;
 406        foreach my $c (@commits) {
 407                my @tmp = command('rev-parse',$c);
 408                if (scalar @tmp == 1) {
 409                        push @revs, $tmp[0];
 410                } elsif (scalar @tmp > 1) {
 411                        push @revs, reverse(command('rev-list',@tmp));
 412                } else {
 413                        die "Failed to rev-parse $c\n";
 414                }
 415        }
 416        commit_lib(@revs);
 417        print "Done committing ",scalar @revs," revisions to SVN\n";
 418}
 419
 420sub commit_lib {
 421        my (@revs) = @_;
 422        my ($r_last, $cmt_last) = svn_grab_base_rev();
 423        defined $r_last or die "Must have an existing revision to commit\n";
 424        my $fetched = fetch();
 425        if ($r_last != $fetched->{revision}) {
 426                print STDERR "There are new revisions that were fetched ",
 427                                "and need to be merged (or acknowledged) ",
 428                                "before committing.\n",
 429                                "last rev: $r_last\n",
 430                                " current: $fetched->{revision}\n";
 431                exit 1;
 432        }
 433        my $commit_msg = "$GIT_SVN_DIR/.svn-commit.tmp.$$";
 434
 435        my $repo;
 436        set_svn_commit_env();
 437        foreach my $c (@revs) {
 438                my $log_msg = get_commit_message($c, $commit_msg);
 439
 440                # fork for each commit because there's a memory leak I
 441                # can't track down... (it's probably in the SVN code)
 442                defined(my $pid = open my $fh, '-|') or croak $!;
 443                if (!$pid) {
 444                        my $pool = SVN::Pool->new;
 445                        my $ed = SVN::Git::Editor->new(
 446                                        {       r => $r_last,
 447                                                ra => $SVN->dup,
 448                                                c => $c,
 449                                                svn_path => $SVN->{svn_path},
 450                                        },
 451                                        $SVN->get_commit_editor(
 452                                                $log_msg->{msg},
 453                                                sub {
 454                                                        libsvn_commit_cb(
 455                                                                @_, $c,
 456                                                                $log_msg->{msg},
 457                                                                $r_last,
 458                                                                $cmt_last)
 459                                                }, $pool)
 460                                        );
 461                        my $mods = libsvn_checkout_tree($cmt_last, $c, $ed);
 462                        if (@$mods == 0) {
 463                                print "No changes\nr$r_last = $cmt_last\n";
 464                                $ed->abort_edit;
 465                        } else {
 466                                $ed->close_edit;
 467                        }
 468                        $pool->clear;
 469                        exit 0;
 470                }
 471                my ($r_new, $cmt_new, $no);
 472                while (<$fh>) {
 473                        print $_;
 474                        chomp;
 475                        if (/^r(\d+) = ($sha1)$/o) {
 476                                ($r_new, $cmt_new) = ($1, $2);
 477                        } elsif ($_ eq 'No changes') {
 478                                $no = 1;
 479                        }
 480                }
 481                close $fh or exit 1;
 482                if (! defined $r_new && ! defined $cmt_new) {
 483                        unless ($no) {
 484                                die "Failed to parse revision information\n";
 485                        }
 486                } else {
 487                        ($r_last, $cmt_last) = ($r_new, $cmt_new);
 488                }
 489        }
 490        $ENV{LC_ALL} = 'C';
 491        unlink $commit_msg;
 492}
 493
 494sub dcommit {
 495        my $head = shift || 'HEAD';
 496        my $gs = "refs/remotes/$GIT_SVN";
 497        my @refs = command(qw/rev-list --no-merges/, "$gs..$head");
 498        my $last_rev;
 499        foreach my $d (reverse @refs) {
 500                if (!verify_ref("$d~1")) {
 501                        die "Commit $d\n",
 502                            "has no parent commit, and therefore ",
 503                            "nothing to diff against.\n",
 504                            "You should be working from a repository ",
 505                            "originally created by git-svn\n";
 506                }
 507                unless (defined $last_rev) {
 508                        (undef, $last_rev, undef) = cmt_metadata("$d~1");
 509                        unless (defined $last_rev) {
 510                                die "Unable to extract revision information ",
 511                                    "from commit $d~1\n";
 512                        }
 513                }
 514                if ($_dry_run) {
 515                        print "diff-tree $d~1 $d\n";
 516                } else {
 517                        if (my $r = commit_diff("$d~1", $d, undef, $last_rev)) {
 518                                $last_rev = $r;
 519                        } # else: no changes, same $last_rev
 520                }
 521        }
 522        return if $_dry_run;
 523        fetch();
 524        my @diff = command('diff-tree', 'HEAD', $gs, '--');
 525        my @finish;
 526        if (@diff) {
 527                @finish = qw/rebase/;
 528                push @finish, qw/--merge/ if $_merge;
 529                push @finish, "--strategy=$_strategy" if $_strategy;
 530                print STDERR "W: HEAD and $gs differ, using @finish:\n", @diff;
 531        } else {
 532                print "No changes between current HEAD and $gs\n",
 533                      "Resetting to the latest $gs\n";
 534                @finish = qw/reset --mixed/;
 535        }
 536        command_noisy(@finish, $gs);
 537}
 538
 539sub show_ignore {
 540        $SVN_URL ||= file_to_s("$GIT_SVN_DIR/info/url");
 541        my $repo;
 542        $SVN ||= Git::SVN::Ra->new($SVN_URL);
 543        my $r = defined $_revision ? $_revision : $SVN->get_latest_revnum;
 544        libsvn_traverse_ignore(\*STDOUT, '', $r);
 545}
 546
 547sub graft_branches {
 548        my $gr_file = "$GIT_DIR/info/grafts";
 549        my ($grafts, $comments) = read_grafts($gr_file);
 550        my $gr_sha1;
 551
 552        if (%$grafts) {
 553                # temporarily disable our grafts file to make this idempotent
 554                chomp($gr_sha1 = command(qw/hash-object -w/,$gr_file));
 555                rename $gr_file, "$gr_file~$gr_sha1" or croak $!;
 556        }
 557
 558        my $l_map = read_url_paths();
 559        my @re = map { qr/$_/is } @_opt_m if @_opt_m;
 560        unless ($_no_default_regex) {
 561                push @re, (qr/\b(?:merge|merging|merged)\s+with\s+([\w\.\-]+)/i,
 562                        qr/\b(?:merge|merging|merged)\s+([\w\.\-]+)/i,
 563                        qr/\b(?:from|of)\s+([\w\.\-]+)/i );
 564        }
 565        foreach my $u (keys %$l_map) {
 566                if (@re) {
 567                        foreach my $p (keys %{$l_map->{$u}}) {
 568                                graft_merge_msg($grafts,$l_map,$u,$p,@re);
 569                        }
 570                }
 571                unless ($_no_graft_copy) {
 572                        graft_file_copy_lib($grafts,$l_map,$u);
 573                }
 574        }
 575        graft_tree_joins($grafts);
 576
 577        write_grafts($grafts, $comments, $gr_file);
 578        unlink "$gr_file~$gr_sha1" if $gr_sha1;
 579}
 580
 581sub multi_init {
 582        my $url = shift;
 583        unless (defined $_trunk || defined $_branches || defined $_tags) {
 584                usage(1);
 585        }
 586        if (defined $_trunk) {
 587                my $trunk_url = complete_svn_url($url, $_trunk);
 588                my $ch_id;
 589                if ($GIT_SVN eq 'git-svn') {
 590                        $ch_id = 1;
 591                        $GIT_SVN = $ENV{GIT_SVN_ID} = 'trunk';
 592                }
 593                init_vars();
 594                unless (-d $GIT_SVN_DIR) {
 595                        if ($ch_id) {
 596                                print "GIT_SVN_ID set to 'trunk' for ",
 597                                      "$trunk_url ($_trunk)\n";
 598                        }
 599                        init($trunk_url);
 600                        command_noisy('config', 'svn.trunk', $trunk_url);
 601                }
 602        }
 603        $_prefix = '' unless defined $_prefix;
 604        complete_url_ls_init($url, $_branches, '--branches/-b', $_prefix);
 605        complete_url_ls_init($url, $_tags, '--tags/-t', $_prefix . 'tags/');
 606}
 607
 608sub multi_fetch {
 609        # try to do trunk first, since branches/tags
 610        # may be descended from it.
 611        if (-e "$GIT_DIR/svn/trunk/info/url") {
 612                fetch_child_id('trunk', @_);
 613        }
 614        rec_fetch('', "$GIT_DIR/svn", @_);
 615}
 616
 617sub show_log {
 618        my (@args) = @_;
 619        my ($r_min, $r_max);
 620        my $r_last = -1; # prevent dupes
 621        rload_authors() if $_authors;
 622        if (defined $TZ) {
 623                $ENV{TZ} = $TZ;
 624        } else {
 625                delete $ENV{TZ};
 626        }
 627        if (defined $_revision) {
 628                if ($_revision =~ /^(\d+):(\d+)$/) {
 629                        ($r_min, $r_max) = ($1, $2);
 630                } elsif ($_revision =~ /^\d+$/) {
 631                        $r_min = $r_max = $_revision;
 632                } else {
 633                        print STDERR "-r$_revision is not supported, use ",
 634                                "standard \'git log\' arguments instead\n";
 635                        exit 1;
 636                }
 637        }
 638
 639        config_pager();
 640        @args = (git_svn_log_cmd($r_min, $r_max), @args);
 641        my $log = command_output_pipe(@args);
 642        run_pager();
 643        my (@k, $c, $d);
 644
 645        while (<$log>) {
 646                if (/^${_esc_color}commit ($sha1_short)/o) {
 647                        my $cmt = $1;
 648                        if ($c && cmt_showable($c) && $c->{r} != $r_last) {
 649                                $r_last = $c->{r};
 650                                process_commit($c, $r_min, $r_max, \@k) or
 651                                                                goto out;
 652                        }
 653                        $d = undef;
 654                        $c = { c => $cmt };
 655                } elsif (/^${_esc_color}author (.+) (\d+) ([\-\+]?\d+)$/) {
 656                        get_author_info($c, $1, $2, $3);
 657                } elsif (/^${_esc_color}(?:tree|parent|committer) /) {
 658                        # ignore
 659                } elsif (/^${_esc_color}:\d{6} \d{6} $sha1_short/o) {
 660                        push @{$c->{raw}}, $_;
 661                } elsif (/^${_esc_color}[ACRMDT]\t/) {
 662                        # we could add $SVN->{svn_path} here, but that requires
 663                        # remote access at the moment (repo_path_split)...
 664                        s#^(${_esc_color})([ACRMDT])\t#$1   $2 #;
 665                        push @{$c->{changed}}, $_;
 666                } elsif (/^${_esc_color}diff /) {
 667                        $d = 1;
 668                        push @{$c->{diff}}, $_;
 669                } elsif ($d) {
 670                        push @{$c->{diff}}, $_;
 671                } elsif (/^${_esc_color}    (git-svn-id:.+)$/) {
 672                        ($c->{url}, $c->{r}, undef) = extract_metadata($1);
 673                } elsif (s/^${_esc_color}    //) {
 674                        push @{$c->{l}}, $_;
 675                }
 676        }
 677        if ($c && defined $c->{r} && $c->{r} != $r_last) {
 678                $r_last = $c->{r};
 679                process_commit($c, $r_min, $r_max, \@k);
 680        }
 681        if (@k) {
 682                my $swap = $r_max;
 683                $r_max = $r_min;
 684                $r_min = $swap;
 685                process_commit($_, $r_min, $r_max) foreach reverse @k;
 686        }
 687out:
 688        close $log;
 689        print '-' x72,"\n" unless $_incremental || $_oneline;
 690}
 691
 692sub commit_diff_usage {
 693        print STDERR "Usage: $0 commit-diff <tree-ish> <tree-ish> [<URL>]\n";
 694        exit 1
 695}
 696
 697sub commit_diff {
 698        my $ta = shift or commit_diff_usage();
 699        my $tb = shift or commit_diff_usage();
 700        if (!eval { $SVN_URL = shift || file_to_s("$GIT_SVN_DIR/info/url") }) {
 701                print STDERR "Needed URL or usable git-svn id command-line\n";
 702                commit_diff_usage();
 703        }
 704        my $r = shift;
 705        unless (defined $r) {
 706                if (defined $_revision) {
 707                        $r = $_revision
 708                } else {
 709                        die "-r|--revision is a required argument\n";
 710                }
 711        }
 712        if (defined $_message && defined $_file) {
 713                print STDERR "Both --message/-m and --file/-F specified ",
 714                                "for the commit message.\n",
 715                                "I have no idea what you mean\n";
 716                exit 1;
 717        }
 718        if (defined $_file) {
 719                $_message = file_to_s($_file);
 720        } else {
 721                $_message ||= get_commit_message($tb,
 722                                        "$GIT_DIR/.svn-commit.tmp.$$")->{msg};
 723        }
 724        $SVN ||= Git::SVN::Ra->new($SVN_URL);
 725        if ($r eq 'HEAD') {
 726                $r = $SVN->get_latest_revnum;
 727        } elsif ($r !~ /^\d+$/) {
 728                die "revision argument: $r not understood by git-svn\n";
 729        }
 730        my $rev_committed;
 731        my $pool = SVN::Pool->new;
 732        my $ed = SVN::Git::Editor->new({        r => $r,
 733                                                ra => $SVN->dup,
 734                                                c => $tb,
 735                                                svn_path => $SVN->{svn_path}
 736                                        },
 737                                $SVN->get_commit_editor($_message,
 738                                        sub {
 739                                                $rev_committed = $_[0];
 740                                                print "Committed $_[0]\n";
 741                                        },
 742                                        $pool)
 743                                );
 744        eval {
 745                my $mods = libsvn_checkout_tree($ta, $tb, $ed);
 746                if (@$mods == 0) {
 747                        print "No changes\n$ta == $tb\n";
 748                        $ed->abort_edit;
 749                } else {
 750                        $ed->close_edit;
 751                }
 752        };
 753        $pool->clear;
 754        fatal "$@\n" if $@;
 755        $_message = $_file = undef;
 756        return $rev_committed;
 757}
 758
 759########################### utility functions #########################
 760
 761sub cmt_showable {
 762        my ($c) = @_;
 763        return 1 if defined $c->{r};
 764        if ($c->{l} && $c->{l}->[-1] eq "...\n" &&
 765                                $c->{a_raw} =~ /\@([a-f\d\-]+)>$/) {
 766                my @msg = command(qw/cat-file commit/, $c->{c});
 767                shift @msg while ($msg[0] ne "\n");
 768                shift @msg;
 769                @{$c->{l}} = grep !/^git-svn-id: /, @msg;
 770
 771                (undef, $c->{r}, undef) = extract_metadata(
 772                                (grep(/^git-svn-id: /, @msg))[-1]);
 773        }
 774        return defined $c->{r};
 775}
 776
 777sub log_use_color {
 778        return 1 if $_color;
 779        my ($dc, $dcvar);
 780        $dcvar = 'color.diff';
 781        $dc = `git-config --get $dcvar`;
 782        if ($dc eq '') {
 783                # nothing at all; fallback to "diff.color"
 784                $dcvar = 'diff.color';
 785                $dc = `git-config --get $dcvar`;
 786        }
 787        chomp($dc);
 788        if ($dc eq 'auto') {
 789                my $pc;
 790                $pc = `git-config --get color.pager`;
 791                if ($pc eq '') {
 792                        # does not have it -- fallback to pager.color
 793                        $pc = `git-config --bool --get pager.color`;
 794                }
 795                else {
 796                        $pc = `git-config --bool --get color.pager`;
 797                        if ($?) {
 798                                $pc = 'false';
 799                        }
 800                }
 801                chomp($pc);
 802                if (-t *STDOUT || (defined $_pager && $pc eq 'true')) {
 803                        return ($ENV{TERM} && $ENV{TERM} ne 'dumb');
 804                }
 805                return 0;
 806        }
 807        return 0 if $dc eq 'never';
 808        return 1 if $dc eq 'always';
 809        chomp($dc = `git-config --bool --get $dcvar`);
 810        return ($dc eq 'true');
 811}
 812
 813sub git_svn_log_cmd {
 814        my ($r_min, $r_max) = @_;
 815        my @cmd = (qw/log --abbrev-commit --pretty=raw
 816                        --default/, "refs/remotes/$GIT_SVN");
 817        push @cmd, '-r' unless $_non_recursive;
 818        push @cmd, qw/--raw --name-status/ if $_verbose;
 819        push @cmd, '--color' if log_use_color();
 820        return @cmd unless defined $r_max;
 821        if ($r_max == $r_min) {
 822                push @cmd, '--max-count=1';
 823                if (my $c = revdb_get($REVDB, $r_max)) {
 824                        push @cmd, $c;
 825                }
 826        } else {
 827                my ($c_min, $c_max);
 828                $c_max = revdb_get($REVDB, $r_max);
 829                $c_min = revdb_get($REVDB, $r_min);
 830                if (defined $c_min && defined $c_max) {
 831                        if ($r_max > $r_max) {
 832                                push @cmd, "$c_min..$c_max";
 833                        } else {
 834                                push @cmd, "$c_max..$c_min";
 835                        }
 836                } elsif ($r_max > $r_min) {
 837                        push @cmd, $c_max;
 838                } else {
 839                        push @cmd, $c_min;
 840                }
 841        }
 842        return @cmd;
 843}
 844
 845sub fetch_child_id {
 846        my $id = shift;
 847        print "Fetching $id\n";
 848        my $ref = "$GIT_DIR/refs/remotes/$id";
 849        defined(my $pid = open my $fh, '-|') or croak $!;
 850        if (!$pid) {
 851                $GIT_SVN = $ENV{GIT_SVN_ID} = $id;
 852                init_vars();
 853                fetch(@_);
 854                exit 0;
 855        }
 856        while (<$fh>) {
 857                print $_;
 858                check_repack() if (/^r\d+ = $sha1/o);
 859        }
 860        close $fh or croak $?;
 861}
 862
 863sub rec_fetch {
 864        my ($pfx, $p, @args) = @_;
 865        my @dir;
 866        foreach (sort <$p/*>) {
 867                if (-r "$_/info/url") {
 868                        $pfx .= '/' if $pfx && $pfx !~ m!/$!;
 869                        my $id = $pfx . basename $_;
 870                        next if $id eq 'trunk';
 871                        fetch_child_id($id, @args);
 872                } elsif (-d $_) {
 873                        push @dir, $_;
 874                }
 875        }
 876        foreach (@dir) {
 877                my $x = $_;
 878                $x =~ s!^\Q$GIT_DIR\E/svn/!!;
 879                rec_fetch($x, $_);
 880        }
 881}
 882
 883sub complete_svn_url {
 884        my ($url, $path) = @_;
 885        $path =~ s#/+$##;
 886        $url =~ s#/+$## if $url;
 887        if ($path !~ m#^[a-z\+]+://#) {
 888                $path = '/' . $path if ($path !~ m#^/#);
 889                if (!defined $url || $url !~ m#^[a-z\+]+://#) {
 890                        fatal("E: '$path' is not a complete URL ",
 891                              "and a separate URL is not specified\n");
 892                }
 893                $path = $url . $path;
 894        }
 895        return $path;
 896}
 897
 898sub complete_url_ls_init {
 899        my ($url, $path, $switch, $pfx) = @_;
 900        unless ($path) {
 901                print STDERR "W: $switch not specified\n";
 902                return;
 903        }
 904        my $full_url = complete_svn_url($url, $path);
 905        my @ls = libsvn_ls_fullurl($full_url);
 906        defined(my $pid = fork) or croak $!;
 907        if (!$pid) {
 908                foreach my $u (map { "$full_url/$_" } (grep m!/$!, @ls)) {
 909                        $u =~ s#/+$##;
 910                        if ($u !~ m!\Q$full_url\E/(.+)$!) {
 911                                print STDERR "W: Unrecognized URL: $u\n";
 912                                die "This should never happen\n";
 913                        }
 914                        # don't try to init already existing refs
 915                        my $id = $pfx.$1;
 916                        $GIT_SVN = $ENV{GIT_SVN_ID} = $id;
 917                        init_vars();
 918                        unless (-d $GIT_SVN_DIR) {
 919                                print "init $u => $id\n";
 920                                init($u);
 921                        }
 922                }
 923                exit 0;
 924        }
 925        waitpid $pid, 0;
 926        croak $? if $?;
 927        my ($n) = ($switch =~ /^--(\w+)/);
 928        command_noisy('config', "svn.$n", $full_url);
 929}
 930
 931sub common_prefix {
 932        my $paths = shift;
 933        my %common;
 934        foreach (@$paths) {
 935                my @tmp = split m#/#, $_;
 936                my $p = '';
 937                while (my $x = shift @tmp) {
 938                        $p .= "/$x";
 939                        $common{$p} ||= 0;
 940                        $common{$p}++;
 941                }
 942        }
 943        foreach (sort {length $b <=> length $a} keys %common) {
 944                if ($common{$_} == @$paths) {
 945                        return $_;
 946                }
 947        }
 948        return '';
 949}
 950
 951# grafts set here are 'stronger' in that they're based on actual tree
 952# matches, and won't be deleted from merge-base checking in write_grafts()
 953sub graft_tree_joins {
 954        my $grafts = shift;
 955        map_tree_joins() if (@_branch_from && !%tree_map);
 956        return unless %tree_map;
 957
 958        git_svn_each(sub {
 959                my $i = shift;
 960                my @args = (qw/rev-list --pretty=raw/, "refs/remotes/$i");
 961                my ($fh, $ctx) = command_output_pipe(@args);
 962                while (<$fh>) {
 963                        next unless /^commit ($sha1)$/o;
 964                        my $c = $1;
 965                        my ($t) = (<$fh> =~ /^tree ($sha1)$/o);
 966                        next unless $tree_map{$t};
 967
 968                        my $l;
 969                        do {
 970                                $l = readline $fh;
 971                        } until ($l =~ /^committer (?:.+) (\d+) ([\-\+]?\d+)$/);
 972
 973                        my ($s, $tz) = ($1, $2);
 974                        if ($tz =~ s/^\+//) {
 975                                $s += tz_to_s_offset($tz);
 976                        } elsif ($tz =~ s/^\-//) {
 977                                $s -= tz_to_s_offset($tz);
 978                        }
 979
 980                        my ($url_a, $r_a, $uuid_a) = cmt_metadata($c);
 981
 982                        foreach my $p (@{$tree_map{$t}}) {
 983                                next if $p eq $c;
 984                                my $mb = eval { command('merge-base', $c, $p) };
 985                                next unless ($@ || $?);
 986                                if (defined $r_a) {
 987                                        # see if SVN says it's a relative
 988                                        my ($url_b, $r_b, $uuid_b) =
 989                                                        cmt_metadata($p);
 990                                        next if (defined $url_b &&
 991                                                        defined $url_a &&
 992                                                        ($url_a eq $url_b) &&
 993                                                        ($uuid_a eq $uuid_b));
 994                                        if ($uuid_a eq $uuid_b) {
 995                                                if ($r_b < $r_a) {
 996                                                        $grafts->{$c}->{$p} = 2;
 997                                                        next;
 998                                                } elsif ($r_b > $r_a) {
 999                                                        $grafts->{$p}->{$c} = 2;
1000                                                        next;
1001                                                }
1002                                        }
1003                                }
1004                                my $ct = get_commit_time($p);
1005                                if ($ct < $s) {
1006                                        $grafts->{$c}->{$p} = 2;
1007                                } elsif ($ct > $s) {
1008                                        $grafts->{$p}->{$c} = 2;
1009                                }
1010                                # what should we do when $ct == $s ?
1011                        }
1012                }
1013                command_close_pipe($fh, $ctx);
1014        });
1015}
1016
# Scan the SVN log below the common prefix of all paths known for repository
# $u and hand each log entry to libsvn_graft_file_copies().
# The log is requested in windows of 1000 revisions between the bounds
# returned by libsvn_parse_revision(); while scanning, the SVN error handler
# is swapped for libsvn_skip_unknown_revs and put back afterwards.
sub graft_file_copy_lib {
        my ($grafts, $l_map, $u) = @_;
        my $tree_paths = $l_map->{$u};
        my $pfx = common_prefix([keys %$tree_paths]);
        my ($repo, $path) = repo_path_split($u.$pfx);
        $SVN = Git::SVN::Ra->new($repo);

        my ($base, $head) = libsvn_parse_revision();
        my $step = 1000;
        my $min = $base;
        my $max = $base + $step;
        $max = $head if $head < $max;

        my $saved_handler = $SVN::Error::handler;
        $SVN::Error::handler = \&libsvn_skip_unknown_revs;
        for (;;) {
                $SVN->dup->get_log([$path], $min, $max, 0, 2, 1,
                        sub {
                                libsvn_graft_file_copies($grafts, $tree_paths,
                                                        $path, @_);
                        });
                last if ($max >= $head);
                # advance to the next window, clamped to $head
                $min = $max + 1;
                $max += $step;
                $max = $head if ($max > $head);
        }
        $SVN::Error::handler = $saved_handler;
}
1042
# Record grafts for branch names (@matches) found in the log message of
# commit $c.  Names that are keys of $l_map->{$u} count as strong matches;
# if there are none, each remaining (weak) name, and then its basename, is
# tried as a case-insensitive pattern against those keys.  For every strong
# match the commit found by find_rev_before() for the SVN revision of $c is
# grafted onto $c with strength 1.  Does nothing when no git-svn-id revision
# can be extracted from the message.
# NOTE(review): exact matches push the matched name while pattern matches
# push the mapped value from $l_map->{$u} -- confirm which of the two
# find_rev_before() expects.
sub process_merge_msg_matches {
        my ($grafts, $l_map, $u, $p, $c, @matches) = @_;
        my (@strong, @weak);
        foreach my $m (@matches) {
                # merging with ourselves is not interesting
                next if $m eq $p;
                push @{ $l_map->{$u}->{$m} ? \@strong : \@weak }, $m;
        }
WEAK:   foreach my $w (@weak) {
                last if @strong;
                # no exact match, use branch name (then just its last
                # path component) as regexp.
                foreach my $name ($w, basename($w)) {
                        my $re = qr/\Q$name\E/i;
                        foreach (keys %{$l_map->{$u}}) {
                                next unless /$re/;
                                push @strong, $l_map->{$u}->{$_};
                                last;
                        }
                        last WEAK if @strong;
                }
        }
        my ($rev) = ($c->{m} =~ /^git-svn-id:\s(?:\S+?)\@(\d+)
                                        \s(?:[a-f\d\-]+)$/xsm);
        unless (defined $rev) {
                ($rev) = ($c->{m} =~/^git-svn-id:\s(\d+)
                                        \@(?:[a-f\d\-]+)/xsm);
                return unless defined $rev;
        }
        foreach my $m (@strong) {
                my ($r0, $s0) = find_rev_before($rev, $m, 1);
                $grafts->{$c->{c}}->{$s0} = 1 if defined $s0;
        }
}
1087
# Walk the history of the remote ref mapped to path $p of repository $u and
# apply every pattern in @re to each commit message; all matches of a
# pattern are passed on to process_merge_msg_matches().
sub graft_merge_msg {
        my ($grafts, $l_map, $u, $p, @re) = @_;

        my $rl = rev_list_raw('refs/remotes/' . $l_map->{$u}->{$p});
        while (my $c = next_rev_list_entry($rl)) {
                foreach my $re (@re) {
                        my @br = ($c->{m} =~ /$re/g);
                        process_merge_msg_matches($grafts,$l_map,$u,$p,$c,@br)
                                if @br;
                }
        }
}
1101
# Resolve $ref with "rev-parse --verify" (STDERR => 0 is passed as a command
# option).  Returns the command's one-line output, or the failed eval's
# empty result when the command throws.
sub verify_ref {
        my ($ref) = @_;
        my @cmd = ('rev-parse', '--verify', $ref);
        return eval { command_oneline(\@cmd, { STDERR => 0 }) };
}
1107
# Split a full SVN URL into (repository root, path inside the repository).
# Patterns in @repo_path_split_cache are tried first: the first one that
# matches is removed from the URL and its first capture is used as the
# root.  Otherwise a Git::SVN::Ra connection is opened and asked.
sub repo_path_split {
        my $full_url = shift;
        $full_url =~ s#/+$##;

        foreach my $re (@repo_path_split_cache) {
                next unless $full_url =~ s#$re##;
                my $u = $1;
                $full_url =~ s#^/+##;
                return ($u, $full_url);
        }
        my $ra = Git::SVN::Ra->new($full_url);
        return @{$ra}{qw/repos_root svn_path/};
}
1122
# Create the on-disk state for the current git-svn id: the $GIT_SVN_DIR and
# "$GIT_SVN_DIR/info" directories, the revision db file $REVDB (created if
# missing, never truncated) and the "info/url" file holding $SVN_URL.
# Croaks when $SVN_URL is undefined or $GIT_DIR does not exist.
sub setup_git_svn {
        defined $SVN_URL or croak "SVN repository location required\n";
        croak "GIT_DIR=$GIT_DIR does not exist!\n" unless -d $GIT_DIR;
        mkpath([$GIT_SVN_DIR, "$GIT_SVN_DIR/info"]);
        # open for append so an existing db is left untouched
        open my $fh, '>>',$REVDB or croak $!;
        close $fh;
        s_to_file($SVN_URL,"$GIT_SVN_DIR/info/url");

}
1135
# Resolve a full sha1 naming a tree, commit or tag to the sha1 of its tree.
# Tags are peeled (repeatedly, for tags of tags) until a commit or tree is
# reached.  Croaks when the argument is not a sha1; dies when a tag or
# commit cannot be parsed or the object is of any other type.
sub get_tree_from_treeish {
        my ($treeish) = @_;
        croak "Not a sha1: $treeish\n" unless $treeish =~ /^$sha1$/o;
        my $type = command_oneline(qw/cat-file -t/, $treeish);
        my $expected;
        while ($type eq 'tag') {
                # A raw tag object starts with "object <sha1>" and
                # "type <type>" header lines.  They have to be parsed:
                # taking the lines verbatim would leave $type as
                # "type commit", which matches none of the cases below.
                my ($obj, $obj_type);
                foreach my $line (command(qw/cat-file tag/, $treeish)) {
                        last if $line =~ /^\s*$/; # end of the tag header
                        $obj = $1 if $line =~ /^object ($sha1)\s*$/o;
                        $obj_type = $1 if $line =~ /^type (\S+)\s*$/;
                }
                unless (defined $obj && defined $obj_type) {
                        die "Unable to parse tag $treeish\n";
                }
                ($treeish, $type) = ($obj, $obj_type);
        }
        if ($type eq 'commit') {
                my ($tree_line) = grep /^tree /, command(qw/cat-file commit/,
                                                         $treeish);
                ($expected) = ($tree_line =~ /^tree ($sha1)$/)
                        if defined $tree_line;
                die "Unable to get tree from $treeish\n" unless $expected;
        } elsif ($type eq 'tree') {
                $expected = $treeish;
        } else {
                die "$treeish is a $type, expected tree, tag or commit\n";
        }
        return $expected;
}
1156
# Run "diff-tree -z -r" with copy detection between $from and $treeish and
# parse its NUL-separated output.  Returns a reference to an array of hashes
# with the keys mode_a, mode_b, sha1_b, chg (one of M T C R A D) and file_b,
# plus file_a for copies and renames.  Croaks on output it cannot parse.
sub get_diff {
        my ($from, $treeish) = @_;
        print "diff-tree $from $treeish\n";
        my @diff_tree = (qw(diff-tree -z -r),
                         $_cp_similarity ? "-C$_cp_similarity" : '-C');
        push @diff_tree, '--find-copies-harder' if $_find_copies_harder;
        push @diff_tree, "-l$_l" if defined $_l;
        my ($diff_fh, $ctx) = command_output_pipe(@diff_tree, $from, $treeish);
        local $/ = "\0";
        # parser state: 'meta' expects a ":mode mode sha1 sha1 status"
        # record, 'file_a'/'file_b' expect the source/destination path
        my $state = 'meta';
        my @mods;
        while (<$diff_fh>) {
                chomp $_; # this gets rid of the trailing "\0"
                if ($state eq 'meta' && /^:(\d{6})\s(\d{6})\s
                                        $sha1\s($sha1)\s([MTCRAD])\d*$/xo) {
                        push @mods, {   mode_a => $1, mode_b => $2,
                                        sha1_b => $3, chg => $4 };
                        # only copies and renames carry a source path
                        $state = ($4 =~ /^(?:C|R)$/) ? 'file_a' : 'file_b';
                } elsif ($state eq 'file_a' || $state eq 'file_b') {
                        my $x = $mods[-1] or croak "Empty array\n";
                        my $cp_or_mv = ($x->{chg} =~ /^(?:C|R)$/);
                        if ($state eq 'file_a') {
                                croak "Error parsing $_, $x->{chg}\n"
                                        unless $cp_or_mv;
                                $x->{file_a} = $_;
                                $state = 'file_b';
                        } else {
                                # a source path must be present exactly
                                # when the change is a copy or rename
                                if (exists $x->{file_a} xor $cp_or_mv) {
                                        croak "Error parsing $_, $x->{chg}\n";
                                }
                                $x->{file_b} = $_;
                                $state = 'meta';
                        }
                } else {
                        croak "Error parsing $_\n";
                }
        }
        command_close_pipe($diff_fh, $ctx);
        return \@mods;
}
1208
# Replay the differences between $from and $treeish on the editor $ed.
# Each change from get_diff() is dispatched to the editor method named after
# its status letter, in the order copies, renames, deletes, then adds,
# modifications and type changes.  $ed->rmdirs is called afterwards when
# $_rmdir is set.  Returns the array reference produced by get_diff().
sub libsvn_checkout_tree {
        my ($from, $treeish, $ed) = @_;
        my $mods = get_diff($from, $treeish);
        return $mods unless (scalar @$mods);
        my %order = ( D => 1, R => 0, C => -1, A => 3, M => 3, T => 3 );
        my @sorted = sort { $order{$a->{chg}} <=> $order{$b->{chg}} } @$mods;
        foreach my $m (@sorted) {
                my $method = $m->{chg};
                croak "Invalid change type: $method\n"
                        unless defined $order{$method};
                $ed->$method($m, $_q);
        }
        $ed->rmdirs($_q) if $_rmdir;
        return $mods;
}
1225
# Write the log message of $commit to the file $commit_msg and read it back.
# For commits and tags the message body (everything after the first blank
# line, minus git-svn-id lines) is copied into the file; for other object
# types the file starts out empty.  An editor ($VISUAL, $EDITOR or vi) is
# run on the file when $_edit is set or the object is a tree.
# Returns a hash reference whose 'msg' key holds the file contents.
sub get_commit_message {
        my ($commit, $commit_msg) = (@_);
        my %log_msg = ( msg => '' );
        open my $msg, '>', $commit_msg or croak $!;

        my $type = command_oneline(qw/cat-file -t/, $commit);
        if ($type eq 'commit' || $type eq 'tag') {
                my ($msg_fh, $ctx) = command_output_pipe('cat-file',
                                                         $type, $commit);
                my $in_msg = 0;
                while (my $line = <$msg_fh>) {
                        unless ($in_msg) {
                                # still in the header: wait for the blank
                                # line that separates it from the message
                                $in_msg = 1 if ($line =~ /^\s*$/);
                                next;
                        }
                        # skip this, we regenerate the correct one
                        # on re-fetch anyways
                        next if $line =~ /^git-svn-id: /;
                        print $msg $line or croak $!;
                }
                command_close_pipe($msg_fh, $ctx);
        }
        close $msg or croak $!;

        if ($_edit || ($type eq 'tree')) {
                my $editor = $ENV{VISUAL} || $ENV{EDITOR} || 'vi';
                system($editor, $commit_msg);
        }

        # file_to_s removes all trailing newlines, so just use chomp() here:
        # NOTE(review): with $/ undefined chomp() removes nothing, so the
        # message is returned exactly as stored in the file -- confirm that
        # this is what callers expect.
        open $msg, '<', $commit_msg or croak $!;
        { local $/; chomp($log_msg{msg} = <$msg>); }
        close $msg or croak $!;

        return \%log_msg;
}
1262
# Put LC_ALL back to the value it had when the program started (saved in
# $LC_ALL), removing it from the environment if it was not set then.
sub set_svn_commit_env {
        defined $LC_ALL ? ($ENV{LC_ALL} = $LC_ALL) : delete $ENV{LC_ALL};
}
1270
# Start "rev-list --pretty=raw" with the given arguments and return the
# iterator state consumed by next_rev_list_entry(): the pipe handle (fh),
# its close context (ctx) and an empty pending entry (t).
sub rev_list_raw {
        my @cmd = (qw/rev-list --pretty=raw/, @_);
        my ($fh, $ctx) = command_output_pipe(@cmd);
        my %rl = (fh => $fh, ctx => $ctx, t => { });
        return \%rl;
}
1275
# Return the next commit from an iterator created by rev_list_raw(), or
# undef once all commits have been returned.
# An entry is a hash reference with the keys c (commit sha1), p (hash of
# parent sha1s, when there are parents) and m (the log message with the
# four-space indentation removed, when there is a message).
sub next_rev_list_entry {
        my $rl = shift;
        # the pipe was drained and closed by an earlier call
        return undef if $rl->{eof};
        my $fh = $rl->{fh};
        my $x = $rl->{t};
        while (<$fh>) {
                if (/^commit ($sha1)$/o) {
                        if ($x->{c}) {
                                # a new commit starts: remember it for the
                                # next call and hand out the finished one
                                $rl->{t} = { c => $1 };
                                return $x;
                        } else {
                                $x->{c} = $1;
                        }
                } elsif (/^parent ($sha1)$/o) {
                        $x->{p}->{$1} = 1;
                } elsif (s/^    //) {
                        $x->{m} ||= '';
                        $x->{m} .= $_;
                }
        }
        command_close_pipe($fh, $rl->{ctx});
        # End of input: the entry collected last is still pending and has
        # to be returned too.  (Comparing $x with $rl->{t} cannot detect
        # that, they are the same reference at this point.)
        $rl->{eof} = 1;
        $rl->{t} = { };
        return $x->{c} ? $x : undef;
}
1298
# Write $str followed by a newline to $file, replacing previous contents.
# When $mode is given the file is chmod-ed to it, masked by the umask.
# Croaks with the system error if opening, writing or closing fails.
sub s_to_file {
        my ($str, $file, $mode) = @_;
        open(my $out, '>', $file) or croak $!;
        print {$out} $str, "\n" or croak $!;
        close($out) or croak $!;
        chmod($mode & ~umask, $file) if defined $mode;
}
1306
# Return the entire contents of $file with all trailing whitespace
# (including newlines) removed.  Croaks if the file cannot be opened or
# closed.
sub file_to_s {
        my $file = shift;
        open(my $in, '<', $file) or croak "$!: file: $file\n";
        my $content = do { local $/; <$in> };
        close($in) or croak $!;
        $content =~ s/\s*$//s;
        return $content;
}
1316
# Croak if SVN revision $r already has a commit recorded in $REVDB.
sub assert_revision_unknown {
        my $r = shift;
        my $known = revdb_get($REVDB, $r);
        croak "$r = $known already exists! Why are we refetching it?"
                if $known;
}
1323
# Create the git commit for one SVN revision and advance the remote ref.
#
# $log_msg is a hash reference; the keys read here are revision, msg and the
# optional parents (array ref) and tree (when absent the tree is written
# from the $GIT_SVN_INDEX index).  @parents holds further parent candidates,
# each either a sha1 or "svn_revno=sha1", the latter only used when
# svn_revno equals the revision being committed.  The current value of
# refs/remotes/$GIT_SVN and unrelated commits sharing the same tree (from
# %tree_map) are added as parents as well.
#
# Updates refs/remotes/$GIT_SVN and $REVDB, prints "r<rev> = <sha1>" and
# returns the new commit's sha1.  Croaks or dies when any step fails.
sub git_commit {
        my ($log_msg, @parents) = @_;
        assert_revision_unknown($log_msg->{revision});
        map_tree_joins() if (@_branch_from && !%tree_map);

        my (@tmp_parents, @exec_parents, %seen_parent);
        if (my $lparents = $log_msg->{parents}) {
                @tmp_parents = @$lparents
        }
        # commit parents can be conditionally bound to a particular
        # svn revision via: "svn_revno=commit_sha1", filter them out here:
        foreach my $p (@parents) {
                next unless defined $p;
                if ($p =~ /^(\d+)=($sha1_short)$/o) {
                        if ($1 == $log_msg->{revision}) {
                                push @tmp_parents, $2;
                        }
                } else {
                        push @tmp_parents, $p if $p =~ /$sha1_short/o;
                }
        }
        my $tree = $log_msg->{tree};
        if (!defined $tree) {
                my $index = set_index($GIT_SVN_INDEX);
                $tree = command_oneline('write-tree');
                croak $? if $?;
                restore_index($index);
        }
        # just in case we clobber the existing ref, we still want that ref
        # as our parent:
        if (my $cur = verify_ref("refs/remotes/$GIT_SVN^0")) {
                chomp $cur;
                push @tmp_parents, $cur;
        }

        if (exists $tree_map{$tree}) {
                foreach my $p (@{$tree_map{$tree}}) {
                        my $skip;
                        foreach (@tmp_parents) {
                                # see if a common parent is found
                                my $mb = eval { command('merge-base', $_, $p) };
                                next if ($@ || $?);
                                $skip = 1;
                                last;
                        }
                        next if $skip;
                        my ($url_p, $r_p, $uuid_p) = cmt_metadata($p);
                        next if (($SVN->uuid eq $uuid_p) &&
                                                ($log_msg->{revision} > $r_p));
                        next if (defined $url_p && defined $SVN_URL &&
                                                ($SVN->uuid eq $uuid_p) &&
                                                ($url_p eq $SVN_URL));
                        push @tmp_parents, $p;
                }
        }
        # de-duplicate the parents while keeping their order
        foreach (@tmp_parents) {
                next if $seen_parent{$_};
                $seen_parent{$_} = 1;
                push @exec_parents, $_;
                # MAXPARENT is defined to 16 in commit-tree.c; stop as soon
                # as that many are collected (testing for "> 16" here
                # would let a 17th parent through):
                last if @exec_parents >= 16;
        }

        set_commit_env($log_msg);
        my @exec = ('git-commit-tree', $tree);
        push @exec, '-p', $_  foreach @exec_parents;
        defined(my $pid = open3(my $msg_fh, my $out_fh, '>&STDERR', @exec))
                                                                or croak $!;
        print $msg_fh $log_msg->{msg} or croak $!;
        unless ($_no_metadata) {
                print $msg_fh "\ngit-svn-id: $SVN_URL\@$log_msg->{revision} ",
                                        $SVN->uuid,"\n" or croak $!;
        }
        $msg_fh->flush == 0 or croak $!;
        close $msg_fh or croak $!;
        chomp(my $commit = do { local $/; <$out_fh> });
        close $out_fh or croak $!;
        waitpid $pid, 0;
        croak $? if $?;
        if ($commit !~ /^$sha1$/o) {
                die "Failed to commit, invalid sha1: $commit\n";
        }
        command_noisy('update-ref',"refs/remotes/$GIT_SVN",$commit);
        revdb_set($REVDB, $log_msg->{revision}, $commit);

        # this output is read via pipe, do not change:
        print "r$log_msg->{revision} = $commit\n";
        return $commit;
}
1413
# Count down towards the next repack.  When repacking is enabled ($_repack)
# and the counter $_repack_nr reaches zero, the counter is reset and
# "repack" is run with the whitespace-separated flags in $_repack_flags.
sub check_repack {
        return unless $_repack;
        return unless --$_repack_nr == 0;
        $_repack_nr = $_repack;
        # repack doesn't use any arguments with spaces in them, does it?
        command_noisy('repack', split(/\s+/, $_repack_flags));
}
1421
# Export the author and committer identity and date for the next commit.
# The SVN author in $log_msg->{author} ('(no author)' when missing or empty)
# is looked up in %users; without a mapping the author name is used as the
# name and "<author>@<repository uuid>" as the email address.
sub set_commit_env {
        my ($log_msg) = @_;
        my $author = $log_msg->{author};
        $author = '(no author)' unless (defined $author && length $author);

        my ($name, $email);
        if (defined $users{$author}) {
                ($name, $email) = @{$users{$author}};
        } else {
                $name = $author;
                $email = $author . '@' . $SVN->uuid;
        }
        @ENV{qw/GIT_AUTHOR_NAME GIT_COMMITTER_NAME/} = ($name) x 2;
        @ENV{qw/GIT_AUTHOR_EMAIL GIT_COMMITTER_EMAIL/} = ($email) x 2;
        $ENV{GIT_AUTHOR_DATE} = $ENV{GIT_COMMITTER_DATE} = $log_msg->{date};
}
1434
# Make sure $REVDB exists (creating $GIT_SVN_DIR and an empty db if it is
# not readable), then check for a leftover "$GIT_SVN-HEAD" ref: if that ref
# resolves but refs/remotes/$GIT_SVN does not, the user is told to run
# "rebuild --upgrade" and the program exits with status 1.
sub check_upgrade_needed {
        unless (-r $REVDB) {
                mkpath([$GIT_SVN_DIR]) unless -d $GIT_SVN_DIR;
                open my $fh, '>>',$REVDB or croak $!;
                close $fh;
        }
        my $old_head = eval {
                command([qw/rev-parse --verify/,"$GIT_SVN-HEAD^0"],
                        {STDERR => 0});
        };
        return unless $old_head;
        my $head = eval { command('rev-parse',"refs/remotes/$GIT_SVN") };
        return unless ($@ || !$head);
        fatal("Please run: $0 rebuild --upgrade\n");
}
1451
# fills %tree_map with a reverse mapping of trees to commits.  Useful
# for finding parents to commit on.
# Every ref in @_branch_from is walked in topological order; the walk of a
# ref stops at the first commit that was already recorded.
sub map_tree_joins {
        my %seen;
        foreach my $br (@_branch_from) {
                my $pipe = command_output_pipe(qw/rev-list
                                            --topo-order --pretty=raw/, $br);
                while (<$pipe>) {
                        next unless /^commit ($sha1)$/o;
                        my $commit = $1;

                        # if we've seen a commit,
                        # we've seen its parents
                        last if $seen{$commit};
                        # the tree line directly follows the commit line
                        my ($tree) = (<$pipe> =~ /^tree ($sha1)$/o);
                        defined $tree or
                                die "Failed to parse commit $commit\n";
                        push @{$tree_map{$tree}}, $commit;
                        $seen{$commit} = 1;
                }
                close $pipe;
        }
}
1477
# Replace @_branch_from with every ref known to "rev-parse --symbolic --all",
# warning on STDERR when explicit branch parameters are thereby discarded.
sub load_all_refs {
        print STDERR '--branch|-b parameters are ignored when ',
                "--branch-all-refs|-B is passed\n" if @_branch_from;

        # don't worry about rev-list on non-commit objects/tags,
        # it shouldn't blow up if a ref is a blob or tree...
        @_branch_from = command(qw/rev-parse --symbolic --all/);
}
1488
1489# '<svn username> = real-name <email address>' mapping based on git-svnimport:
sub load_authors {
        # Read the authors file named by $_authors into %users, keyed by
        # SVN user name with [real name, email] as the value.  Lines that
        # do not have the expected form are ignored.
        open my $authors, '<', $_authors or die "Can't open $_authors $!\n";
        while (my $line = <$authors>) {
                chomp $line;
                my ($user, $name, $email) = ($line =~
                        /^(\S+?|\(no author\))\s*=\s*(.+?)\s*<(.+)>\s*$/)
                                or next;
                $users{$user} = [$name, $email];
        }
        close $authors or croak $!;
}
1500
# Reads the authors file named by $_authors and fills %rusers with the
# reverse of the load_authors() mapping:
#   "real-name <email address>" => svn username
# Lines that do not match the authors-file format are ignored.
# Dies if the file cannot be opened, croaks if it cannot be closed.
sub rload_authors {
        open my $authors, '<', $_authors or die "Can't open $_authors $!\n";
        while (<$authors>) {
                chomp;
                # same pattern as load_authors(): the '(no author)' key
                # contains a space, so \S+? alone can never match it
                next unless /^(\S+?|\(no author\))\s*=\s*(.+?)\s*<(.+)>\s*$/;
                my ($user, $name, $email) = ($1, $2, $3);
                $rusers{"$name <$email>"} = $user;
        }
        close $authors or croak $!;
}
1511
# Calls the given code ref once for every ref under refs/remotes/ that
# has a "$GIT_DIR/svn/<id>/info/url" file.  The callback receives the id
# (the ref name with the refs/remotes/ prefix stripped) as its argument.
sub git_svn_each {
        my ($callback) = @_;
        foreach (command(qw/rev-parse --symbolic --all/)) {
                s#^refs/remotes/## or next;
                chomp;
                -f "$GIT_DIR/svn/$_/info/url" or next;
                $callback->($_);
        }
}
1521
# For every id visited by git_svn_each(), forks a child that points the
# global state at that id (via init_vars) and, unless $REVDB is already
# readable, creates it and calls rebuild().  The parent waits for each
# child and croaks with its wait status if that is non-zero.
sub migrate_revdb {
        my $upgrade = sub {
                my ($id) = @_;
                my $pid = fork;
                defined $pid or croak $!;
                if ($pid == 0) {
                        # child: the globals changed here never reach
                        # the parent process
                        $GIT_SVN = $ENV{GIT_SVN_ID} = $id;
                        init_vars();
                        exit 0 if -r $REVDB;
                        print "Upgrading svn => git mapping...\n";
                        mkpath([$GIT_SVN_DIR]) unless -d $GIT_SVN_DIR;
                        # append mode only makes sure the file exists
                        open my $fh, '>>',$REVDB or croak $!;
                        close $fh;
                        rebuild();
                        print "Done upgrading. You may now delete the ",
                                "deprecated $GIT_SVN_DIR/revs directory\n";
                        exit 0;
                }
                waitpid $pid, 0;
                croak $? if $?;
        };
        git_svn_each($upgrade);
}
1543
# Runs migrate_revdb() when $REVDB does not exist.  Then, if $GIT_DIR
# exists but "$GIT_DIR/svn" does not, creates "$GIT_DIR/svn" and moves
# every "$GIT_DIR/<id>" directory that has a non-empty info/url file
# (for ids found under refs/remotes/) to "$GIT_DIR/svn/<id>".
sub migration_check {
        -e $REVDB or migrate_revdb();
        return if -d "$GIT_DIR/svn";
        return unless -d $GIT_DIR;

        print "Upgrading repository...\n";
        if (!-d "$GIT_DIR/svn") {
                mkdir "$GIT_DIR/svn" or croak $!;
        }
        print "Data from a previous version of git-svn exists, but\n\t",
                                "$GIT_SVN_DIR\n\t(required for this version ",
                                "($VERSION) of git-svn) does not.\n";

        foreach my $ref (command(qw/rev-parse --symbolic --all/)) {
                $ref =~ s#^refs/remotes/## or next;
                chomp $ref;
                my $old_dir = "$GIT_DIR/$ref";
                -f "$old_dir/info/url" or next;
                # skip entries whose url file is unreadable or empty
                my $url = eval { file_to_s("$old_dir/info/url") };
                next unless $url;
                my $new_parent = dirname("$GIT_DIR/svn/$ref");
                -d $new_parent or mkpath([$new_parent]);
                rename $old_dir, "$GIT_DIR/svn/$ref" or croak "$!: $ref";
        }
        migrate_revdb() if (-d $GIT_SVN_DIR && !-w $REVDB);
        print "Done upgrading.\n";
}
1568
# Searches "$GIT_DIR/svn/$id/.rev_db" downwards from revision $r for the
# first revision that revdb_get() returns a true value for.  The search
# starts at $r itself when $eq_ok is true and at $r - 1 otherwise.
# Returns (revision, value) on success and (undef, undef) when the file
# is not readable or nothing is found above revision 0.
sub find_rev_before {
        my ($r, $id, $eq_ok) = @_;
        my $db = "$GIT_DIR/svn/$id/.rev_db";
        -r $db or return (undef,undef);
        my $rev = $r;
        --$rev unless $eq_ok;
        for (; $rev > 0; --$rev) {
                my $commit = revdb_get($db, $rev);
                return ($rev, $commit) if $commit;
        }
        return (undef, undef);
}
1582
# (Re)derives the per-remote globals from $GIT_SVN, which defaults to
# $ENV{GIT_SVN_ID} or 'git-svn' when it is not already set, and resets
# $SVN_URL and %tree_map.
sub init_vars {
        unless ($GIT_SVN) {
                $GIT_SVN = $ENV{GIT_SVN_ID} || 'git-svn';
        }
        $GIT_SVN_DIR = "$GIT_DIR/svn/$GIT_SVN";
        ($REVDB, $GIT_SVN_INDEX) =
                ("$GIT_SVN_DIR/.rev_db", "$GIT_SVN_DIR/index");
        $SVN_URL = undef;
        %tree_map = ();
}
1591
# Converts GetOpt::Long specs for use by git-config: takes a hash ref of
# { option spec => destination ref } and, for each spec, looks up the
# "svn.<key>" setting, where <key> is the leading [a-z-] part of the spec
# with the dashes removed.  Array destinations are filled from
# --get-all, scalar destinations from --get.  Specs ending in :i/=i are
# queried with --int; specs that do not end in [:=] followed by s, f or
# i are queried with --bool, and a boolean 'false' leaves the
# destination untouched.  Does nothing unless $GIT_DIR is a directory.
sub read_repo_config {
        return unless -d $GIT_DIR;
        my ($opts) = @_;
        foreach my $spec (keys %$opts) {
                my $dest = $opts->{$spec};
                my ($key) = ($spec =~ /^([a-z\-]+)/);
                $key =~ s/-//g;

                my $is_bool = ($spec !~ /[:=][sfi]$/);
                my @words = ('git-config');
                push @words, '--int' if ($spec =~ /[:=]i$/);
                push @words, '--bool' if $is_bool;
                my $arg = join ' ', @words;

                if (ref $dest eq 'ARRAY') {
                        chomp(my @values = `$arg --get-all svn.$key`);
                        @$dest = @values if @values;
                        next;
                }
                chomp(my $value = `$arg --get svn.$key`);
                next unless $value;
                next if $is_bool && $value eq 'false';
                $$dest = $value;
        }
}
1614
# Normalizes the repack settings when $_repack is defined: a
# non-positive $_repack becomes 1000, $_repack_nr is set to $_repack,
# and $_repack_flags defaults to '-d'.
sub set_default_vals {
        if (defined $_repack) {
                if ($_repack <= 0) {
                        $_repack = 1000;
                }
                $_repack_nr = $_repack;
                $_repack_flags = '-d' unless $_repack_flags;
        }
}
1622
# Parses a grafts file and returns two hash refs:
#   grafts:   commit => { token => 1 } for every whitespace-separated
#             token on the commit's line (the commit itself included)
#   comments: commit => [ the non-graft lines that preceded it ]; lines
#             left over after the last graft are stored under 'END'
# A file that cannot be opened yields two empty hashes.
sub read_grafts {
        my ($gr_file) = @_;
        my (%grafts, %comments);
        open my $fh, '<', $gr_file or return (\%grafts, \%comments);

        my @pending; # non-graft lines seen since the last graft line
        while (my $line = <$fh>) {
                unless ($line =~ /^($sha1)\s+/) {
                        push @pending, $line;
                        next;
                }
                my $commit = $1;
                if (@pending) {
                        $comments{$commit} = [ @pending ];
                        @pending = ();
                }
                $grafts{$commit}->{$_} = 1 foreach split /\s+/, $line;
        }
        close $fh or croak $!;
        $comments{'END'} = [ @pending ] if @pending;
        return (\%grafts, \%comments);
}
1647
# Writes the grafts file $gr_file (truncating it) from the structures
# returned by read_grafts():
#   $grafts   - commit => { parent => flag }
#   $comments - commit (or 'END') => [ lines to print before that entry ]
# For each commit the real parents are read from `cat-file commit` and
# merged into the graft's parent set.  A graft line is only written when
# the resulting parent set differs from the real parents.
# Croaks when the file cannot be opened or closed.
sub write_grafts {
        my ($grafts, $comments, $gr_file) = @_;

        open my $fh, '>', $gr_file or croak $!;
        foreach my $c (sort keys %$grafts) {
                # saved comment lines are written even if the graft
                # itself ends up being dropped below
                if ($comments->{$c}) {
                        print $fh $_ foreach @{$comments->{$c}};
                }
                my $p = $grafts->{$c};
                my %x; # real parents
                delete $p->{$c}; # commits are not self-reproducing...
                my $ch = command_output_pipe(qw/cat-file commit/, $c);
                while (<$ch>) {
                        if (/^parent ($sha1)/) {
                                # real parents always become part of
                                # the graft, with their flag set to 1
                                $x{$1} = $p->{$1} = 1;
                        } else {
                                # stop at the first line that does not
                                # start with a non-space character
                                last unless /^\S/;
                        }
                }
                close $ch; # breaking the pipe

                # if real parents are the only ones in the grafts, drop it
                next if join(' ',sort keys %$p) eq join(' ',sort keys %x);

                # Compare every pair of grafted parents; real parents
                # (%del starts as a copy of %x) and entries whose flag
                # is 2 are never considered.
                # NOTE(review): the meaning of flag value 2 is not
                # visible in this sub -- confirm against the callers.
                my (@ip, @jp, $mb);
                my %del = %x;
                @ip = @jp = keys %$p;
                foreach my $i (@ip) {
                        next if $del{$i} || $p->{$i} == 2;
                        foreach my $j (@jp) {
                                next if $i eq $j || $del{$j} || $p->{$j} == 2;
                                # a failing merge-base is not fatal,
                                # the pair is simply skipped
                                $mb = eval { command('merge-base', $i, $j) };
                                next unless $mb;
                                chomp $mb;
                                next if $x{$mb};
                                # when the merge base is one member of
                                # the pair, the other member is removed
                                if ($mb eq $j) {
                                        delete $p->{$i};
                                        $del{$i} = 1;
                                } elsif ($mb eq $i) {
                                        delete $p->{$j};
                                        $del{$j} = 1;
                                }
                        }
                }

                # if real parents are the only ones in the grafts, drop it
                next if join(' ',sort keys %$p) eq join(' ',sort keys %x);

                print $fh $c, ' ', join(' ', sort keys %$p),"\n";
        }
        # lines that followed the last graft in the file that was read
        if ($comments->{'END'}) {
                print $fh $_ foreach @{$comments->{'END'}};
        }
        close $fh or croak $!;
}
1703
# Recursively scans the entries of directory $p.  Every entry with a
# readable info/url file is recorded in $l_map as
#   $l_map->{repository}->{path} = "<prefix>/<entry name>"
# where (repository, path) comes from repo_path_split() on the stored
# URL.  Other directories are descended into afterwards, using their
# path relative to "$GIT_DIR/svn/" as the new prefix.
sub read_url_paths_all {
        my ($l_map, $pfx, $p) = @_;
        my @subdirs;
        foreach my $entry (glob("$p/*")) {
                if (-r "$entry/info/url") {
                        $pfx .= '/' if $pfx && $pfx !~ m!/$!;
                        my $id = $pfx . basename($entry);
                        my $url = file_to_s("$entry/info/url");
                        my ($repo, $path) = repo_path_split($url);
                        $l_map->{$repo}->{$path} = $id;
                } elsif (-d $entry) {
                        push @subdirs, $entry;
                }
        }
        foreach my $dir (@subdirs) {
                (my $rel = $dir) =~ s!^\Q$GIT_DIR\E/svn/!!o;
                read_url_paths_all($l_map, $rel, $dir);
        }
}
1724
# Returns { repository => { path => id } } for the ids visited by
# git_svn_each().  This one only gets ids that have been imported, not
# new ones.
sub read_url_paths {
        my %l_map;
        my $record = sub {
                my ($id) = @_;
                my $url = file_to_s("$GIT_DIR/svn/$id/info/url");
                my ($repo, $path) = repo_path_split($url);
                $l_map{$repo}->{$path} = $id;
        };
        git_svn_each($record);
        return \%l_map;
}
1735
# Splits a "git-svn-id: <url>@<rev> <uuid>" line into (url, rev, uuid).
# When that form does not yield all three parts, the older
# "git-svn-id: <rev>@<uuid>" form is tried for rev and uuid.
# A false argument returns (undef, undef, undef).
sub extract_metadata {
        my ($id) = @_;
        return (undef, undef, undef) unless $id;
        my ($url, $rev, $uuid);
        if ($id =~ /^git-svn-id:\s(\S+?)\@(\d+)
                                                        \s([a-f\d\-]+)$/x) {
                ($url, $rev, $uuid) = ($1, $2, $3);
        }
        unless (defined $rev && $uuid && $url) {
                # some of the original repositories I made had
                # identifiers like this:
                ($rev, $uuid) = ($id =~/^git-svn-id:\s(\d+)\@([a-f\d\-]+)/);
        }
        return ($url, $rev, $uuid);
}
1747
# Returns extract_metadata() for the last "git-svn-id: " line found in
# the `cat-file commit` output of the given commit.
sub cmt_metadata {
        my ($commit) = @_;
        my @id_lines = grep(/^git-svn-id: /,
                            command(qw/cat-file commit/, $commit));
        return extract_metadata($id_lines[-1]);
}
1752
# Returns the committer timestamp of $cmt with the committer's timezone
# offset applied (added for '+' zones, subtracted for '-' zones).
# Dies when no committer line is found.
sub get_commit_time {
        my ($cmt) = @_;
        my $fh = command_output_pipe(qw/rev-list --pretty=raw -n1/, $cmt);
        while (my $line = <$fh>) {
                next unless $line =~
                        /^committer\s(?:.+) (\d+) ([\-\+]?\d+)$/;
                my ($secs, $tz) = ($1, $2);
                my $sign = substr($tz, 0, 1);
                if ($sign eq '+') {
                        $secs += tz_to_s_offset(substr($tz, 1));
                } elsif ($sign eq '-') {
                        $secs -= tz_to_s_offset(substr($tz, 1));
                }
                close $fh;
                return $secs;
        }
        die "Can't get commit time for commit: $cmt\n";
}
1769
# Converts an unsigned timezone string such as "0530" into an offset:
# the last two digits are multiplied by 60, the digits before them by
# 3600, and the sum is returned.
sub tz_to_s_offset {
        my ($tz) = @_;
        # strip the trailing two digits off; what is left are the hours
        $tz =~ s/(\d\d)$//;
        my ($hours, $minutes) = ($tz, $1);
        return ($minutes * 60) + ($hours * 3600);
}
1775
# Chooses the pager (adapted from pager.c): a true $_pager wins, then
# $ENV{GIT_PAGER}, then $ENV{PAGER}.  When the result is undefined,
# 'less' is used; an empty string or 'cat' turns $_pager into undef.
sub config_pager {
        $_pager = $ENV{GIT_PAGER} || $ENV{PAGER} unless $_pager;
        if (defined $_pager) {
                undef $_pager if ($_pager eq '' || $_pager eq 'cat');
        } else {
                $_pager = 'less';
        }
}
1785
# Pipes the rest of this program's output through the pager $_pager.
#
# Does nothing when no pager is configured (config_pager() sets $_pager
# to undef for an empty pager or 'cat'), when STDOUT is not a terminal,
# or when the pipe cannot be created.  Otherwise the process forks:
#   - the child gets its STDOUT redirected into the pipe and returns to
#     the caller, so it carries on with the real work;
#   - the parent reads the pipe on STDIN and exec()s the pager, so it
#     never returns.
# $ENV{LESS} defaults to 'FRSX' when it is not already set.
# Croaks when fork, the redirections or exec fail.
sub run_pager {
        # without this guard an undefined pager would reach exec()
        return unless defined $_pager && -t *STDOUT;
        pipe my $rfd, my $wfd or return;
        defined(my $pid = fork) or croak $!;
        if (!$pid) {
                open STDOUT, '>&', $wfd or croak $!;
                return;
        }
        open STDIN, '<&', $rfd or croak $!;
        $ENV{LESS} ||= 'FRSX';
        exec $_pager or croak "Can't run pager: $! ($_pager)\n";
}
1798
# Fills the hash ref $dest from an author string and a timestamp:
#   a_raw - author with leading/trailing whitespace removed
#   a     - %rusers entry for the author (only consulted when $_authors
#           is set); otherwise the part before '@' of a trailing
#           <address>
#   t, tz - the timestamp and timezone as passed in
#   t_utc - $t with the timezone offset added ('+') or subtracted ('-')
sub get_author_info {
        my ($dest, $author, $t, $tz) = @_;
        $author =~ s/(?:^\s*|\s*$)//g;
        my $svn_user;
        $svn_user = $rusers{$author} || undef if $_authors;
        unless ($svn_user) {
                ($svn_user) = ($author =~ /<([^>]+)\@[^>]+>$/);
        }
        # $tz is stored with its sign; the sign is only stripped below
        @{$dest}{qw/a_raw t tz a/} = ($author, $t, $tz, $svn_user);

        # Date::Parse isn't in the standard Perl distro :(
        my $adjusted = $t;
        if ($tz =~ s/^\+//) {
                $adjusted += tz_to_s_offset($tz);
        } elsif ($tz =~ s/^\-//) {
                $adjusted -= tz_to_s_offset($tz);
        }
        $dest->{t_utc} = $adjusted;
}
1821
# Decides what to do with one log entry $c for the range $r_min..$r_max
# and returns false when the caller should stop, true otherwise:
#   - single revision (min == max): show it and stop when it is $c,
#     otherwise keep going;
#   - ascending range (min < max): push $c onto @$defer, because the
#     print order needs to be reversed;
#   - descending range: skip entries for which $r_min < r or $r_max > r;
#   - anything else is shown immediately.
# $_limit, when defined, is decremented for every entry that is about
# to be shown or deferred; once it drops below zero nothing more is
# accepted.
sub process_commit {
        my ($c, $r_min, $r_max, $defer) = @_;
        if (defined $r_min && defined $r_max) {
                if ($r_min == $r_max) {
                        return 1 if $r_min != $c->{r};
                        show_commit($c);
                        return 0;
                }
                if ($r_min < $r_max) {
                        # we need to reverse the print order
                        return 0 if (defined $_limit && --$_limit < 0);
                        push @$defer, $c;
                        return 1;
                }
                return 1 if ($r_min < $c->{r} || $r_max > $c->{r});
        }
        return 0 if (defined $_limit && --$_limit < 0);
        show_commit($c);
        return 1;
}
1845
# Prints one log entry $c.
#
# With $_oneline set, a single "r<rev> | [<commit> | ]<first log line>"
# line is printed; leading blank lines of the log ($c->{l}) are removed
# first, and a bare newline is printed when there is no non-blank line.
# $_l_fmt, the pack() template used to pad the revision number, is
# initialised from the width of the first revision that is shown.
# Without $_oneline the work is delegated to show_commit_normal().
sub show_commit {
        my $c = shift;
        if ($_oneline) {
                my $x = "\n";
                if (my $l = $c->{l}) {
                        # stop once the list is empty: an undefined
                        # element matches /^\s*$/ as well, so a log
                        # made of blank lines only would loop forever
                        shift @$l while (@$l && $l->[0] =~ /^\s*$/);
                        $x = $l->[0] if @$l;
                }
                $_l_fmt ||= 'A' . length($c->{r});
                print 'r',pack($_l_fmt, $c->{r}),' | ';
                print "$c->{c} | " if $_show_commit;
                print $x;
        } else {
                show_commit_normal($c);
        }
}
1862
# Prints the "Changed paths:" header followed by the lines stored in
# $c->{changed}; prints nothing when that entry is false.
sub show_commit_changed_paths {
        my ($c) = @_;
        my $changed = $c->{changed} or return;
        print "Changed paths:\n", @$changed;
}
1868
# Prints one log entry $c in the multi-line format: a dashed separator,
# a header with revision, optional commit id, author, date and line
# count, the changed paths, the log lines, and finally the 'raw' and
# 'diff' sections when $c has them.
sub show_commit_normal {
        my ($c) = @_;
        my $when = strftime("%Y-%m-%d %H:%M:%S %z (%a, %d %b %Y)",
                            localtime($c->{t_utc}));
        print '-' x72, "\nr$c->{r} | ";
        print "$c->{c} | " if $_show_commit;
        print "$c->{a} | ", $when, ' | ';

        my $log = $c->{l};
        if (!$log) {
                print "1 line\n";
                show_commit_changed_paths($c);
                print "\n";
        } else {
                # squeeze a run of trailing "\n" lines down to one
                pop @$log while ($log->[$#$log] eq "\n" && $#$log > 0
                                          && $log->[($#$log - 1)] eq "\n");
                my $count = scalar @$log;
                if ($count == 0) {
                        print "1 line\n\n\n";
                } else {
                        my $summary = ($count == 1) ? '1 line'
                                                    : $count . ' lines';
                        print $summary, "\n";
                        show_commit_changed_paths($c);
                        print "\n";
                        print @$log;
                }
        }
        foreach my $section (qw/raw diff/) {
                my $lines = $c->{$section} or next;
                print "\n";
                print @$lines;
        }
}
1909
1910package Git::SVN;
1911use strict;
1912use warnings;
1913use vars qw/$default/;
1914use Carp qw/croak/;
1915use File::Path qw/mkpath/;
1916use IPC::Open3;
1917
# properties that we do not log (filled at compile time):
my %SKIP_PROP;
BEGIN {
        $SKIP_PROP{$_} = 1 foreach qw/svn:wc:ra_dav:version-url
                                      svn:special svn:executable
                                      svn:entry:committed-rev
                                      svn:entry:last-author
                                      svn:entry:uuid
                                      svn:entry:committed-date/;
}
1928
# Constructor for a remote that is being set up: creates the object via
# _new(), makes sure "<dir>/info" exists, stores $url (with trailing
# slashes stripped) in "<dir>/info/url" when one is given, and creates
# the file at $self->{db_path} if it does not exist yet.
# Returns the new object.
sub init {
        my ($class, $id, $url) = @_;
        my $self = _new($class, $id);
        my $info_dir = "$self->{dir}/info";
        mkpath([$info_dir]);
        if (defined $url) {
                $url =~ s!/+$!!; # strip trailing slash
                s_to_file($url, "$info_dir/url");
        }
        $self->{url} = $url;
        # append mode: creates the file without touching its content
        open my $db, '>>', $self->{db_path} or croak $!;
        close $db or croak $!;
        return $self;
}
1942
# Constructor for an existing remote: creates the object via _new() and
# loads its URL from "<dir>/info/url".
sub new {
        my ($class, $id) = @_;
        my $self = _new($class, $id);
        my $url_file = "$self->{dir}/info/url";
        $self->{url} = file_to_s($url_file);
        return $self;
}
1949
# Returns the name of the remote ref that belongs to this object's id.
sub refname {
        my ($self) = @_;
        return "refs/remotes/$self->{id}";
}
1951
# Returns the Git::SVN::Ra object for $self->{url}; it is created on
# first use and cached in $self->{ra}.
sub ra {
        my ($self) = @_;
        unless ($self->{ra}) {
                $self->{ra} = Git::SVN::Ra->new($self->{url});
        }
        $self->{ra};
}
1956
# Fetches this object's ref from the remote named by $::_cp_remote
# (default 'origin') when `ls-remote` reports it there.  A missing ref
# is fatal only when $::_cp_remote was given and $::_upgrade is not set.
sub copy_remote_ref {
        my ($self) = @_;
        my $origin = $::_cp_remote || 'origin';
        my $ref = $self->refname;
        if (command('ls-remote', $origin, $ref)) {
                command_noisy('fetch', $origin, "$ref:$ref");
        } elsif ($::_cp_remote && !$::_upgrade) {
                die "Unable to find remote reference: $ref on $origin\n";
        }
}
1967
# Writes the svn:ignore property of directory $path at revision $r to
# $fh, then recurses into every subdirectory (in sorted order).  Each
# directory gets a "# <path>" comment line, and every ignore pattern is
# prefixed with "/<path>/", where <path> has the leading
# "<ra svn_path>/" removed.
sub traverse_ignore {
        my ($self, $fh, $path, $r) = @_;
        $path =~ s#^/+##g;
        my ($dirent, undef, $props) = $self->ra->get_dir($path, $r);
        (my $p = $path) =~ s#^\Q$self->{ra}->{svn_path}\E/##;
        my $at_root = (length $p == 0);
        print $fh ($at_root ? "\n# /\n" : "\n# $p\n");

        my $s = $props->{'svn:ignore'};
        if ($s) {
                # one pattern per line, no trailing newline
                $s =~ s/[\r\n]+/\n/g;
                chomp $s;
                if ($at_root) {
                        $s =~ s#\n#\n/$p#g;
                        print $fh "/$s\n";
                } else {
                        $s =~ s#\n#\n/$p/#g;
                        print $fh "/$p/$s\n";
                }
        }
        foreach my $name (sort keys %$dirent) {
                next unless $dirent->{$name}->kind == $SVN::Node::dir;
                $self->traverse_ignore($fh, "$path/$name", $r);
        }
}
1991
# returns the newest SVN revision number and newest commit SHA1
#
# Lookup order:
#   1. the values cached in $self->{last_rev} / $self->{last_commit};
#   2. the commit the ref points at, with the revision taken from the
#      second element returned by cmt_metadata();
#   3. a backwards scan of the file at $self->{db_path}.
# Results from 2. and 3. are cached on $self.  Returns (undef, undef)
# when the scan runs out of readable records; croaks when the file
# cannot be opened or closed.
sub last_rev_commit {
        my ($self) = @_;
        if (defined $self->{last_rev} && defined $self->{last_commit}) {
                return ($self->{last_rev}, $self->{last_commit});
        }
        my $c = verify_ref($self->refname.'^0');
        if (defined $c && length $c) {
                my $rev = (cmt_metadata($c))[1];
                if (defined $rev) {
                        ($self->{last_rev}, $self->{last_commit}) = ($rev, $c);
                        return ($rev, $c);
                }
        }
        # The file is read in 41-byte steps, starting with the last 41
        # bytes.
        # NOTE(review): 41 is presumably a 40-character sha1 plus a
        # newline per revision -- confirm against the rev_db writer.
        my $offset = -41; # from tail
        my $rl;
        open my $fh, '<', $self->{db_path} or
                                 croak "$self->{db_path} not readable: $!\n";
        seek $fh, $offset, 2;
        $rl = readline $fh;
        defined $rl or return (undef, undef);
        chomp $rl;
        # walk backwards one record at a time until the record equals $c
        # or the file position is 0
        # NOTE(review): $c may be undefined or empty here when
        # verify_ref() found nothing -- confirm that is intended.
        while ($c ne $rl && tell $fh != 0) {
                $offset -= 41;
                seek $fh, $offset, 2;
                $rl = readline $fh;
                defined $rl or return (undef, undef);
                chomp $rl;
        }
        # the position just behind the record that was read last is
        # turned into that record's index, which is used as the revision
        my $rev = tell $fh;
        croak $! if ($rev < 0);
        $rev =  ($rev - 41) / 41;
        close $fh or croak $!;
        ($self->{last_rev}, $self->{last_commit}) = ($rev, $c);
        return ($rev, $c);
}
2028
# Translates the --revision argument ($::_revision) into the pair
# (first revision, last revision) that should be fetched.
#
# $base is the last revision that has already been imported, or undef
# when nothing has been imported yet.  Supported forms:
#   (unset), BASE:HEAD  ($base + 1, HEAD), or (0, HEAD) without a base
#   N:M                 (N, M)
#   N                   (N, N)
#   BASE:N              ($base + 1, N), or (0, N) without a base
#   N:HEAD              (N, HEAD)
# HEAD is the latest revision number reported by the repository.
# Dies for any other form.
sub parse_revision {
        my ($self, $base) = @_;
        my $head = $self->ra->get_latest_revnum;
        if (!defined $::_revision || $::_revision eq 'BASE:HEAD') {
                return ($base + 1, $head) if (defined $base);
                return (0, $head);
        }
        return ($1, $2) if ($::_revision =~ /^(\d+):(\d+)$/);
        return ($::_revision, $::_revision) if ($::_revision =~ /^\d+$/);
        if ($::_revision =~ /^BASE:(\d+)$/) {
                return ($base + 1, $1) if (defined $base);
                # no base yet: start from 0, but still honor the upper
                # bound that was asked for instead of going up to HEAD
                return (0, $1);
        }
        return ($1, $head) if ($::_revision =~ /^(\d+):HEAD$/);
        die "revision argument: $::_revision not understood by git-svn\n",
                "Try using the command-line svn client instead\n";
}
2046
# Runs the code ref $sub with $ENV{GIT_INDEX_FILE} pointing at this
# object's index file ($self->{index}).
#
# The variable is localized, so the caller's setting (or its absence)
# is back in place when this sub is left -- also when $sub dies.
# $sub is called in list context with ($self, $sub) as its arguments,
# the same values the previous `&$sub;` call form handed over.
# Returns everything $sub returned in list context and its first
# return value in scalar context.
sub tmp_index_do {
        my ($self, $sub) = @_;
        local $ENV{GIT_INDEX_FILE} = $self->{index};
        my @ret = $sub->($self, $sub);
        wantarray ? @ret : $ret[0];
}
2059
# Makes sure this object's index file matches the tree of the commit
# $treeish.  The index is created with read-tree when it does not
# exist; when write-tree then disagrees with the commit's tree, the
# index is deleted and read again.  A mismatch that survives this is
# fatal.
sub assert_index_clean {
        my ($self, $treeish) = @_;

        my $verify = sub {
                -e $self->{index} or command_noisy('read-tree', $treeish);
                my $have = command_oneline('write-tree');
                my ($want) = (command(qw/cat-file commit/, $treeish) =~
                              /^tree ($::sha1)/mo);
                if ($want ne $have) {
                        # rebuild the index from scratch and check again
                        unlink $self->{index} or croak $!;
                        command_noisy('read-tree', $treeish);
                }
                $have = command_oneline('write-tree');
                if ($want ne $have) {
                        ::fatal("trees ($treeish) $want != $have\n",
                                "Something is seriously wrong...\n");
                }
        };
        $self->tmp_index_do($verify);
}
2079
# Returns the list of parents for the commit about to be created for
# $log_msg, without duplicates and in this order:
#   1. the entries of @parents that apply (see below),
#   2. the commit this object's ref currently points at, if any,
#   3. the parents listed in $log_msg->{parents}.
# Entries of @parents are either plain (possibly abbreviated) sha1s or
# "svn_revno=commit_sha1" pairs; a pair only applies when svn_revno
# equals $log_msg->{revision}.  Undefined and malformed entries are
# ignored, as are false values among the collected candidates.
# Dies when more than 16 distinct parents remain.
sub get_commit_parents {
        my ($self, $log_msg, @parents) = @_;
        my @candidates;
        # commit parents can be conditionally bound to a particular
        # svn revision via: "svn_revno=commit_sha1", filter them out here:
        foreach my $p (@parents) {
                next unless defined $p;
                if ($p =~ /^(\d+)=($::sha1_short)$/o) {
                        push @candidates, $2 if $1 == $log_msg->{revision};
                } elsif ($p =~ /^$::sha1_short$/o) {
                        push @candidates, $p;
                }
        }
        if (my $cur = verify_ref($self->refname.'^0')) {
                push @candidates, $cur;
        }
        push @candidates, @{$log_msg->{parents} || []};

        # remove duplicates first, so that a repeated parent can never
        # be mistaken for one that did not fit
        my (%seen, @ret);
        foreach my $p (@candidates) {
                next if !$p || $seen{$p}++;
                push @ret, $p;
        }
        # MAXPARENT is defined to 16 in commit-tree.c:
        if (@ret > 16) {
                die "r$log_msg->{revision}: No room for parents:\n\t",
                    join("\n\t", @ret[16 .. $#ret]), "\n";
        }
        @ret;
}
2110
# Creates the file at $self->{db_path} (and its directory) when it is
# not readable, then checks for leftovers of an older layout: when the
# "<id>-HEAD" ref exists but this object's remote ref cannot be
# resolved, the user is told to run "rebuild --upgrade" and the program
# exits.
sub check_upgrade_needed {
        my ($self) = @_;
        if (!-r $self->{db_path}) {
                -d $self->{dir} or mkpath([$self->{dir}]);
                # append mode: only makes sure that the file exists
                open my $fh, '>>', $self->{db_path} or croak $!;
                close $fh;
        }
        return unless verify_ref($self->{id}.'-HEAD^0');
        my $head = verify_ref($self->refname.'^0');
        if ($@ || !$head) {
                # fatal() lives in package main, so it has to be called
                # fully qualified from inside this package
                ::fatal("Please run: $0 rebuild --upgrade\n");
        }
}
2124
# Creates the git commit for the SVN revision described by $log_msg and
# returns its sha1.
#
# $log_msg is a hash ref; this sub reads its revision, author, date, log
# and (optional) tree entries.  @parents are extra parent candidates
# that are passed on to get_commit_parents().
# Croaks when the revision already has an entry in the rev_db or when
# talking to git-commit-tree fails; dies when the tree or the resulting
# commit is not a valid sha1.
sub do_git_commit {
        my ($self, $log_msg, @parents) = @_;
        if (my $c = $self->rev_db_get($log_msg->{revision})) {
                croak "$log_msg->{revision} = $c already exists! ",
                      "Why are we refetching it?\n";
        }
        # author and committer are given the same identity and date
        my ($name, $email) = author_name_email($log_msg->{author}, $self->ra);
        $ENV{GIT_AUTHOR_NAME} = $ENV{GIT_COMMITTER_NAME} = $name;
        $ENV{GIT_AUTHOR_EMAIL} = $ENV{GIT_COMMITTER_EMAIL} = $email;
        $ENV{GIT_AUTHOR_DATE} = $ENV{GIT_COMMITTER_DATE} = $log_msg->{date};

        # without an explicit tree, write one from this object's index
        my $tree = $log_msg->{tree};
        if (!defined $tree) {
                $tree = $self->tmp_index_do(sub {
                                            command_oneline('write-tree') });
        }
        die "Tree is not a valid sha1: $tree\n" if $tree !~ /^$::sha1$/o;

        my @exec = ('git-commit-tree', $tree);
        foreach ($self->get_commit_parents($log_msg, @parents)) {
                push @exec, '-p', $_;
        }
        # the commit message goes to the child's stdin, its stdout is
        # read back below and its stderr is shared with ours
        defined(my $pid = open3(my $msg_fh, my $out_fh, '>&STDERR', @exec))
                                                                   or croak $!;
        print $msg_fh $log_msg->{log} or croak $!;
        # $self->{ra} has been populated by the $self->ra call above
        print $msg_fh "\ngit-svn-id: $self->{ra}->{url}\@$log_msg->{revision}",
                      " ", $self->ra->uuid,"\n" or croak $!;
        # NOTE(review): presumably relies on flush returning
        # "0 but true" on success -- confirm
        $msg_fh->flush == 0 or croak $!;
        close $msg_fh or croak $!;
        # slurp everything the child printed
        chomp(my $commit = do { local $/; <$out_fh> });
        close $out_fh or croak $!;
        waitpid $pid, 0;
        croak $? if $?;
        if ($commit !~ /^$::sha1$/o) {
                die "Failed to commit, invalid sha1: $commit\n";
        }

        # record the new commit: ref, rev_db and the cache on $self
        command_noisy('update-ref',$self->refname, $commit);
        $self->rev_db_set($log_msg->{revision}, $commit);

        $self->{last_rev} = $log_msg->{revision};
        $self->{last_commit} = $commit;
        print "r$log_msg->{revision} = $commit\n";
        return $commit;
}
2170
# Drives an SVN::Git::Fetcher editor through do_update() from the last
# fetched revision (or from $rev itself when nothing has been committed
# yet) up to $rev, and returns the log entry built by make_log_entry().
# $paths is accepted but not used.
sub do_fetch {
        my ($self, $paths, $rev) = @_; #, $author, $date, $msg) = @_;
        my $editor = SVN::Git::Fetcher->new($self);
        my $from_rev = $rev;
        my @parents;
        if (my $prev_commit = $self->{last_commit}) {
                $from_rev = $self->{last_rev};
                $editor->{c} = $prev_commit;
                @parents = ($prev_commit);
        }
        $self->ra->do_update($from_rev, $rev, '', 1, $editor)
                or die "SVN connection failed somewhere...\n";
        $self->make_log_entry($rev, \@parents, $editor);
}
2187
# Appends a record of everything in revision $rev that is not tracked
# in git to the handle $fh.  $untracked is a hash ref that may contain:
#   empty                         - path => true (added) / false (removed)
#   dir_prop, file_prop           - path => { property => value or undef }
#   absent_file, absent_directory - parent => [ paths ]
# All paths, property names and values are written uri_encode()d.
# Empty directories and absent entries additionally produce a warning.
# Properties listed in %SKIP_PROP are not logged.
# Croaks when writing to $fh fails.
sub write_untracked {
        my ($self, $rev, $fh, $untracked) = @_;
        my $h;
        print $fh "r$rev\n" or croak $!;
        $h = $untracked->{empty};
        foreach (sort keys %$h) {
                my $act = $h->{$_} ? '+empty_dir' : '-empty_dir';
                print $fh "  $act: ", uri_encode($_), "\n" or croak $!;
                warn "W: $act: $_\n";
        }
        foreach my $t (qw/dir_prop file_prop/) {
                $h = $untracked->{$t} or next;
                foreach my $path (sort keys %$h) {
                        my $ppath = $path eq '' ? '.' : $path;
                        foreach my $prop (sort keys %{$h->{$path}}) {
                                # use this package's own skip list
                                next if $SKIP_PROP{$prop};
                                my $v = $h->{$path}->{$prop};
                                if (defined $v) {
                                        print $fh "  +$t: ",
                                                  uri_encode($ppath), ' ',
                                                  uri_encode($prop), ' ',
                                                  uri_encode($v), "\n"
                                                  or croak $!;
                                } else {
                                        # an undefined value is logged
                                        # with a '-' marker and no value
                                        print $fh "  -$t: ",
                                                  uri_encode($ppath), ' ',
                                                  uri_encode($prop), "\n"
                                                  or croak $!;
                                }
                        }
                }
        }
        foreach my $t (qw/absent_file absent_directory/) {
                $h = $untracked->{$t} or next;
                foreach my $parent (sort keys %$h) {
                        foreach my $path (sort @{$h->{$parent}}) {
                                print $fh "  $t: ",
                                      uri_encode("$parent/$path"), "\n"
                                      or croak $!;
                                warn "W: $t: $parent/$path ",
                                     "Insufficient permissions?\n";
                        }
                }
        }
}
2233
# Builds and returns the log entry (a hash ref) for revision $rev from
# its revision properties: svn:author, svn:date and svn:log become the
# author, date and log entries (date and author are passed through
# parse_svn_date() and check_author(), and the log gets a trailing
# newline).  Every other revision property, as well as the contents of
# $untracked, is appended to "<dir>/unhandled.log".
sub make_log_entry {
        my ($self, $rev, $parents, $untracked) = @_;
        my $rp = $self->ra->rev_proplist($rev);
        my $entry = { parents => $parents || [], revision => $rev,
                      revprops => $rp, log => '' };
        open my $un, '>>', "$self->{dir}/unhandled.log" or croak $!;
        $self->write_untracked($rev, $un, $untracked);
        foreach my $prop (sort keys %$rp) {
                my $value = $rp->{$prop};
                if ($prop =~ /^svn:(author|date|log)$/) {
                        $entry->{$1} = $value;
                        next;
                }
                print $un "  rev_prop: ", uri_encode($prop), ' ',
                          uri_encode($value), "\n";
        }
        close $un or croak $!;
        $entry->{date} = parse_svn_date($entry->{date});
        $entry->{author} = check_author($entry->{author});
        $entry->{log} .= "\n";
        return $entry;
}
2256
# Fetches and commits every revision in the range that
# parse_revision() returns for the last imported revision.  The range
# is worked through in windows of $inc + 1 revisions: get_log() only
# collects the revision numbers of a window, each of which is then
# fetched and committed with @parents as extra parent candidates.
# While this runs, skip_unknown_revs() is installed as the SVN error
# handler; the previous handler is put back at the end.
sub fetch {
        my ($self, @parents) = @_;
        my ($last_rev, $last_commit) = $self->last_rev_commit;
        my ($base, $head) = $self->parse_revision($last_rev);
        return if ($base > $head);
        $self->assert_index_clean($last_commit) if defined $last_commit;

        my $inc = 1000;
        my $min = $base;
        my $max = $base + $inc;
        $max = $head if ($head < $max);

        my $saved_handler = $SVN::Error::handler;
        $SVN::Error::handler = \&skip_unknown_revs;
        for (;;) {
                my @revs;
                $self->ra->get_log([''], $min, $max, 0, 1, 1, sub {
                        my (undef, $rev) = @_;
                        push @revs, $rev });
                foreach my $rev (@revs) {
                        my $log_entry = $self->do_fetch(undef, $rev);
                        $self->do_git_commit($log_entry, @parents);
                }
                last if $max >= $head;
                # move on to the next window, clamped to $head
                $min = $max + 1;
                $max += $inc;
                $max = $head if ($max > $head);
        }
        $SVN::Error::handler = $saved_handler;
}
2285
# Callback handed to the commit editor by set_tree().  For now it
# always re-fetches from SVN, passing "$rev=$tree" so that $tree becomes
# a parent of the commit created for revision $rev.
sub set_tree_cb {
        my ($self, $log_entry, $tree, $rev, $date, $author) = @_;
        # TODO: enable and test optimized commits:
        my $optimized = 0;
        unless ($optimized && $rev == ($self->{last_rev} + 1)) {
                return $self->fetch("$rev=$tree");
        }
        $log_entry->{revision} = $rev;
        $log_entry->{author} = $author;
        $self->do_git_commit($log_entry, "$rev=$tree");
}
2297
# Send the git tree-ish $tree to SVN as a new revision on top of
# $self->{last_rev}.
#
# The commit message comes from get_commit_entry($tree).  The diff
# between $self->{last_commit} and $tree is driven through an
# SVN::Git::Editor wrapped around the commit editor of $self->ra; once
# SVN accepts the commit, set_tree_cb is invoked with the new revision.
# Exits through fatal() when there is no previous revision to build on.
sub set_tree {
        my $self = shift;
        my $tree = shift;
        my $log_entry = get_commit_entry($tree);
        fatal("Must have an existing revision to commit\n")
                unless $self->{last_rev};
        my $pool = SVN::Pool->new;
        my %editor_opts = (
                r => $self->{last_rev},
                ra => $self->ra->dup,
                c => $tree,
                svn_path => $self->ra->{svn_path},
        );
        my $on_commit = sub {
                $self->set_tree_cb($log_entry, $tree, @_);
        };
        # list context on purpose: everything get_commit_editor returns
        # is forwarded to the editor constructor
        my @commit_editor = $self->ra->get_commit_editor($log_entry->{log},
                                                         $on_commit);
        my $ed = SVN::Git::Editor->new(\%editor_opts, @commit_editor, $pool);
        my $mods = $ed->apply_diff($self->{last_commit}, $tree);
        print "No changes\nr$self->{last_rev} = $tree\n" if @$mods == 0;
        $pool->clear;
}
2322
# SVN error handler installed while fetching.  Errors that only mean
# "this path did not exist at that revision" are swallowed; anything
# else is reported through croak.
sub skip_unknown_revs {
        my ($err) = @_;
        my $errno = $err->apr_err();
        # Maybe the branch we're tracking didn't
        # exist when the repo started, so it's
        # not an error if it doesn't, just continue
        #
        # Wonderfully consistent library, eh?
        # 160013 - svn:// and file://
        # 175002 - http(s)://
        # 175007 - http(s):// (this repo required authorization, too...)
        #   More codes may be discovered later...
        foreach my $ignorable (175007, 175002, 160013) {
                return if $errno == $ignorable;
        }
        croak "Error from SVN, ($errno): ", $err->expanded_message,"\n";
}
2340
2341# rev_db:
2342# Tie::File seems to be prone to offset errors if revisions get sparse,
2343# it's not that fast, either.  Tie::File is also not in Perl 5.6.  So
2344# one of my favorite modules is out :<  Next up would be one of the DBM
2345# modules, but I'm not sure which is most portable...  So I'll just
2346# go with something that's plain-text, but still capable of
2347# being randomly accessed.  So here's my ultra-simple fixed-width
2348# database.  All records are 40 characters + "\n", so it's easy to seek
2349# to a revision: (41 * rev) is the byte offset.
2350# A record of 40 0s denotes an empty revision.
2351# And yes, it's still pretty fast (faster than Tie::File).
2352
# Store $commit (a 40-character SHA1) as the record for revision $rev in
# the fixed-width database at $self->{db_path}.  The file must already
# exist; missing records between the current end of file and $rev are
# filled with all-zero placeholders.  Croaks on any I/O failure and when
# $commit is not 40 characters long.
sub rev_db_set {
        my ($self, $rev, $commit) = @_;
        croak "arg3 must be a full SHA1 hexsum\n"
                unless length($commit) == 40;
        open my $db, '+<', $self->{db_path} or croak $!;
        my $record_pos = 41 * $rev;
        # assume that append is the common case:
        seek $db, 0, 2 or croak $!;
        my $end = tell $db;
        if ($end < $record_pos) {
                my $missing = ($record_pos - $end) / 41;
                print $db (('0' x 40), "\n") x $missing or croak $!;
        }
        seek $db, $record_pos, 0 or croak $!;
        print $db $commit, "\n" or croak $!;
        close $db or croak $!;
}
2369
# Look up the commit recorded for revision $rev in the fixed-width
# database at $self->{db_path}.  Returns the 40-character record, or
# undef when the record is missing or is the all-zero placeholder.
# Croaks when the file cannot be opened or closed.
sub rev_db_get {
        my ($self, $rev) = @_;
        open my $db, '<', $self->{db_path} or croak $!;
        my $commit;
        if (seek $db, $rev * 41, 0) {
                $commit = readline $db;
                if (defined $commit) {
                        chomp $commit;
                        undef $commit if $commit =~ /^0{40}$/;
                }
        }
        close $db or croak $!;
        $commit;
}
2385
# Construct an object for the ref id $id (falling back to
# $Git::SVN::default).  All paths live below "$ENV{GIT_DIR}/svn/$id":
# dir is that directory, index and db_path are files inside it.
sub _new {
        my ($class, $id) = @_;
        $id = $Git::SVN::default unless $id;
        my $dir = "$ENV{GIT_DIR}/svn/$id";
        my %self = (id => $id, dir => $dir);
        $self{index} = "$dir/index";
        $self{db_path} = "$dir/.rev_db";
        return bless \%self, $class;
}
2393
2394
2395package Git::SVN::Prompt;
2396use strict;
2397use warnings;
2398require SVN::Core;
2399use vars qw/$_no_auth_cache $_username/;
2400
# Username/password prompt.  A username configured in $_username
# overrides the default offered by the caller; when neither gives a
# non-empty name the user is asked through username().  The password is
# always read interactively.  Saving the credentials is disabled when
# $_no_auth_cache is set.
sub simple {
        my ($cred, $realm, $default_username, $may_save, $pool) = @_;
        $may_save = undef if $_no_auth_cache;
        $default_username = $_username if defined $_username;
        if (!defined $default_username || !length($default_username)) {
                username($cred, $realm, $may_save, $pool);
        } else {
                if (defined $realm && length $realm) {
                        print STDERR "Authentication realm: $realm\n";
                        STDERR->flush;
                }
                $cred->username($default_username);
        }
        my $prompt = "Password for '" . $cred->username . "': ";
        $cred->password(_read_password($prompt, $realm));
        $cred->may_save($may_save);
        $SVN::_Core::SVN_NO_ERROR;
}
2419
# Prompt shown when the server certificate fails validation.  Prints one
# line per failure bit set in $failures, then the certificate details,
# and asks whether to reject it or accept it temporarily (or
# permanently, when saving is allowed).  Returns -1 on rejection, which
# is also what end-of-input on STDIN selects; otherwise records the
# accepted failures on $cred and returns $SVN::_Core::SVN_NO_ERROR.
sub ssl_server_trust {
        my ($cred, $realm, $failures, $cert_info, $may_save, $pool) = @_;
        $may_save = undef if $_no_auth_cache;
        print STDERR "Error validating server certificate for '$realm':\n";
        my @explanations = (
                [ $SVN::Auth::SSL::UNKNOWNCA,
                  " - The certificate is not issued by a trusted " .
                  "authority. Use the\n" .
                  "   fingerprint to validate the certificate manually!\n" ],
                [ $SVN::Auth::SSL::CNMISMATCH,
                  " - The certificate hostname does not match.\n" ],
                [ $SVN::Auth::SSL::NOTYETVALID,
                  " - The certificate is not yet valid.\n" ],
                [ $SVN::Auth::SSL::EXPIRED,
                  " - The certificate has expired.\n" ],
                [ $SVN::Auth::SSL::OTHER,
                  " - The certificate has an unknown error.\n" ],
        );
        foreach my $pair (@explanations) {
                my ($bit, $text) = @$pair;
                print STDERR $text if ($failures & $bit);
        }
        my @fields = map { $cert_info->$_ } qw(hostname valid_from valid_until
                                               issuer_dname fingerprint);
        printf STDERR
                "Certificate information:\n".
                " - Hostname: %s\n".
                " - Valid: from %s until %s\n".
                " - Issuer: %s\n".
                " - Fingerprint: %s\n",
                @fields;
        # keep asking until one of the offered letters is typed
        while (1) {
                print STDERR $may_save ?
                      "(R)eject, accept (t)emporarily or accept (p)ermanently? " :
                      "(R)eject or accept (t)emporarily? ";
                STDERR->flush;
                my $choice = lc(substr(<STDIN> || 'R', 0, 1));
                if ($choice =~ /^t$/i) {
                        $cred->may_save(undef);
                        last;
                }
                return -1 if $choice =~ /^r$/i;
                if ($may_save && $choice =~ /^p$/i) {
                        $cred->may_save($may_save);
                        last;
                }
        }
        $cred->accepted_failures($failures);
        $SVN::_Core::SVN_NO_ERROR;
}
2468
# Ask on STDERR for the client certificate file, read the answer from
# STDIN and store it on $cred.  Saving is disabled when $_no_auth_cache
# is set.
sub ssl_client_cert {
        my ($cred, $realm, $may_save, $pool) = @_;
        $may_save = undef if $_no_auth_cache;
        print STDERR "Client certificate filename: ";
        STDERR->flush;
        my $cert_path = <STDIN>;
        chomp($cert_path);
        $cred->cert_file($cert_path);
        $cred->may_save($may_save);
        $SVN::_Core::SVN_NO_ERROR;
}
2479
# Read the passphrase for the client certificate without echo and store
# it on $cred.  Saving is disabled when $_no_auth_cache is set.
sub ssl_client_cert_pw {
        my ($cred, $realm, $may_save, $pool) = @_;
        $may_save = undef if $_no_auth_cache;
        my $passphrase = _read_password("Password: ", $realm);
        $cred->password($passphrase);
        $cred->may_save($may_save);
        $SVN::_Core::SVN_NO_ERROR;
}
2487
# Username prompt.  Uses $_username when it is set, otherwise asks on
# STDERR and reads the name from STDIN.  Saving is disabled when
# $_no_auth_cache is set.
sub username {
        my ($cred, $realm, $may_save, $pool) = @_;
        $may_save = undef if $_no_auth_cache;
        print STDERR "Authentication realm: $realm\n"
                if (defined $realm && length $realm);
        my $username = $_username;
        unless (defined $username) {
                print STDERR "Username: ";
                STDERR->flush;
                chomp($username = <STDIN>);
        }
        $cred->username($username);
        $cred->may_save($may_save);
        $SVN::_Core::SVN_NO_ERROR;
}
2506
# Print $prompt on STDERR and read a password key by key with terminal
# echo switched off (Term::ReadKey is loaded on demand).  Reading stops
# at the first carriage return or line feed, or when no more keys are
# available.  Returns the collected characters; $realm is accepted but
# not used.
sub _read_password {
        my ($prompt, $realm) = @_;
        print STDERR $prompt;
        STDERR->flush;
        require Term::ReadKey;
        Term::ReadKey::ReadMode('noecho');
        my @typed;
        for (;;) {
                my $key = Term::ReadKey::ReadKey(0);
                last unless defined $key;
                last if $key =~ /[\012\015]/; # \n\r
                push @typed, $key;
        }
        Term::ReadKey::ReadMode('restore');
        print STDERR "\n";
        STDERR->flush;
        join '', @typed;
}
2523
2524package main;
2525
# Percent-encode every character of the argument that is not a letter,
# a digit or one of * ! : _ . / -  (upper-case hex digits).  Returns the
# encoded copy.
sub uri_encode {
        my ($f) = @_;
        $f =~ s{([^a-zA-Z0-9\*!\:_\./\-])}{sprintf('%%%02X', ord($1))}eg;
        return $f;
}
2531
# Decode a percent-encoded string: '+' becomes a space first, then each
# %XX escape written with upper-case hex digits becomes the character
# with that code.  Escapes using lower-case hex digits are left as they
# are.  Returns the decoded copy.
sub uri_decode {
        my ($f) = @_;
        $f =~ s#\+# #g;
        $f =~ s#%([A-F0-9]{2})#chr(hex($1))#ge;
        return $f;
}
2538
# Append everything git cannot represent for SVN revision $rev to
# "$GIT_SVN_DIR/unhandled.log" and build the log entry for the commit.
#
# Arguments:
#   $rev, $author, $msg - revision number, author and log message
#   $date      - SVN timestamp shaped like 2006-12-31T23:59:59.000000Z
#   $parents   - optional array ref of parent commits (defaults to [])
#   $untracked - optional hash ref (callers in this file pass an
#                SVN::Git::Fetcher) with the keys empty, dir_prop,
#                file_prop, absent_file and absent_dir
#
# Returns a hash ref with the keys revision, date, author, msg, parents
# and revprops.  Dies when the date cannot be parsed, or when an authors
# file is in use ($_authors) and $author has no entry in %users.
# Croaks when the log file cannot be written.
sub libsvn_log_entry {
        my ($rev, $author, $date, $msg, $parents, $untracked) = @_;
        my ($Y,$m,$d,$H,$M,$S) = ($date =~ /^(\d{4})\-(\d\d)\-(\d\d)T
                                         (\d\d)\:(\d\d)\:(\d\d).\d+Z$/x)
                                or die "Unable to parse date: $date\n";
        if (defined $author && length $author > 0 &&
            defined $_authors && ! defined $users{$author}) {
                die "Author: $author not defined in $_authors file\n";
        }
        $msg = '' if ($rev == 0 && !defined $msg);
        # some callers have no editor to hand over
        $untracked ||= {};

        open my $un, '>>', "$GIT_SVN_DIR/unhandled.log" or croak $!;
        print $un "r$rev\n" or croak $!;

        # directories that became empty (1) or stopped being empty (0)
        my $h = $untracked->{empty} || {};
        foreach my $dir (sort keys %$h) {
                my $act = $h->{$dir} ? '+empty_dir' : '-empty_dir';
                print $un "  $act: ", uri_encode($dir), "\n" or croak $!;
                warn "W: $act: $dir\n";
        }

        # properties set (+) or removed (-) that are not in %SKIP
        foreach my $t (qw/dir_prop file_prop/) {
                $h = $untracked->{$t} or next;
                foreach my $path (sort keys %$h) {
                        my $ppath = $path eq '' ? '.' : $path;
                        foreach my $prop (sort keys %{$h->{$path}}) {
                                next if $SKIP{$prop};
                                my $v = $h->{$path}->{$prop};
                                if (defined $v) {
                                        print $un "  +$t: ",
                                                  uri_encode($ppath), ' ',
                                                  uri_encode($prop), ' ',
                                                  uri_encode($v), "\n"
                                                  or croak $!;
                                } else {
                                        print $un "  -$t: ",
                                                  uri_encode($ppath), ' ',
                                                  uri_encode($prop), "\n"
                                                  or croak $!;
                                }
                        }
                }
        }

        # SVN::Git::Fetcher files absent directories under 'absent_dir',
        # while the label written to the log is 'absent_directory'; look
        # under both names so those entries are not silently dropped
        my %fetcher_key = (absent_file => 'absent_file',
                           absent_directory => 'absent_dir');
        foreach my $t (qw/absent_file absent_directory/) {
                $h = $untracked->{$t} || $untracked->{$fetcher_key{$t}}
                        or next;
                foreach my $parent (sort keys %$h) {
                        foreach my $path (sort @{$h->{$parent}}) {
                                print $un "  $t: ",
                                      uri_encode("$parent/$path"), "\n"
                                      or croak $!;
                                warn "W: $t: $parent/$path ",
                                     "Insufficient permissions?\n";
                        }
                }
        }

        # revprops (make this optional? it's an extra network trip...)
        my $rp = $SVN->rev_proplist($rev);
        foreach my $name (sort keys %$rp) {
                next if $name =~ /^svn:(?:author|date|log)$/;
                print $un "  rev_prop: ", uri_encode($name), ' ',
                          uri_encode($rp->{$name}), "\n"
                          or croak $!;
        }
        close $un or croak $!;

        { revision => $rev, date => "+0000 $Y-$m-$d $H:$M:$S",
          author => $author, msg => $msg."\n", parents => $parents || [],
          revprops => $rp }
}
2607
# Bring the tree of $last_commit up to SVN revision $rev and return the
# log entry for the new revision.  The starting revision is taken from
# the metadata of $last_commit; the editor that received the update is
# passed on so untracked changes get logged.  Dies when the update
# reports failure.
sub libsvn_fetch {
        my ($last_commit, $paths, $rev, $author, $date, $msg) = @_;
        my $ed = SVN::Git::Fetcher->new({ c => $last_commit, q => $_q });
        my $last_rev = (cmt_metadata($last_commit))[1];
        $SVN->gs_do_update($last_rev, $rev, '', 1, $ed)
                or die "SVN connection failed somewhere...\n";
        libsvn_log_entry($rev, $author, $date, $msg, [$last_commit], $ed);
}
2617
# Work out the last imported SVN revision and its commit.
#
# Returns ($rev, $commit).  The revision normally comes from the
# metadata of the commit at refs/remotes/$GIT_SVN.  With --no-metadata
# the fixed-width $REVDB file is scanned from its last record backwards
# for that commit, and the revision is derived from the file position.
# Returns (undef, undef) when nothing can be determined.
sub svn_grab_base_rev {
        my $c = eval { command_oneline([qw/rev-parse --verify/,
                                        "refs/remotes/$GIT_SVN^0"],
                                        { STDERR => 0 }) };
        if (defined $c && length $c) {
                my (undef, $rev) = cmt_metadata($c);
                return ($rev, $c) if defined $rev;
        }
        return (undef, undef) unless $_no_metadata;

        open my $fh, '<', $REVDB or
                die "--no-metadata specified and $REVDB not readable\n";
        my $offset = -41; # from tail
        my $rl;
        while (1) {
                seek $fh, $offset, 2;
                $rl = readline $fh;
                defined $rl or return (undef, undef);
                chomp $rl;
                last unless ($c ne $rl && tell($fh) != 0);
                $offset -= 41;
        }
        # the handle now sits just past the matching record
        my $rev = tell $fh;
        croak $! if ($rev < -1);
        $rev = ($rev - 41) / 41;
        close $fh or croak $!;
        return ($rev, $c);
}
2650
# Turn the --revision argument ($_revision) into a (first, last) pair of
# revision numbers.
#
# $base is the last imported revision, or undef when nothing has been
# imported yet; "BASE" then stands for revision 0, otherwise $base + 1.
# Accepted forms: unset or BASE:HEAD, N:M, N, BASE:N and N:HEAD.
# Dies on anything else.
sub libsvn_parse_revision {
        my $base = shift;
        my $head = $SVN->get_latest_revnum();
        my $start = defined $base ? $base + 1 : 0;
        if (!defined $_revision || $_revision eq 'BASE:HEAD') {
                return ($start, $head);
        }
        return ($1, $2) if ($_revision =~ /^(\d+):(\d+)$/);
        return ($_revision, $_revision) if ($_revision =~ /^\d+$/);
        # honour the requested upper bound even without a base revision
        # (it used to be replaced by HEAD in that case)
        return ($start, $1) if ($_revision =~ /^BASE:(\d+)$/);
        return ($1, $head) if ($_revision =~ /^(\d+):HEAD$/);
        die "revision argument: $_revision not understood by git-svn\n",
                "Try using the command-line svn client instead\n";
}
2668
# Write the svn:ignore settings of $path at revision $r, and of every
# directory below it, to $fh.  Each directory gets a "# path" heading
# (relative to $SVN->{svn_path}) followed by its ignore patterns, each
# prefixed with that directory.
sub libsvn_traverse_ignore {
        my ($fh, $path, $r) = @_;
        $path =~ s#^/+##g;
        my ($dirent, undef, $props) = $SVN->get_dir($path, $r);
        (my $p = $path) =~ s#^\Q$SVN->{svn_path}\E/##;
        my $heading = length($p) ? "\n# $p\n" : "\n# /\n";
        print $fh $heading;
        if (my $s = $props->{'svn:ignore'}) {
                $s =~ s/[\r\n]+/\n/g;
                chomp $s;
                # patterns are anchored at the directory they belong to
                my $prefix = length($p) == 0 ? "/$p" : "/$p/";
                $s =~ s#\n#\n$prefix#g;
                print $fh "$prefix$s\n";
        }
        foreach my $name (sort keys %$dirent) {
                next if $dirent->{$name}->kind != $SVN::Node::dir;
                libsvn_traverse_ignore($fh, "$path/$name", $r);
        }
}
2692
# Return 1 when $path is unchanged between revisions $r0 and $r1, that
# is when the SVN log for that range holds at most one entry; return 0
# otherwise.  Identical revisions are equal without asking SVN.
sub revisions_eq {
        my ($path, $r0, $r1) = @_;
        return 1 if $r0 == $r1;
        my $seen = 0;
        # should be OK to use Pool here (r1 - r0) should be small
        $SVN->get_log([$path], $r0, $r1, 0, 0, 1, sub { $seen++ });
        return $seen > 1 ? 0 : 1;
}
2702
# Check whether the tracked path was created in revision $rev by copying
# another path, and if so use the imported history of that path as the
# parent.
#
# Arguments mirror a log callback: $paths maps changed paths to objects
# offering copyfrom_path/copyfrom_rev, followed by $rev, $author, $date
# and $msg.
#
# Returns the log entry for $rev with the parent commit filled in, or
# nothing/undef when no usable parent is found.  With $_follow_parent a
# source that was never imported is fetched first in a child process.
sub libsvn_find_parent_branch {
        my ($paths, $rev, $author, $date, $msg) = @_;
        my $svn_path = '/'.$SVN->{svn_path};

        # look for a parent from another branch:
        my $i = $paths->{$svn_path} or return;
        my $branch_from = $i->copyfrom_path or return;
        my $r = $i->copyfrom_rev;
        print STDERR  "Found possible branch point: ",
                                "$branch_from => $svn_path, $r\n";
        $branch_from =~ s#^/##;
        my $l_map = {};
        read_url_paths_all($l_map, '', "$GIT_DIR/svn");
        my $url = $SVN->{repos_root};
        defined $l_map->{$url} or return;
        my $id = $l_map->{$url}->{$branch_from};
        if (!defined $id && $_follow_parent) {
                print STDERR "Following parent: $branch_from\@$r\n";
                # auto create a new branch and follow it
                $id = basename($branch_from);
                $id .= '@'.$r if -r "$GIT_DIR/svn/$id";
                while (-r "$GIT_DIR/svn/$id") {
                        # just grow a tail if we're not unique enough :x
                        $id .= '-';
                }
        }
        return unless defined $id;

        my ($r0, $parent) = find_rev_before($r,$id,1);
        if ($_follow_parent && (!defined $r0 || !defined $parent)) {
                # import the source branch in a child process so the
                # globals it rewrites do not leak into this one
                defined(my $pid = fork) or croak $!;
                if (!$pid) {
                        $GIT_SVN = $ENV{GIT_SVN_ID} = $id;
                        init_vars();
                        $SVN_URL = "$url/$branch_from";
                        $SVN = undef;
                        setup_git_svn();
                        # we can't assume SVN_URL exists at r+1:
                        $_revision = "0:$r";
                        fetch_lib();
                        exit 0;
                }
                waitpid $pid, 0;
                croak $? if $?;
                ($r0, $parent) = find_rev_before($r,$id,1);
        }
        return unless (defined $r0 && defined $parent);
        if (revisions_eq($branch_from, $r0, $r)) {
                unlink $GIT_SVN_INDEX;
                print STDERR "Found branch parent: ($GIT_SVN) $parent\n";
                command_noisy('read-tree', $parent);
                unless ($SVN->can_do_switch) {
                        return _libsvn_new_tree($paths, $rev, $author, $date,
                                                $msg, [$parent]);
                }
                # do_switch works with svn/trunk >= r22312, but that is not
                # included with SVN 1.4.2 (the latest version at the moment),
                # so we can't rely on it.
                my $ra = Git::SVN::Ra->new("$url/$branch_from");
                my $ed = SVN::Git::Fetcher->new({c => $parent, q => $_q });
                $ra->gs_do_switch($r0, $rev, '', 1, $SVN->{url}, $ed) or
                                   die "SVN connection failed somewhere...\n";
                # hand over the editor so untracked changes seen during
                # the switch are logged, as the other fetch paths do
                return libsvn_log_entry($rev, $author, $date, $msg,
                                        [$parent], $ed);
        }
        print STDERR "Nope, branch point not imported or unknown\n";
        return undef;
}
2770
# Build the log entry for a revision that has no imported predecessor.
# A parent found on another branch wins; otherwise the whole tree is
# fetched without any parent.
sub libsvn_new_tree {
        my $log_entry = libsvn_find_parent_branch(@_);
        return $log_entry if $log_entry;
        my ($paths, $rev, $author, $date, $msg) = @_; # $pool is last
        _libsvn_new_tree($paths, $rev, $author, $date, $msg, []);
}
2778
# Fetch the complete tree of revision $rev through a fresh fetcher and
# return its log entry with the given $parents.  Dies when the update
# reports failure.
sub _libsvn_new_tree {
        my ($paths, $rev, $author, $date, $msg, $parents) = @_;
        my $ed = SVN::Git::Fetcher->new({q => $_q});
        $SVN->gs_do_update($rev, $rev, '', 1, $ed)
                or die "SVN connection failed somewhere...\n";
        libsvn_log_entry($rev, $author, $date, $msg, $parents, $ed);
}
2787
# Find the commit imported for exactly revision $r1 among the tracked
# paths in %$tree_paths that are a prefix of $p1.  Returns that commit,
# or undef when none of the matching paths has $r1 imported.
sub find_graft_path_commit {
        my ($tree_paths, $p1, $r1) = @_;
        foreach my $prefix (keys %$tree_paths) {
                next unless index($p1, $prefix) == 0;
                my $id = $tree_paths->{$prefix};
                my ($r0, $parent) = find_rev_before($r1, $id, 1);
                if (defined $r0 && $r0 == $r1) {
                        return $parent;
                }
                print STDERR "r$r1 of $id not imported\n";
        }
        return undef;
}
2800
# Record graft parents for commit $c: for every tracked path that is a
# prefix of the copy source $p0 and is unchanged between its last
# imported revision and $r0, mark that revision's commit as a parent of
# $c in %$grafts.  A parent carrying the same URL and UUID metadata as
# $c is skipped.
sub find_graft_path_parents {
        my ($grafts, $tree_paths, $c, $p0, $r0) = @_;
        foreach my $prefix (keys %$tree_paths) {
                next unless index($p0, $prefix) == 0;
                my $id = $tree_paths->{$prefix};
                my ($r, $parent) = find_rev_before($r0, $id, 1);
                next unless (defined $r && defined $parent);
                next unless revisions_eq($prefix, $r, $r0);
                my ($url_b, undef, $uuid_b) = cmt_metadata($c);
                my ($url_a, undef, $uuid_a) = cmt_metadata($parent);
                next if ($url_a && $url_b && $url_a eq $url_b &&
                                                $uuid_b eq $uuid_a);
                $grafts->{$c}->{$parent} = 1;
        }
}
2816
# Go through the changed paths of revision $rev and, for every entry
# that was copied from elsewhere, add graft parents linking the commit
# of the copy target to the commit of the copy source.  Entries without
# copy information are ignored.
sub libsvn_graft_file_copies {
        my ($grafts, $tree_paths, $path, $paths, $rev) = @_;
        foreach my $changed (keys %$paths) {
                my $i = $paths->{$changed};
                my (undef, $p0, $r0) = ($i->action, $i->copyfrom_path,
                                        $i->copyfrom_rev);
                next unless (defined $p0 && defined $r0);

                (my $p1 = $changed) =~ s#^/##;
                $p0 =~ s#^/##;
                my $c = find_graft_path_commit($tree_paths, $p1, $rev)
                        or next;
                find_graft_path_parents($grafts, $tree_paths, $c, $p0, $r0);
        }
}
2833
# Point GIT_INDEX_FILE at the given index file and return the previous
# value (undef when it was not set) so it can be handed to
# restore_index later.
sub set_index {
        my ($new_index) = @_;
        my $old = $ENV{GIT_INDEX_FILE};
        $ENV{GIT_INDEX_FILE} = $new_index;
        return $old;
}
2839
# Undo set_index: put GIT_INDEX_FILE back to $old, or remove it from the
# environment when $old is undef.
sub restore_index {
        my ($old) = @_;
        if (!defined $old) {
                delete $ENV{GIT_INDEX_FILE};
        } else {
                $ENV{GIT_INDEX_FILE} = $old;
        }
}
2848
# Called after SVN accepted a commit of tree-ish $c as revision $rev.
#
# With $_optimize_commits, and when $rev directly follows $r_last, the
# git commit is created locally on top of $cmt_last and compared with
# $c; any difference is printed and the program exits with status 1.
# In every other case the new revision is fetched back from SVN.
sub libsvn_commit_cb {
        my ($rev, $date, $committer, $c, $msg, $r_last, $cmt_last) = @_;
        my $can_optimize = $_optimize_commits && $rev == ($r_last + 1);
        return fetch("$rev=$c") unless $can_optimize;

        my $log = libsvn_log_entry($rev,$committer,$date,$msg);
        $log->{tree} = get_tree_from_treeish($c);
        my $cmt = git_commit($log, $cmt_last, $c);
        my @diff = command('diff-tree', $cmt, $c);
        if (@diff) {
                print STDERR "Trees differ: $cmt $c\n",
                                join('',@diff),"\n";
                exit 1;
        }
}
2865
# List the directories directly below $fullurl at $_revision (or at the
# latest revision when none was requested).  Names are sorted and carry
# a trailing slash.
sub libsvn_ls_fullurl {
        my ($fullurl) = @_;
        my $ra = Git::SVN::Ra->new($fullurl);
        my $r = defined $_revision ? $_revision : $ra->get_latest_revnum;
        my ($dirent) = $ra->get_dir('', $r);
        my @ret;
        foreach my $name (sort keys %$dirent) {
                next unless $dirent->{$name}->kind == $SVN::Node::dir;
                push @ret, "$name/"; # add '/' for compat with cli svn
        }
        return @ret;
}
2879
# SVN error handler that tolerates "path does not exist in that
# revision" errors and croaks on everything else.
sub libsvn_skip_unknown_revs {
        my ($err) = @_;
        my $errno = $err->apr_err();
        # Maybe the branch we're tracking didn't
        # exist when the repo started, so it's
        # not an error if it doesn't, just continue
        #
        # Wonderfully consistent library, eh?
        # 160013 - svn:// and file://
        # 175002 - http(s)://
        # 175007 - http(s):// (this repo required authorization, too...)
        #   More codes may be discovered later...
        foreach my $ignorable (175007, 175002, 160013) {
                return if $errno == $ignorable;
        }
        croak "Error from SVN, ($errno): ", $err->expanded_message,"\n";
}
2897
2898# Tie::File seems to be prone to offset errors if revisions get sparse,
2899# it's not that fast, either.  Tie::File is also not in Perl 5.6.  So
2900# one of my favorite modules is out :<  Next up would be one of the DBM
2901# modules, but I'm not sure which is most portable...  So I'll just
2902# go with something that's plain-text, but still capable of
2903# being randomly accessed.  So here's my ultra-simple fixed-width
2904# database.  All records are 40 characters + "\n", so it's easy to seek
2905# to a revision: (41 * rev) is the byte offset.
2906# A record of 40 0s denotes an empty revision.
2907# And yes, it's still pretty fast (faster than Tie::File).
# Store $commit (a 40-character SHA1) as the record for revision $rev in
# the fixed-width database $file.  The file must already exist; records
# missing between the current end of file and $rev are filled with
# all-zero placeholders.  Croaks when $commit is not 40 characters long
# and on any I/O failure, including failed writes.
sub revdb_set {
        my ($file, $rev, $commit) = @_;
        length $commit == 40 or croak "arg3 must be a full SHA1 hexsum\n";
        open my $fh, '+<', $file or croak $!;
        my $offset = $rev * 41;
        # assume that append is the common case:
        seek $fh, 0, 2 or croak $!;
        my $pos = tell $fh;
        if ($pos < $offset) {
                # a failed write must not go unnoticed, or later
                # lookups would read a truncated database
                print $fh (('0' x 40),"\n") x (($offset - $pos) / 41)
                  or croak $!;
        }
        seek $fh, $offset, 0 or croak $!;
        print $fh $commit,"\n" or croak $!;
        close $fh or croak $!;
}
2923
# Look up the commit recorded for revision $rev in the fixed-width
# database $file.  Returns the 40-character record, or undef when the
# position cannot be reached, the record is missing, or it is the
# all-zero placeholder.  Croaks when the file cannot be opened or
# closed.
sub revdb_get {
        my ($file, $rev) = @_;
        my $offset = $rev * 41;
        open my $fh, '<', $file or croak $!;
        seek $fh, $offset, 0;
        # only read when the handle really is at the record
        my $ret = tell($fh) == $offset ? readline($fh) : undef;
        if (defined $ret) {
                chomp $ret;
                undef $ret if $ret =~ /^0{40}$/;
        }
        close $fh or croak $!;
        return $ret;
}
2940
# Copy refs/remotes/$GIT_SVN from another repository ($_cp_remote,
# default "origin") when that repository has it.  When it does not,
# dies if a remote was requested explicitly and this is not an upgrade
# run; otherwise does nothing.
sub copy_remote_ref {
        my $origin = $_cp_remote || 'origin';
        my $ref = "refs/remotes/$GIT_SVN";
        if (command('ls-remote', $origin, $ref)) {
                return command_noisy('fetch', $origin, "$ref:$ref");
        }
        if ($_cp_remote && !$_upgrade) {
                die "Unable to find remote reference: ",
                                "refs/remotes/$GIT_SVN on $origin\n";
        }
}
2951
{
        # Mention these package variables so perl does not warn that
        # they are "used only once"; the SVN::Node names are listed
        # twice on purpose.  The values themselves are never used.
        my @kill_stupid_warnings = (
                $SVN::Node::none, $SVN::Node::file,
                $SVN::Node::dir, $SVN::Node::unknown,
                $SVN::Node::none, $SVN::Node::file,
                $SVN::Node::dir, $SVN::Node::unknown,
                $SVN::Auth::SSL::CNMISMATCH,
                $SVN::Auth::SSL::NOTYETVALID,
                $SVN::Auth::SSL::EXPIRED,
                $SVN::Auth::SSL::UNKNOWNCA,
                $SVN::Auth::SSL::OTHER,
        );
}
2963
2964package SVN::Git::Fetcher;
2965use vars qw/@ISA/;
2966use strict;
2967use warnings;
2968use Carp qw/croak/;
2969use IO::File qw//;
2970
2971# file baton members: path, mode_a, mode_b, pool, fh, blob, base
# Create a fetcher editor.  $git_svn is a hash ref with the optional
# base commit (c) and the quiet flag (q).  The object collects untracked
# changes in empty, dir_prop, file_prop, absent_dir and absent_file, and
# keeps a pipe to "update-index -z --index-info" in gui/ctx.
sub new {
        my ($class, $git_svn) = @_;
        my $self = bless(SVN::Delta::Editor->new, $class);
        $self->{c} = $git_svn->{c} if exists $git_svn->{c};
        $self->{q} = $git_svn->{q};
        foreach my $bucket (qw/empty dir_prop file_prop
                               absent_dir absent_file/) {
                $self->{$bucket} = {};
        }
        @$self{qw/gui ctx/} = command_input_pipe(
                                     qw/update-index -z --index-info/);
        require Digest::MD5;
        return $self;
}
2988
# Editor callback: the directory baton of the root has an empty path.
sub open_root {
        my %baton = (path => '');
        return \%baton;
}
2992
# Editor callback: the directory baton only remembers the path.
sub open_directory {
        my ($self, $path, $pb, $rev) = @_;
        my %baton = (path => $path);
        return \%baton;
}
2997
# Editor callback: remove $path from the index being built.
#
# When $path is a tree in the base commit $self->{c}, every file below
# it is removed and the directory is noted in $self->{empty} with the
# value 0; otherwise the single entry is removed.  Removals are written
# to the update-index pipe in $self->{gui}, and a "D" progress line is
# printed for each unless $self->{q} is set.  Always returns undef.
sub delete_entry {
        my ($self, $path, $rev, $pb) = @_;
        my $gui = $self->{gui};

        # remove entire directories.
        if (command('ls-tree', $self->{c}, '--', $path) =~ /^040000 tree/) {
                my ($ls, $ctx) = command_output_pipe(qw/ls-tree
                                                     -r --name-only -z/,
                                                     $self->{c}, '--', $path);
                local $/ = "\0";
                # a lexical keeps the caller's $_ intact
                while (defined(my $entry = <$ls>)) {
                        # update-index -z needs the NUL terminator kept
                        print $gui '0 ',0 x 40,"\t",$entry or croak $!;
                        next if $self->{q};
                        # ...but it must not end up in the progress line
                        chomp(my $name = $entry);
                        print "\tD\t$name\n";
                }
                print "\tD\t$path/\n" unless $self->{q};
                command_close_pipe($ls, $ctx);
                $self->{empty}->{$path} = 0
        } else {
                print $gui '0 ',0 x 40,"\t",$path,"\0" or croak $!;
                print "\tD\t$path\n" unless $self->{q};
        }
        undef;
}
3021
# Editor callback: start modifying an existing file.  The current mode
# and blob of $path are looked up in the base commit $self->{c}; dies
# when the path is not a blob there.  Returns the file baton with both
# modes set to the current mode and action 'M'.
sub open_file {
        my ($self, $path, $pb, $rev) = @_;
        my $entry = command('ls-tree', $self->{c}, '--',$path);
        my ($mode, $blob) = ($entry =~ /^(\d{6}) blob ([a-f\d]{40})\t/);
        die "$path was not found in commit $self->{c} (r$rev)\n"
                unless (defined $mode && defined $blob);
        my %fb = (path => $path, mode_a => $mode, mode_b => $mode,
                  blob => $blob, pool => SVN::Pool->new, action => 'M');
        return \%fb;
}
3032
# Editor callback: start a new file.  The containing directory is no
# longer empty, so it is dropped from $self->{empty}.  Returns the file
# baton with mode 100644 on both sides and action 'A'.
sub add_file {
        my ($self, $path, $pb, $cp_path, $cp_rev) = @_;
        my ($dir) = ($path =~ m#^(.*?)/?([^/]+)$#);
        delete $self->{empty}->{$dir};
        my %fb = (path => $path, mode_a => 100644, mode_b => 100644,
                  pool => SVN::Pool->new, action => 'A');
        return \%fb;
}
3040
# Editor callback: a new directory starts out empty, and its parent
# stops being empty.  Returns the directory baton.
sub add_directory {
        my ($self, $path, $cp_path, $cp_rev) = @_;
        my ($parent_dir) = ($path =~ m#^(.*?)/?([^/]+)$#);
        my $empty = $self->{empty};
        delete $empty->{$parent_dir};
        $empty->{$path} = 1;
        my %baton = (path => $path);
        return \%baton;
}
3048
# Editor callback: remember a directory property change under
# $self->{dir_prop}{<directory path>}{<property>}.  Returns undef.
sub change_dir_prop {
        my ($self, $db, $prop, $value) = @_;
        my $props = ($self->{dir_prop}->{$db->{path}} ||= {});
        $props->{$prop} = $value;
        return undef;
}
3055
# Editor callback: note a directory reported as absent, grouped by the
# path of its parent baton in $self->{absent_dir}.  Returns undef.
sub absent_directory {
        my ($self, $path, $pb) = @_;
        my $parent = $pb->{path};
        push @{ $self->{absent_dir}->{$parent} ||= [] }, $path;
        return undef;
}
3062
# Editor callback: note a file reported as absent.
# The path is appended to the list kept in $self->{absent_file} under
# the parent baton's path.  Always returns undef.
sub absent_file {
        my ($self, $path, $pb) = @_;
        my $parent = $pb->{path};
        my $list = ($self->{absent_file}->{$parent} ||= []);
        push @$list, $path;
        return undef;
}
3069
# Editor callback: apply a property change to the file baton $fb.
#   svn:special    - mode_b becomes 120000 when set, 100644 when removed
#   svn:executable - mode_b becomes 100755 when set, 100644 when removed,
#                    unless the file currently has mode 120000
#   anything else  - stored in $self->{file_prop}->{<path>}->{<name>}
# A property counts as "set" when $value is defined.
# Always returns undef.
sub change_file_prop {
        my ($self, $fb, $prop, $value) = @_;
        my $is_set = defined $value;
        if ($prop eq 'svn:executable') {
                # mode 120000 always wins over the executable bit
                return undef unless $fb->{mode_b} != 120000;
                $fb->{mode_b} = $is_set ? 100755 : 100644;
                return undef;
        }
        if ($prop eq 'svn:special') {
                $fb->{mode_b} = $is_set ? 120000 : 100644;
                return undef;
        }
        my $props = ($self->{file_prop}->{$fb->{path}} ||= {});
        $props->{$prop} = $value;
        return undef;
}
3084
# Editor callback: set up the streams a text delta is applied to.
# A temporary file receives the result; a second temporary file holds
# the delta base.  When the baton names an existing blob, a child
# process writes it into the base file with git-cat-file (preceded by
# 'link ' when mode_a is 120000), and, if $exp is defined, the base's
# MD5 is checked against it.
# Stores the readable duplicate of the result handle in $fb->{fh} and
# the base handle in $fb->{base}.
# Returns an array ref wrapping whatever SVN::TxDelta::apply() returns.
sub apply_textdelta {
        my ($self, $fb, $exp) = @_;
        my $result = IO::File->new_tmpfile;
        $result->autoflush(1);
        # $result gets auto-closed() by SVN::TxDelta::apply(),
        # (but $base does not,) so dup() it for reading in close_file
        open my $reader, '<&', $result or croak $!;
        my $base = IO::File->new_tmpfile;
        $base->autoflush(1);
        if ($fb->{blob}) {
                my $pid = fork;
                croak $! unless defined $pid;
                if ($pid == 0) {
                        # child: dump the existing blob into the base file
                        open STDOUT, '>&', $base or croak $!;
                        if ($fb->{mode_a} == 120000) {
                                print STDOUT 'link ';
                        }
                        exec qw/git-cat-file blob/, $fb->{blob} or croak $!;
                }
                waitpid $pid, 0;
                croak $? if $?;

                if (defined $exp) {
                        seek $base, 0, 0 or croak $!;
                        my $got = Digest::MD5->new->addfile($base)->hexdigest;
                        if ($got ne $exp) {
                                die "Checksum mismatch: $fb->{path} $fb->{blob}\n",
                                    "expected: $exp\n",
                                    "     got: $got\n";
                        }
                }
        }
        seek $base, 0, 0 or croak $!;
        $fb->{fh} = $reader;
        $fb->{base} = $base;
        return [ SVN::TxDelta::apply($base, $result, undef,
                                     $fb->{path}, $fb->{pool}) ];
}
3119
# Editor callback: finish a file and hand its index entry to the pipe
# in $self->{gui}.
# When a text delta was applied ($fb->{fh} is set) the resulting content
# is checked against the expected MD5 $exp (only when one is supplied),
# stripped of its leading 'link ' marker for mode 120000, and written to
# the object store through git-hash-object.  Otherwise the blob id
# already recorded in the baton is reused.
# Prints "<action>\t<path>" unless $self->{q} is set.
# Dies on a checksum mismatch, on a malformed link, when
# git-hash-object does not return a sha1, or when no blob is known.
# Always returns undef.
sub close_file {
        my ($self, $fb, $exp) = @_;
        my $hash;
        my $path = $fb->{path};
        if (my $fh = $fb->{fh}) {
                # The expected checksum is optional: comparing against
                # an undefined value would always report a mismatch.
                if (defined $exp) {
                        seek($fh, 0, 0) or croak $!;
                        my $md5 = Digest::MD5->new;
                        $md5->addfile($fh);
                        my $got = $md5->hexdigest;
                        die "Checksum mismatch: $path\n",
                            "expected: $exp\n    got: $got\n"
                                if ($got ne $exp);
                }
                seek($fh, 0, 0) or croak $!;
                if ($fb->{mode_b} == 120000) {
                        # skip the 'link ' marker so only the target
                        # is hashed
                        read($fh, my $buf, 5) == 5 or croak $!;
                        $buf eq 'link ' or die "$path has mode 120000",
                                               " but is not a link\n";
                }
                defined(my $pid = open my $out,'-|') or die "Can't fork: $!\n";
                if (!$pid) {
                        # child: feed the rest of the file to git-hash-object
                        open STDIN, '<&', $fh or croak $!;
                        exec qw/git-hash-object -w --stdin/ or croak $!;
                }
                chomp($hash = do { local $/; <$out> });
                close $out or croak $!;
                close $fh or croak $!;
                $hash =~ /^[a-f\d]{40}$/ or die "not a sha1: $hash\n";
                close $fb->{base} or croak $!;
        } else {
                # no content change: keep the blob we started from
                $hash = $fb->{blob} or die "no blob information\n";
        }
        $fb->{pool}->clear;
        my $gui = $self->{gui};
        print $gui "$fb->{mode_b} $hash\t$path\0" or croak $!;
        print "\t$fb->{action}\t$path\n" if $fb->{action} && ! $self->{q};
        undef;
}
3156
# Editor callback: the edit was aborted.
# Closes the pipe in $self->{gui} on a best-effort basis (errors from
# closing it are deliberately discarded) and then delegates to the
# parent class with the remaining arguments.
sub abort_edit {
        my ($self, @args) = @_;
        eval {
                command_close_pipe($self->{gui}, $self->{ctx});
        };
        return $self->SUPER::abort_edit(@args);
}
3162
# Editor callback: the edit completed.
# Closes the pipe in $self->{gui} (an error here propagates), sets
# $self->{git_commit_ok} and then delegates to the parent class with
# the remaining arguments.
sub close_edit {
        my ($self, @args) = @_;
        command_close_pipe($self->{gui}, $self->{ctx});
        $self->{git_commit_ok} = 1;
        return $self->SUPER::close_edit(@args);
}
3169
3170package SVN::Git::Editor;
3171use vars qw/@ISA/;
3172use strict;
3173use warnings;
3174use Carp qw/croak/;
3175use IO::File;
3176
# Constructor.
#   $git_svn - hashref that must define svn_path, c, r and ra; these
#              are copied into the new object (dies if one is missing)
#   @_       - remaining arguments, passed to SVN::Delta::Editor->new
# Also creates the object's SVN::Pool, opens the root at revision
# $self->{r} and stores its baton under the '' key of $self->{bat},
# starts with an empty $self->{rm}, and loads Digest::MD5.
sub new {
        my ($class, $git_svn, @editor_args) = @_;
        my $self = bless SVN::Delta::Editor->new(@editor_args), $class;
        for my $key (qw/svn_path c r ra /) {
                defined $git_svn->{$key} or die "$key required!\n";
                $self->{$key} = $git_svn->{$key};
        }
        my $pool = SVN::Pool->new;
        $self->{pool} = $pool;
        $self->{bat} = { '' => $self->open_root($self->{r}, $pool) };
        $self->{rm} = { };
        require Digest::MD5;
        return $self;
}
3192
# Split a path into (directory, last component).
# The directory is '' for a path without slashes.  In list context an
# empty list is returned when the path is empty or ends in a slash.
sub split_path {
        my ($path) = @_;
        return ($path =~ m#^(.*?)/?([^/]+)$#);
}
3196
# Normalise a path argument: returns the path unchanged when it is
# defined and non-empty, and '' otherwise.  The invocant is ignored.
sub repo_path {
        my (undef, $path) = @_;
        return '' unless defined $path && length $path;
        return $path;
}
3200
# Build the full URL of $path: the url of $self->{ra}, a slash, and
# the path as normalised by repo_path().
sub url_path {
        my ($self, $path) = @_;
        my $base_url = $self->{ra}->{url};
        return $base_url . '/' . $self->repo_path($path);
}
3205
# Delete the directories that this commit leaves without any files.
# Candidates are the directories recorded in $self->{rm} (filled by
# delete_entry) plus all of their ancestors, except the tracked root
# ('') and $self->{svn_path}.  Every directory that still contains a
# file in the tree of commit $self->{c} is then struck from the list.
# Whatever remains is removed through the parent class's delete_entry,
# deepest directories first, after closing its baton.
#   $q - when true, suppress the "D+" progress lines
sub rmdirs {
        my ($self, $q) = @_;
        my $rm = $self->{rm};
        delete $rm->{''}; # we never delete the url we're tracking
        return unless %$rm;

        # every ancestor of a candidate is a candidate as well
        # (keys() is expanded up front, so adding entries here is safe)
        foreach (keys %$rm) {
                my @d = split m#/#, $_;
                my $c = shift @d;
                $rm->{$c} = 1;
                while (@d) {
                        $c .= '/' . shift @d;
                        $rm->{$c} = 1;
                }
        }
        delete $rm->{$self->{svn_path}};
        delete $rm->{''}; # we never delete the url we're tracking
        return unless %$rm;

        my ($fh, $ctx) = command_output_pipe(
                                   qw/ls-tree --name-only -r -z/, $self->{c});
        local $/ = "\0";
        while (my $entry = <$fh>) {
                chomp $entry;
                my @dn = split m#/#, $entry;
                # Loop on the array, not on the popped value: a path
                # component named "0" is false and used to end the walk
                # early, leaving its ancestors marked for deletion.
                while (@dn) {
                        pop @dn;
                        delete $rm->{join '/', @dn};
                }
                unless (%$rm) {
                        # nothing left to delete; stop reading early
                        close $fh;
                        return;
                }
        }
        command_close_pipe($fh, $ctx);

        my ($r, $p, $bat) = ($self->{r}, $self->{pool}, $self->{bat});
        # sort by number of slashes, deepest first
        foreach my $d (sort { $b =~ tr#/#/# <=> $a =~ tr#/#/# } keys %$rm) {
                $self->close_directory($bat->{$d}, $p);
                my ($dn) = ($d =~ m#^(.*?)/?(?:[^/]+)$#);
                print "\tD+\t$d/\n" unless $q;
                $self->SUPER::delete_entry($d, $r, $bat->{$dn}, $p);
                delete $bat->{$d};
        }
}
3250
# Return a directory baton for $full_path below the parent $baton.
# The path's kind is looked up at revision $self->{r}: a missing path
# is added as a new directory, an existing directory is opened.
# Anything else is reported on STDERR and the program exits with
# status 1.
sub open_or_add_dir {
        my ($self, $full_path, $baton) = @_;
        my $kind = $self->{ra}->check_path($full_path, $self->{r});
        my $pool = $self->{pool};
        if ($kind == $SVN::Node::none) {
                return $self->add_directory($full_path, $baton,
                                            undef, -1, $pool);
        }
        if ($kind == $SVN::Node::dir) {
                return $self->open_directory($full_path, $baton,
                                             $self->{r}, $pool);
        }
        my $what = $kind == $SVN::Node::file ? 'file' : 'unknown';
        print STDERR "$full_path already exists in repository at ",
                "r$self->{r} and it is not a directory (",
                $what,"/$kind)\n";
        exit 1;
}
3266
# Make sure a baton exists for directory $path and for each of its
# ancestors, opening or adding them from the top down as needed.
# Batons are cached in $self->{bat}, keyed by path ('' is the root).
# Returns the baton of $path itself (the root baton for an empty path).
sub ensure_path {
        my ($self, $path) = @_;
        my $bat = $self->{bat};
        $path = $self->repo_path($path);
        return $bat->{''} unless (length $path);
        my ($cur, @rest) = split m#/+#, $path;
        $bat->{$cur} ||= $self->open_or_add_dir($cur, $bat->{''});
        foreach my $part (@rest) {
                my $parent = $cur;
                $cur = $parent . '/' . $part;
                $bat->{$cur} ||= $self->open_or_add_dir($cur, $bat->{$parent});
        }
        return $bat->{$cur};
}
3282
# Handle an 'A' (added) diff entry $m: add $m->{file_b} without copy
# history, send its content and close the file.
#   $q - when true, suppress the progress line
sub A {
        my ($self, $m, $q) = @_;
        my $added = $m->{file_b};
        my ($dir) = split_path($added);
        my $pbat = $self->ensure_path($dir);
        my $fbat = $self->add_file($self->repo_path($added), $pbat,
                                   undef, -1);
        $q or print "\tA\t$added\n";
        $self->chg_file($fbat, $m);
        return $self->close_file($fbat, undef, $self->{pool});
}
3293
# Handle a 'C' (copied) diff entry $m: add $m->{file_b} as a copy of
# $m->{file_a} at revision $self->{r}, send its content and close it.
#   $q - when true, suppress the progress line
sub C {
        my ($self, $m, $q) = @_;
        my ($from, $to) = ($m->{file_a}, $m->{file_b});
        my ($dir) = split_path($to);
        my $pbat = $self->ensure_path($dir);
        my $fbat = $self->add_file($self->repo_path($to), $pbat,
                                   $self->url_path($from), $self->{r});
        $q or print "\tC\t$from => $to\n";
        $self->chg_file($fbat, $m);
        return $self->close_file($fbat, undef, $self->{pool});
}
3304
# Delete $path (below the parent baton $pbat) at revision $self->{r}.
# The containing directory is recorded in $self->{rm} so that rmdirs()
# can later check whether it became empty.
sub delete_entry {
        my ($self, $path, $pbat) = @_;
        my $rpath = $self->repo_path($path);
        my ($parent) = split_path($rpath);
        $self->{rm}->{$parent} = 1;
        return $self->SUPER::delete_entry($rpath, $self->{r},
                                          $pbat, $self->{pool});
}
3312
# Handle an 'R' (renamed) diff entry $m: add $m->{file_b} as a copy of
# $m->{file_a} at revision $self->{r}, send its content, close it, and
# then delete the old path $m->{file_a}.
#   $q - when true, suppress the progress line
sub R {
        my ($self, $m, $q) = @_;
        my ($from, $to) = ($m->{file_a}, $m->{file_b});

        # first the copy to the new name ...
        my ($new_dir) = split_path($to);
        my $new_pbat = $self->ensure_path($new_dir);
        my $fbat = $self->add_file($self->repo_path($to), $new_pbat,
                                   $self->url_path($from), $self->{r});
        $q or print "\tR\t$from => $to\n";
        $self->chg_file($fbat, $m);
        $self->close_file($fbat, undef, $self->{pool});

        # ... then the removal of the old one
        my ($old_dir) = split_path($from);
        my $old_pbat = $self->ensure_path($old_dir);
        return $self->delete_entry($from, $old_pbat);
}
3327
# Handle a modification diff entry $m: open the existing file
# $m->{file_b} at revision $self->{r}, send its new content and close
# it.  The progress line shows the change letter from $m->{chg}.
#   $q - when true, suppress the progress line
sub M {
        my ($self, $m, $q) = @_;
        my $changed = $m->{file_b};
        my ($dir) = split_path($changed);
        my $pbat = $self->ensure_path($dir);
        my $fbat = $self->open_file($self->repo_path($changed),
                                    $pbat, $self->{r}, $self->{pool});
        $q or print "\t$m->{chg}\t$changed\n";
        $self->chg_file($fbat, $m);
        return $self->close_file($fbat, undef, $self->{pool});
}
3338
# A 'T' diff entry is handled exactly like a modification ('M').
sub T {
        my ($self, @args) = @_;
        return $self->M(@args);
}
3340
# Set (or, with an undefined value, remove) property $pname on the
# file baton $fbat, always using the object's own pool.
sub change_file_prop {
        my ($self, $fbat, $pname, $pval) = @_;
        my $pool = $self->{pool};
        return $self->SUPER::change_file_prop($fbat, $pname, $pval, $pool);
}
3345
# Send the new state of one file to the file baton $fbat.
#   $m - diff entry; mode_a/mode_b are the old and new modes and
#        sha1_b names the blob holding the new content
# Property changes: svn:executable is set or removed when the 755 bit
# appears or disappears; svn:special is set for mode 120xxx and removed
# when a 120xxx file becomes something else.
# Content: the blob is dumped into a temporary file by git-cat-file
# (after a 'link ' marker for mode 120xxx), its MD5 is computed, and
# the file is streamed through apply_textdelta.  Dies if the checksum
# returned by the stream differs from the one computed locally.
sub chg_file {
        my ($self, $fbat, $m) = @_;
        if ($m->{mode_b} =~ /755$/ && $m->{mode_a} !~ /755$/) {
                $self->change_file_prop($fbat,'svn:executable','*');
        } elsif ($m->{mode_b} !~ /755$/ && $m->{mode_a} =~ /755$/) {
                $self->change_file_prop($fbat,'svn:executable',undef);
        }
        my $fh = IO::File->new_tmpfile or croak $!;
        if ($m->{mode_b} =~ /^120/) {
                print $fh 'link ' or croak $!;
                $self->change_file_prop($fbat,'svn:special','*');
        } elsif ($m->{mode_a} =~ /^120/ && $m->{mode_b} !~ /^120/) {
                $self->change_file_prop($fbat,'svn:special',undef);
        }
        defined(my $pid = fork) or croak $!;
        if (!$pid) {
                # child: append the blob content to the temporary file
                open STDOUT, '>&', $fh or croak $!;
                exec qw/git-cat-file blob/, $m->{sha1_b} or croak $!;
        }
        waitpid $pid, 0;
        croak $? if $?;
        # flush() returns "0 but true" on success and undef on failure,
        # so test for definedness; comparing the result with 0 is true
        # in both cases and could never report an error.
        defined $fh->flush or croak $!;
        seek $fh, 0, 0 or croak $!;

        my $md5 = Digest::MD5->new;
        $md5->addfile($fh) or croak $!;
        seek $fh, 0, 0 or croak $!;

        my $exp = $md5->hexdigest;
        my $pool = SVN::Pool->new;
        my $atd = $self->apply_textdelta($fbat, undef, $pool);
        my $got = SVN::TxDelta::send_stream($fh, @$atd, $pool);
        die "Checksum mismatch\nexpected: $exp\ngot: $got\n" if ($got ne $exp);
        $pool->clear;

        close $fh or croak $!;
}
3383
# Handle a 'D' (deleted) diff entry $m: delete $m->{file_b}.
#   $q - when true, suppress the progress line
sub D {
        my ($self, $m, $q) = @_;
        my $gone = $m->{file_b};
        my ($dir) = split_path($gone);
        my $pbat = $self->ensure_path($dir);
        $q or print "\tD\t$gone\n";
        return $self->delete_entry($gone, $pbat);
}
3391
# Finish the edit: close every directory baton still held in
# $self->{bat}, deepest paths first and the root ('') last, then close
# the edit itself and clear the object's pool.
sub close_edit {
        my ($self) = @_;
        my ($p,$bat) = ($self->{pool}, $self->{bat});
        foreach (sort { $b =~ tr#/#/# <=> $a =~ tr#/#/# } keys %$bat) {
                # The root has as few slashes as any top-level directory,
                # so the sort alone cannot guarantee that it comes last.
                next if $_ eq '';
                $self->close_directory($bat->{$_}, $p);
        }
        # a parent must only be closed after all of its children
        $self->close_directory($bat->{''}, $p) if exists $bat->{''};
        $self->SUPER::close_edit($p);
        $p->clear;
}
3401
# Abort the edit through the parent class, then clear the object's
# pool.
sub abort_edit {
        my ($self) = @_;
        my $pool = $self->{pool};
        $self->SUPER::abort_edit($pool);
        return $pool->clear;
}
3407
3408package Git::SVN::Ra;
3409use vars qw/@ISA $config_dir/;
3410use strict;
3411use warnings;
3412my ($can_do_switch);
3413
# Generate thin wrappers around a handful of inherited methods.  Each
# wrapper appends a temporary SVN::Pool to the caller's arguments,
# calls the parent implementation, clears the pool again, and returns
# the whole result list in list context or its first element otherwise.
BEGIN {
        # enforce temporary pool usage for some simple functions
        my $e = '';
        foreach (qw/get_latest_revnum rev_proplist get_file
                    check_path get_dir get_uuid get_repos_root/) {
                $e .= "sub $_ {
                        my \$self = shift;
                        my \$pool = SVN::Pool->new;
                        my \@ret = \$self->SUPER::$_(\@_,\$pool);
                        \$pool->clear;
                        wantarray ? \@ret : \$ret[0]; }\n";
        }
        # The generated code only declares subs, so end it with a true
        # value and fail loudly instead of silently leaving the
        # wrappers undefined when it does not compile.
        eval($e . "1;\n") or die "cannot generate pool wrappers: $@";
}
3428
# Constructor: open an RA session for $url.
# Ensures the SVN configuration in $config_dir exists, assembles the
# authentication providers (stored credentials first, then the
# interactive Git::SVN::Prompt callbacks), and creates the underlying
# SVN::Ra object with its own pool.
# Besides what SVN::Ra stores, the object records:
#   repos_root - the repository root as reported by the session
#   svn_path   - $url with the repository root and any slashes that
#                follow it stripped from the front
# The object is blessed into $class only at the very end, so the
# get_repos_root call is dispatched on the plain SVN::Ra object.
sub new {
        my ($class, $url) = @_;
        SVN::_Core::svn_config_ensure($config_dir, undef);
        my @providers = (
            SVN::Client::get_simple_provider(),
            SVN::Client::get_ssl_server_trust_file_provider(),
            SVN::Client::get_simple_prompt_provider(
              \&Git::SVN::Prompt::simple, 2),
            SVN::Client::get_ssl_client_cert_prompt_provider(
              \&Git::SVN::Prompt::ssl_client_cert, 2),
            SVN::Client::get_ssl_client_cert_pw_prompt_provider(
              \&Git::SVN::Prompt::ssl_client_cert_pw, 2),
            SVN::Client::get_username_provider(),
            SVN::Client::get_ssl_server_trust_prompt_provider(
              \&Git::SVN::Prompt::ssl_server_trust),
            SVN::Client::get_username_prompt_provider(
              \&Git::SVN::Prompt::username, 2),
        );
        my ($baton, $callbacks) = SVN::Core::auth_open_helper(\@providers);
        my $config = SVN::Core::config_get_config($config_dir);
        my $self = SVN::Ra->new(
                url                     => $url,
                auth                    => $baton,
                config                  => $config,
                pool                    => SVN::Pool->new,
                auth_provider_callbacks => $callbacks,
        );
        $self->{svn_path} = $url;
        my $root = $self->get_repos_root;
        $self->{repos_root} = $root;
        $self->{svn_path} =~ s#^\Q$root\E/*##;
        return bless $self, $class;
}
3457
# Destructor: clear the session's pool, if it has one, before the
# parent class's destructor runs.
sub DESTROY {
        my ($self, @rest) = @_;
        if ($self->{pool}) {
                $self->{pool}->clear;
        }
        return $self->SUPER::DESTROY(@rest);
}
3463
# Create a second session of the same class.  It gets a pool of its
# own and reuses this object's config, url, auth, callbacks,
# repos_root and svn_path.
sub dup {
        my ($self) = @_;
        my @args = (pool => SVN::Pool->new);
        foreach my $key (qw/config url
                     auth auth_provider_callbacks repos_root svn_path/) {
                push @args, $key, $self->{$key};
        }
        my $dup = SVN::Ra->new(@args);
        return bless $dup, ref $self;
}
3471
# Wrapper around the parent class's get_log that runs it with a
# temporary pool.
# Adjustments made to the caller's arguments:
#   - the fifth argument is decremented when it is true and
#     $::_follow_parent is not set
#   - the fourth argument is dropped for SVN::Core up to and including
#     1.2.0 (presumably the limit parameter those bindings lack;
#     verify against the SVN::Ra documentation)
# Returns whatever the parent's get_log returns.
sub get_log {
        my ($self, @args) = @_;
        my $pool = SVN::Pool->new;
        $args[4]-- if $args[4] && ! $::_follow_parent;
        # Compare version components numerically: as plain strings,
        # '1.10.0' sorts before '1.2.0'.  Fall back to the string
        # comparison only when the version cannot be parsed.
        my ($maj, $min, $patch) =
                ($SVN::Core::VERSION =~ /^(\d+)\.(\d+)(?:\.(\d+))?/);
        my $old_api = defined $min
                ? ($maj < 1 ||
                   ($maj == 1 && ($min < 2 || ($min == 2 && !$patch))))
                : ($SVN::Core::VERSION le '1.2.0');
        splice(@args, 3, 1) if $old_api;
        my $ret = $self->SUPER::get_log(@args, $pool);
        $pool->clear;
        $ret;
}
3481
# Wrapper around the parent class's get_commit_editor.  For SVN::Core
# 1.2.0 and later two extra arguments (undef, 0) are inserted before
# the pool (presumably the lock tokens and keep-locks flag; verify
# against the SVN::Ra documentation).
sub get_commit_editor {
        my ($self, $msg, $cb, $pool) = @_;
        # Compare version components numerically: as plain strings,
        # '1.10.0' sorts before '1.2.0'.  Fall back to the string
        # comparison only when the version cannot be parsed.
        my ($maj, $min) = ($SVN::Core::VERSION =~ /^(\d+)\.(\d+)/);
        my $new_api = defined $min
                ? ($maj > 1 || ($maj == 1 && $min >= 2))
                : ($SVN::Core::VERSION ge '1.2.0');
        my @lock = $new_api ? (undef, 0) : ();
        $self->SUPER::get_commit_editor($msg, $cb, @lock, $pool);
}
3487
# Return the repository UUID, asking the session for it on first use
# and caching the answer in $self->{uuid}.
sub uuid {
        my ($self) = @_;
        unless ($self->{uuid}) {
                $self->{uuid} = $self->get_uuid;
        }
        return $self->{uuid};
}
3492
# Drive $editor with an update of $path to revision $rev_b, reporting
# $rev_a as the revision we currently have.  The third set_path
# argument is true when $rev_a equals $rev_b.  For SVN::Core 1.2.0 and
# later an extra undef argument is passed to set_path (presumably the
# lock token; verify against the SVN::Ra documentation).
# Returns $editor->{git_commit_ok}.
sub gs_do_update {
        my ($self, $rev_a, $rev_b, $path, $recurse, $editor) = @_;
        my $pool = SVN::Pool->new;
        my $reporter = $self->do_update($rev_b, $path, $recurse,
                                        $editor, $pool);
        # Compare version components numerically: as plain strings,
        # '1.10.0' sorts before '1.2.0'.  Fall back to the string
        # comparison only when the version cannot be parsed.
        my ($maj, $min) = ($SVN::Core::VERSION =~ /^(\d+)\.(\d+)/);
        my $new_api = defined $min
                ? ($maj > 1 || ($maj == 1 && $min >= 2))
                : ($SVN::Core::VERSION ge '1.2.0');
        my @lock = $new_api ? (undef) : ();
        my $new = ($rev_a == $rev_b);
        $reporter->set_path($path, $rev_a, $new, @lock, $pool);
        $reporter->finish_report($pool);
        $pool->clear;
        $editor->{git_commit_ok};
}
3505
# Drive $editor with a switch of $path to $url_b at revision $rev_b,
# reporting $rev_a as the revision we currently have.  For SVN::Core
# 1.2.0 and later an extra undef argument is passed to set_path
# (presumably the lock token; verify against the SVN::Ra
# documentation).
# Returns $editor->{git_commit_ok}.
sub gs_do_switch {
        my ($self, $rev_a, $rev_b, $path, $recurse, $url_b, $editor) = @_;
        my $pool = SVN::Pool->new;
        my $reporter = $self->do_switch($rev_b, $path, $recurse,
                                        $url_b, $editor, $pool);
        # Compare version components numerically: as plain strings,
        # '1.10.0' sorts before '1.2.0'.  Fall back to the string
        # comparison only when the version cannot be parsed.
        my ($maj, $min) = ($SVN::Core::VERSION =~ /^(\d+)\.(\d+)/);
        my $new_api = defined $min
                ? ($maj > 1 || ($maj == 1 && $min >= 2))
                : ($SVN::Core::VERSION ge '1.2.0');
        my @lock = $new_api ? (undef) : ();
        $reporter->set_path($path, $rev_a, 0, @lock, $pool);
        $reporter->finish_report($pool);
        $pool->clear;
        $editor->{git_commit_ok};
}
3517
# Report whether do_switch is usable (1) or not (0).
# The answer is found by attempting a throw-away do_switch against
# the session's own url; if that raises an error the feature counts
# as unavailable, otherwise the report is aborted straight away.
# The result is cached in the file-level $can_do_switch, so the probe
# runs at most once.
sub can_do_switch {
        my $self = shift;
        return $can_do_switch if defined $can_do_switch;

        my $pool = SVN::Pool->new;
        my $rep = eval {
                $self->do_switch(1, '', 0, $self->{url},
                                 SVN::Delta::Editor->new, $pool);
        };
        my $worked = !$@;
        $rep->abort_report($pool) if $worked;
        $can_do_switch = $worked ? 1 : 0;
        $pool->clear;
        return $can_do_switch;
}
3536
3537__END__
3538
3539Data structures:
3540
3541$log_msg hashref as returned by libsvn_log_entry()
3542{
3543        msg => 'whitespace-formatted log entry
3544',                                              # trailing newline is preserved
3545        revision => '8',                        # integer
3546        date => '2004-02-24T17:01:44.108345Z',  # commit date
3547        author => 'committer name'
3548};
3549
3550@mods = array of diff-index line hashes, each element represents one line
3551        of diff-index output
3552
3553diff-index line ($m hash)
3554{
3555        mode_a => first column of diff-index output, no leading ':',
3556        mode_b => second column of diff-index output,
3557        sha1_b => sha1sum of the final blob,
3558        chg => change type [MCRADT],
3559        file_a => original file name of a file (iff chg is 'C' or 'R')
3560        file_b => new/current file name of a file (any chg)
3561}
3562;
3563
3564# retval of read_url_paths{,_all}();
3565$l_map = {
3566        # repository root url
3567        'https://svn.musicpd.org' => {
3568                # repository path               # GIT_SVN_ID
3569                'mpd/trunk'             =>      'trunk',
3570                'mpd/tags/0.11.5'       =>      'tags/0.11.5',
3571        },
3572}
3573
3574Notes:
        I don't trust the each() function on a hash unless I created that
        %hash myself, because its internal iterator may not start at the
        beginning.