perl / Git.pmon commit builtin-cat-file.c: use parse_options() (15d8e56)
   1=head1 NAME
   2
   3Git - Perl interface to the Git version control system
   4
   5=cut
   6
   7
   8package Git;
   9
  10use strict;
  11
  12
  13BEGIN {
  14
  15our ($VERSION, @ISA, @EXPORT, @EXPORT_OK);
  16
  17# Totally unstable API.
  18$VERSION = '0.01';
  19
  20
  21=head1 SYNOPSIS
  22
  23  use Git;
  24
  25  my $version = Git::command_oneline('version');
  26
  27  git_cmd_try { Git::command_noisy('update-server-info') }
  28              '%s failed w/ code %d';
  29
  30  my $repo = Git->repository (Directory => '/srv/git/cogito.git');
  31
  32
  33  my @revs = $repo->command('rev-list', '--since=last monday', '--all');
  34
  35  my ($fh, $c) = $repo->command_output_pipe('rev-list', '--since=last monday', '--all');
  36  my $lastrev = <$fh>; chomp $lastrev;
  37  $repo->command_close_pipe($fh, $c);
  38
  39  my $lastrev = $repo->command_oneline( [ 'rev-list', '--all' ],
  40                                        STDERR => 0 );
  41
  42  my $sha1 = $repo->hash_and_insert_object('file.txt');
  43  my $tempfile = tempfile();
  44  my $size = $repo->cat_blob($sha1, $tempfile);
  45
  46=cut
  47
  48
  49require Exporter;
  50
  51@ISA = qw(Exporter);
  52
  53@EXPORT = qw(git_cmd_try);
  54
  55# Methods which can be called as standalone functions as well:
  56@EXPORT_OK = qw(command command_oneline command_noisy
  57                command_output_pipe command_input_pipe command_close_pipe
  58                command_bidi_pipe command_close_bidi_pipe
  59                version exec_path hash_object git_cmd_try);
  60
  61
  62=head1 DESCRIPTION
  63
  64This module provides Perl scripts easy way to interface the Git version control
  65system. The modules have an easy and well-tested way to call arbitrary Git
  66commands; in the future, the interface will also provide specialized methods
  67for doing easily operations which are not totally trivial to do over
  68the generic command interface.
  69
  70While some commands can be executed outside of any context (e.g. 'version'
  71or 'init'), most operations require a repository context, which in practice
  72means getting an instance of the Git object using the repository() constructor.
  73(In the future, we will also get a new_repository() constructor.) All commands
  74called as methods of the object are then executed in the context of the
  75repository.
  76
  77Part of the "repository state" is also information about path to the attached
  78working copy (unless you work with a bare repository). You can also navigate
  79inside of the working copy using the C<wc_chdir()> method. (Note that
  80the repository object is self-contained and will not change working directory
  81of your process.)
  82
  83TODO: In the future, we might also do
  84
  85        my $remoterepo = $repo->remote_repository (Name => 'cogito', Branch => 'master');
  86        $remoterepo ||= Git->remote_repository ('http://git.or.cz/cogito.git/');
  87        my @refs = $remoterepo->refs();
  88
  89Currently, the module merely wraps calls to external Git tools. In the future,
  90it will provide a much faster way to interact with Git by linking directly
  91to libgit. This should be completely opaque to the user, though (performance
  92increate nonwithstanding).
  93
  94=cut
  95
  96
  97use Carp qw(carp croak); # but croak is bad - throw instead
  98use Error qw(:try);
  99use Cwd qw(abs_path);
 100use IPC::Open2 qw(open2);
 101
 102}
 103
 104
 105=head1 CONSTRUCTORS
 106
 107=over 4
 108
 109=item repository ( OPTIONS )
 110
 111=item repository ( DIRECTORY )
 112
 113=item repository ()
 114
 115Construct a new repository object.
 116C<OPTIONS> are passed in a hash like fashion, using key and value pairs.
 117Possible options are:
 118
 119B<Repository> - Path to the Git repository.
 120
 121B<WorkingCopy> - Path to the associated working copy; not strictly required
 122as many commands will happily crunch on a bare repository.
 123
 124B<WorkingSubdir> - Subdirectory in the working copy to work inside.
 125Just left undefined if you do not want to limit the scope of operations.
 126
 127B<Directory> - Path to the Git working directory in its usual setup.
 128The C<.git> directory is searched in the directory and all the parent
 129directories; if found, C<WorkingCopy> is set to the directory containing
 130it and C<Repository> to the C<.git> directory itself. If no C<.git>
 131directory was found, the C<Directory> is assumed to be a bare repository,
 132C<Repository> is set to point at it and C<WorkingCopy> is left undefined.
 133If the C<$GIT_DIR> environment variable is set, things behave as expected
 134as well.
 135
 136You should not use both C<Directory> and either of C<Repository> and
 137C<WorkingCopy> - the results of that are undefined.
 138
 139Alternatively, a directory path may be passed as a single scalar argument
 140to the constructor; it is equivalent to setting only the C<Directory> option
 141field.
 142
 143Calling the constructor with no options whatsoever is equivalent to
 144calling it with C<< Directory => '.' >>. In general, if you are building
 145a standard porcelain command, simply doing C<< Git->repository() >> should
 146do the right thing and setup the object to reflect exactly where the user
 147is right now.
 148
 149=cut
 150
 151sub repository {
 152        my $class = shift;
 153        my @args = @_;
 154        my %opts = ();
 155        my $self;
 156
 157        if (defined $args[0]) {
 158                if ($#args % 2 != 1) {
 159                        # Not a hash.
 160                        $#args == 0 or throw Error::Simple("bad usage");
 161                        %opts = ( Directory => $args[0] );
 162                } else {
 163                        %opts = @args;
 164                }
 165        }
 166
 167        if (not defined $opts{Repository} and not defined $opts{WorkingCopy}) {
 168                $opts{Directory} ||= '.';
 169        }
 170
 171        if ($opts{Directory}) {
 172                -d $opts{Directory} or throw Error::Simple("Directory not found: $!");
 173
 174                my $search = Git->repository(WorkingCopy => $opts{Directory});
 175                my $dir;
 176                try {
 177                        $dir = $search->command_oneline(['rev-parse', '--git-dir'],
 178                                                        STDERR => 0);
 179                } catch Git::Error::Command with {
 180                        $dir = undef;
 181                };
 182
 183                if ($dir) {
 184                        $dir =~ m#^/# or $dir = $opts{Directory} . '/' . $dir;
 185                        $opts{Repository} = $dir;
 186
 187                        # If --git-dir went ok, this shouldn't die either.
 188                        my $prefix = $search->command_oneline('rev-parse', '--show-prefix');
 189                        $dir = abs_path($opts{Directory}) . '/';
 190                        if ($prefix) {
 191                                if (substr($dir, -length($prefix)) ne $prefix) {
 192                                        throw Error::Simple("rev-parse confused me - $dir does not have trailing $prefix");
 193                                }
 194                                substr($dir, -length($prefix)) = '';
 195                        }
 196                        $opts{WorkingCopy} = $dir;
 197                        $opts{WorkingSubdir} = $prefix;
 198
 199                } else {
 200                        # A bare repository? Let's see...
 201                        $dir = $opts{Directory};
 202
 203                        unless (-d "$dir/refs" and -d "$dir/objects" and -e "$dir/HEAD") {
 204                                # Mimick git-rev-parse --git-dir error message:
 205                                throw Error::Simple('fatal: Not a git repository');
 206                        }
 207                        my $search = Git->repository(Repository => $dir);
 208                        try {
 209                                $search->command('symbolic-ref', 'HEAD');
 210                        } catch Git::Error::Command with {
 211                                # Mimick git-rev-parse --git-dir error message:
 212                                throw Error::Simple('fatal: Not a git repository');
 213                        }
 214
 215                        $opts{Repository} = abs_path($dir);
 216                }
 217
 218                delete $opts{Directory};
 219        }
 220
 221        $self = { opts => \%opts };
 222        bless $self, $class;
 223}
 224
 225=back
 226
 227=head1 METHODS
 228
 229=over 4
 230
 231=item command ( COMMAND [, ARGUMENTS... ] )
 232
 233=item command ( [ COMMAND, ARGUMENTS... ], { Opt => Val ... } )
 234
 235Execute the given Git C<COMMAND> (specify it without the 'git-'
 236prefix), optionally with the specified extra C<ARGUMENTS>.
 237
 238The second more elaborate form can be used if you want to further adjust
 239the command execution. Currently, only one option is supported:
 240
 241B<STDERR> - How to deal with the command's error output. By default (C<undef>)
 242it is delivered to the caller's C<STDERR>. A false value (0 or '') will cause
 243it to be thrown away. If you want to process it, you can get it in a filehandle
 244you specify, but you must be extremely careful; if the error output is not
 245very short and you want to read it in the same process as where you called
 246C<command()>, you are set up for a nice deadlock!
 247
 248The method can be called without any instance or on a specified Git repository
 249(in that case the command will be run in the repository context).
 250
 251In scalar context, it returns all the command output in a single string
 252(verbatim).
 253
 254In array context, it returns an array containing lines printed to the
 255command's stdout (without trailing newlines).
 256
 257In both cases, the command's stdin and stderr are the same as the caller's.
 258
 259=cut
 260
 261sub command {
 262        my ($fh, $ctx) = command_output_pipe(@_);
 263
 264        if (not defined wantarray) {
 265                # Nothing to pepper the possible exception with.
 266                _cmd_close($fh, $ctx);
 267
 268        } elsif (not wantarray) {
 269                local $/;
 270                my $text = <$fh>;
 271                try {
 272                        _cmd_close($fh, $ctx);
 273                } catch Git::Error::Command with {
 274                        # Pepper with the output:
 275                        my $E = shift;
 276                        $E->{'-outputref'} = \$text;
 277                        throw $E;
 278                };
 279                return $text;
 280
 281        } else {
 282                my @lines = <$fh>;
 283                defined and chomp for @lines;
 284                try {
 285                        _cmd_close($fh, $ctx);
 286                } catch Git::Error::Command with {
 287                        my $E = shift;
 288                        $E->{'-outputref'} = \@lines;
 289                        throw $E;
 290                };
 291                return @lines;
 292        }
 293}
 294
 295
 296=item command_oneline ( COMMAND [, ARGUMENTS... ] )
 297
 298=item command_oneline ( [ COMMAND, ARGUMENTS... ], { Opt => Val ... } )
 299
 300Execute the given C<COMMAND> in the same way as command()
 301does but always return a scalar string containing the first line
 302of the command's standard output.
 303
 304=cut
 305
 306sub command_oneline {
 307        my ($fh, $ctx) = command_output_pipe(@_);
 308
 309        my $line = <$fh>;
 310        defined $line and chomp $line;
 311        try {
 312                _cmd_close($fh, $ctx);
 313        } catch Git::Error::Command with {
 314                # Pepper with the output:
 315                my $E = shift;
 316                $E->{'-outputref'} = \$line;
 317                throw $E;
 318        };
 319        return $line;
 320}
 321
 322
 323=item command_output_pipe ( COMMAND [, ARGUMENTS... ] )
 324
 325=item command_output_pipe ( [ COMMAND, ARGUMENTS... ], { Opt => Val ... } )
 326
 327Execute the given C<COMMAND> in the same way as command()
 328does but return a pipe filehandle from which the command output can be
 329read.
 330
 331The function can return C<($pipe, $ctx)> in array context.
 332See C<command_close_pipe()> for details.
 333
 334=cut
 335
 336sub command_output_pipe {
 337        _command_common_pipe('-|', @_);
 338}
 339
 340
 341=item command_input_pipe ( COMMAND [, ARGUMENTS... ] )
 342
 343=item command_input_pipe ( [ COMMAND, ARGUMENTS... ], { Opt => Val ... } )
 344
 345Execute the given C<COMMAND> in the same way as command_output_pipe()
 346does but return an input pipe filehandle instead; the command output
 347is not captured.
 348
 349The function can return C<($pipe, $ctx)> in array context.
 350See C<command_close_pipe()> for details.
 351
 352=cut
 353
 354sub command_input_pipe {
 355        _command_common_pipe('|-', @_);
 356}
 357
 358
 359=item command_close_pipe ( PIPE [, CTX ] )
 360
 361Close the C<PIPE> as returned from C<command_*_pipe()>, checking
 362whether the command finished successfully. The optional C<CTX> argument
 363is required if you want to see the command name in the error message,
 364and it is the second value returned by C<command_*_pipe()> when
 365called in array context. The call idiom is:
 366
 367        my ($fh, $ctx) = $r->command_output_pipe('status');
 368        while (<$fh>) { ... }
 369        $r->command_close_pipe($fh, $ctx);
 370
 371Note that you should not rely on whatever actually is in C<CTX>;
 372currently it is simply the command name but in future the context might
 373have more complicated structure.
 374
 375=cut
 376
 377sub command_close_pipe {
 378        my ($self, $fh, $ctx) = _maybe_self(@_);
 379        $ctx ||= '<unknown>';
 380        _cmd_close($fh, $ctx);
 381}
 382
 383=item command_bidi_pipe ( COMMAND [, ARGUMENTS... ] )
 384
 385Execute the given C<COMMAND> in the same way as command_output_pipe()
 386does but return both an input pipe filehandle and an output pipe filehandle.
 387
 388The function will return return C<($pid, $pipe_in, $pipe_out, $ctx)>.
 389See C<command_close_bidi_pipe()> for details.
 390
 391=cut
 392
 393sub command_bidi_pipe {
 394        my ($pid, $in, $out);
 395        $pid = open2($in, $out, 'git', @_);
 396        return ($pid, $in, $out, join(' ', @_));
 397}
 398
 399=item command_close_bidi_pipe ( PID, PIPE_IN, PIPE_OUT [, CTX] )
 400
 401Close the C<PIPE_IN> and C<PIPE_OUT> as returned from C<command_bidi_pipe()>,
 402checking whether the command finished successfully. The optional C<CTX>
 403argument is required if you want to see the command name in the error message,
 404and it is the fourth value returned by C<command_bidi_pipe()>.  The call idiom
 405is:
 406
 407        my ($pid, $in, $out, $ctx) = $r->command_bidi_pipe('cat-file --batch-check');
 408        print "000000000\n" $out;
 409        while (<$in>) { ... }
 410        $r->command_close_bidi_pipe($pid, $in, $out, $ctx);
 411
 412Note that you should not rely on whatever actually is in C<CTX>;
 413currently it is simply the command name but in future the context might
 414have more complicated structure.
 415
 416=cut
 417
 418sub command_close_bidi_pipe {
 419        my ($pid, $in, $out, $ctx) = @_;
 420        foreach my $fh ($in, $out) {
 421                unless (close $fh) {
 422                        if ($!) {
 423                                carp "error closing pipe: $!";
 424                        } elsif ($? >> 8) {
 425                                throw Git::Error::Command($ctx, $? >>8);
 426                        }
 427                }
 428        }
 429
 430        waitpid $pid, 0;
 431
 432        if ($? >> 8) {
 433                throw Git::Error::Command($ctx, $? >>8);
 434        }
 435}
 436
 437
 438=item command_noisy ( COMMAND [, ARGUMENTS... ] )
 439
 440Execute the given C<COMMAND> in the same way as command() does but do not
 441capture the command output - the standard output is not redirected and goes
 442to the standard output of the caller application.
 443
 444While the method is called command_noisy(), you might want to as well use
 445it for the most silent Git commands which you know will never pollute your
 446stdout but you want to avoid the overhead of the pipe setup when calling them.
 447
 448The function returns only after the command has finished running.
 449
 450=cut
 451
 452sub command_noisy {
 453        my ($self, $cmd, @args) = _maybe_self(@_);
 454        _check_valid_cmd($cmd);
 455
 456        my $pid = fork;
 457        if (not defined $pid) {
 458                throw Error::Simple("fork failed: $!");
 459        } elsif ($pid == 0) {
 460                _cmd_exec($self, $cmd, @args);
 461        }
 462        if (waitpid($pid, 0) > 0 and $?>>8 != 0) {
 463                throw Git::Error::Command(join(' ', $cmd, @args), $? >> 8);
 464        }
 465}
 466
 467
 468=item version ()
 469
 470Return the Git version in use.
 471
 472=cut
 473
 474sub version {
 475        my $verstr = command_oneline('--version');
 476        $verstr =~ s/^git version //;
 477        $verstr;
 478}
 479
 480
 481=item exec_path ()
 482
 483Return path to the Git sub-command executables (the same as
 484C<git --exec-path>). Useful mostly only internally.
 485
 486=cut
 487
 488sub exec_path { command_oneline('--exec-path') }
 489
 490
 491=item repo_path ()
 492
 493Return path to the git repository. Must be called on a repository instance.
 494
 495=cut
 496
 497sub repo_path { $_[0]->{opts}->{Repository} }
 498
 499
 500=item wc_path ()
 501
 502Return path to the working copy. Must be called on a repository instance.
 503
 504=cut
 505
 506sub wc_path { $_[0]->{opts}->{WorkingCopy} }
 507
 508
 509=item wc_subdir ()
 510
 511Return path to the subdirectory inside of a working copy. Must be called
 512on a repository instance.
 513
 514=cut
 515
 516sub wc_subdir { $_[0]->{opts}->{WorkingSubdir} ||= '' }
 517
 518
 519=item wc_chdir ( SUBDIR )
 520
 521Change the working copy subdirectory to work within. The C<SUBDIR> is
 522relative to the working copy root directory (not the current subdirectory).
 523Must be called on a repository instance attached to a working copy
 524and the directory must exist.
 525
 526=cut
 527
 528sub wc_chdir {
 529        my ($self, $subdir) = @_;
 530        $self->wc_path()
 531                or throw Error::Simple("bare repository");
 532
 533        -d $self->wc_path().'/'.$subdir
 534                or throw Error::Simple("subdir not found: $!");
 535        # Of course we will not "hold" the subdirectory so anyone
 536        # can delete it now and we will never know. But at least we tried.
 537
 538        $self->{opts}->{WorkingSubdir} = $subdir;
 539}
 540
 541
 542=item config ( VARIABLE )
 543
 544Retrieve the configuration C<VARIABLE> in the same manner as C<config>
 545does. In scalar context requires the variable to be set only one time
 546(exception is thrown otherwise), in array context returns allows the
 547variable to be set multiple times and returns all the values.
 548
 549This currently wraps command('config') so it is not so fast.
 550
 551=cut
 552
 553sub config {
 554        my ($self, $var) = _maybe_self(@_);
 555
 556        try {
 557                my @cmd = ('config');
 558                unshift @cmd, $self if $self;
 559                if (wantarray) {
 560                        return command(@cmd, '--get-all', $var);
 561                } else {
 562                        return command_oneline(@cmd, '--get', $var);
 563                }
 564        } catch Git::Error::Command with {
 565                my $E = shift;
 566                if ($E->value() == 1) {
 567                        # Key not found.
 568                        return undef;
 569                } else {
 570                        throw $E;
 571                }
 572        };
 573}
 574
 575
 576=item config_bool ( VARIABLE )
 577
 578Retrieve the bool configuration C<VARIABLE>. The return value
 579is usable as a boolean in perl (and C<undef> if it's not defined,
 580of course).
 581
 582This currently wraps command('config') so it is not so fast.
 583
 584=cut
 585
 586sub config_bool {
 587        my ($self, $var) = _maybe_self(@_);
 588
 589        try {
 590                my @cmd = ('config', '--bool', '--get', $var);
 591                unshift @cmd, $self if $self;
 592                my $val = command_oneline(@cmd);
 593                return undef unless defined $val;
 594                return $val eq 'true';
 595        } catch Git::Error::Command with {
 596                my $E = shift;
 597                if ($E->value() == 1) {
 598                        # Key not found.
 599                        return undef;
 600                } else {
 601                        throw $E;
 602                }
 603        };
 604}
 605
 606=item config_int ( VARIABLE )
 607
 608Retrieve the integer configuration C<VARIABLE>. The return value
 609is simple decimal number.  An optional value suffix of 'k', 'm',
 610or 'g' in the config file will cause the value to be multiplied
 611by 1024, 1048576 (1024^2), or 1073741824 (1024^3) prior to output.
 612It would return C<undef> if configuration variable is not defined,
 613
 614This currently wraps command('config') so it is not so fast.
 615
 616=cut
 617
 618sub config_int {
 619        my ($self, $var) = _maybe_self(@_);
 620
 621        try {
 622                my @cmd = ('config', '--int', '--get', $var);
 623                unshift @cmd, $self if $self;
 624                return command_oneline(@cmd);
 625        } catch Git::Error::Command with {
 626                my $E = shift;
 627                if ($E->value() == 1) {
 628                        # Key not found.
 629                        return undef;
 630                } else {
 631                        throw $E;
 632                }
 633        };
 634}
 635
 636=item get_colorbool ( NAME )
 637
 638Finds if color should be used for NAMEd operation from the configuration,
 639and returns boolean (true for "use color", false for "do not use color").
 640
 641=cut
 642
 643sub get_colorbool {
 644        my ($self, $var) = @_;
 645        my $stdout_to_tty = (-t STDOUT) ? "true" : "false";
 646        my $use_color = $self->command_oneline('config', '--get-colorbool',
 647                                               $var, $stdout_to_tty);
 648        return ($use_color eq 'true');
 649}
 650
 651=item get_color ( SLOT, COLOR )
 652
 653Finds color for SLOT from the configuration, while defaulting to COLOR,
 654and returns the ANSI color escape sequence:
 655
 656        print $repo->get_color("color.interactive.prompt", "underline blue white");
 657        print "some text";
 658        print $repo->get_color("", "normal");
 659
 660=cut
 661
 662sub get_color {
 663        my ($self, $slot, $default) = @_;
 664        my $color = $self->command_oneline('config', '--get-color', $slot, $default);
 665        if (!defined $color) {
 666                $color = "";
 667        }
 668        return $color;
 669}
 670
 671=item ident ( TYPE | IDENTSTR )
 672
 673=item ident_person ( TYPE | IDENTSTR | IDENTARRAY )
 674
 675This suite of functions retrieves and parses ident information, as stored
 676in the commit and tag objects or produced by C<var GIT_type_IDENT> (thus
 677C<TYPE> can be either I<author> or I<committer>; case is insignificant).
 678
 679The C<ident> method retrieves the ident information from C<git-var>
 680and either returns it as a scalar string or as an array with the fields parsed.
 681Alternatively, it can take a prepared ident string (e.g. from the commit
 682object) and just parse it.
 683
 684C<ident_person> returns the person part of the ident - name and email;
 685it can take the same arguments as C<ident> or the array returned by C<ident>.
 686
 687The synopsis is like:
 688
 689        my ($name, $email, $time_tz) = ident('author');
 690        "$name <$email>" eq ident_person('author');
 691        "$name <$email>" eq ident_person($name);
 692        $time_tz =~ /^\d+ [+-]\d{4}$/;
 693
 694=cut
 695
 696sub ident {
 697        my ($self, $type) = _maybe_self(@_);
 698        my $identstr;
 699        if (lc $type eq lc 'committer' or lc $type eq lc 'author') {
 700                my @cmd = ('var', 'GIT_'.uc($type).'_IDENT');
 701                unshift @cmd, $self if $self;
 702                $identstr = command_oneline(@cmd);
 703        } else {
 704                $identstr = $type;
 705        }
 706        if (wantarray) {
 707                return $identstr =~ /^(.*) <(.*)> (\d+ [+-]\d{4})$/;
 708        } else {
 709                return $identstr;
 710        }
 711}
 712
 713sub ident_person {
 714        my ($self, @ident) = _maybe_self(@_);
 715        $#ident == 0 and @ident = $self ? $self->ident($ident[0]) : ident($ident[0]);
 716        return "$ident[0] <$ident[1]>";
 717}
 718
 719
 720=item hash_object ( TYPE, FILENAME )
 721
 722Compute the SHA1 object id of the given C<FILENAME> (or data waiting in
 723C<FILEHANDLE>) considering it is of the C<TYPE> object type (C<blob>,
 724C<commit>, C<tree>).
 725
 726The method can be called without any instance or on a specified Git repository,
 727it makes zero difference.
 728
 729The function returns the SHA1 hash.
 730
 731=cut
 732
 733# TODO: Support for passing FILEHANDLE instead of FILENAME
 734sub hash_object {
 735        my ($self, $type, $file) = _maybe_self(@_);
 736        command_oneline('hash-object', '-t', $type, $file);
 737}
 738
 739
 740=item hash_and_insert_object ( FILENAME )
 741
 742Compute the SHA1 object id of the given C<FILENAME> and add the object to the
 743object database.
 744
 745The function returns the SHA1 hash.
 746
 747=cut
 748
 749# TODO: Support for passing FILEHANDLE instead of FILENAME
 750sub hash_and_insert_object {
 751        my ($self, $filename) = @_;
 752
 753        carp "Bad filename \"$filename\"" if $filename =~ /[\r\n]/;
 754
 755        $self->_open_hash_and_insert_object_if_needed();
 756        my ($in, $out) = ($self->{hash_object_in}, $self->{hash_object_out});
 757
 758        unless (print $out $filename, "\n") {
 759                $self->_close_hash_and_insert_object();
 760                throw Error::Simple("out pipe went bad");
 761        }
 762
 763        chomp(my $hash = <$in>);
 764        unless (defined($hash)) {
 765                $self->_close_hash_and_insert_object();
 766                throw Error::Simple("in pipe went bad");
 767        }
 768
 769        return $hash;
 770}
 771
 772sub _open_hash_and_insert_object_if_needed {
 773        my ($self) = @_;
 774
 775        return if defined($self->{hash_object_pid});
 776
 777        ($self->{hash_object_pid}, $self->{hash_object_in},
 778         $self->{hash_object_out}, $self->{hash_object_ctx}) =
 779                command_bidi_pipe(qw(hash-object -w --stdin-paths));
 780}
 781
 782sub _close_hash_and_insert_object {
 783        my ($self) = @_;
 784
 785        return unless defined($self->{hash_object_pid});
 786
 787        my @vars = map { 'hash_object_' . $_ } qw(pid in out ctx);
 788
 789        command_close_bidi_pipe($self->{@vars});
 790        delete $self->{@vars};
 791}
 792
 793=item cat_blob ( SHA1, FILEHANDLE )
 794
 795Prints the contents of the blob identified by C<SHA1> to C<FILEHANDLE> and
 796returns the number of bytes printed.
 797
 798=cut
 799
 800sub cat_blob {
 801        my ($self, $sha1, $fh) = @_;
 802
 803        $self->_open_cat_blob_if_needed();
 804        my ($in, $out) = ($self->{cat_blob_in}, $self->{cat_blob_out});
 805
 806        unless (print $out $sha1, "\n") {
 807                $self->_close_cat_blob();
 808                throw Error::Simple("out pipe went bad");
 809        }
 810
 811        my $description = <$in>;
 812        if ($description =~ / missing$/) {
 813                carp "$sha1 doesn't exist in the repository";
 814                return 0;
 815        }
 816
 817        if ($description !~ /^[0-9a-fA-F]{40} \S+ (\d+)$/) {
 818                carp "Unexpected result returned from git cat-file";
 819                return 0;
 820        }
 821
 822        my $size = $1;
 823
 824        my $blob;
 825        my $bytesRead = 0;
 826
 827        while (1) {
 828                my $bytesLeft = $size - $bytesRead;
 829                last unless $bytesLeft;
 830
 831                my $bytesToRead = $bytesLeft < 1024 ? $bytesLeft : 1024;
 832                my $read = read($in, $blob, $bytesToRead, $bytesRead);
 833                unless (defined($read)) {
 834                        $self->_close_cat_blob();
 835                        throw Error::Simple("in pipe went bad");
 836                }
 837
 838                $bytesRead += $read;
 839        }
 840
 841        # Skip past the trailing newline.
 842        my $newline;
 843        my $read = read($in, $newline, 1);
 844        unless (defined($read)) {
 845                $self->_close_cat_blob();
 846                throw Error::Simple("in pipe went bad");
 847        }
 848        unless ($read == 1 && $newline eq "\n") {
 849                $self->_close_cat_blob();
 850                throw Error::Simple("didn't find newline after blob");
 851        }
 852
 853        unless (print $fh $blob) {
 854                $self->_close_cat_blob();
 855                throw Error::Simple("couldn't write to passed in filehandle");
 856        }
 857
 858        return $size;
 859}
 860
 861sub _open_cat_blob_if_needed {
 862        my ($self) = @_;
 863
 864        return if defined($self->{cat_blob_pid});
 865
 866        ($self->{cat_blob_pid}, $self->{cat_blob_in},
 867         $self->{cat_blob_out}, $self->{cat_blob_ctx}) =
 868                command_bidi_pipe(qw(cat-file --batch));
 869}
 870
 871sub _close_cat_blob {
 872        my ($self) = @_;
 873
 874        return unless defined($self->{cat_blob_pid});
 875
 876        my @vars = map { 'cat_blob_' . $_ } qw(pid in out ctx);
 877
 878        command_close_bidi_pipe($self->{@vars});
 879        delete $self->{@vars};
 880}
 881
 882=back
 883
 884=head1 ERROR HANDLING
 885
 886All functions are supposed to throw Perl exceptions in case of errors.
 887See the L<Error> module on how to catch those. Most exceptions are mere
 888L<Error::Simple> instances.
 889
 890However, the C<command()>, C<command_oneline()> and C<command_noisy()>
 891functions suite can throw C<Git::Error::Command> exceptions as well: those are
 892thrown when the external command returns an error code and contain the error
 893code as well as access to the captured command's output. The exception class
 894provides the usual C<stringify> and C<value> (command's exit code) methods and
 895in addition also a C<cmd_output> method that returns either an array or a
 896string with the captured command output (depending on the original function
 897call context; C<command_noisy()> returns C<undef>) and $<cmdline> which
 898returns the command and its arguments (but without proper quoting).
 899
 900Note that the C<command_*_pipe()> functions cannot throw this exception since
 901it has no idea whether the command failed or not. You will only find out
 902at the time you C<close> the pipe; if you want to have that automated,
 903use C<command_close_pipe()>, which can throw the exception.
 904
 905=cut
 906
 907{
 908        package Git::Error::Command;
 909
 910        @Git::Error::Command::ISA = qw(Error);
 911
 912        sub new {
 913                my $self = shift;
 914                my $cmdline = '' . shift;
 915                my $value = 0 + shift;
 916                my $outputref = shift;
 917                my(@args) = ();
 918
 919                local $Error::Depth = $Error::Depth + 1;
 920
 921                push(@args, '-cmdline', $cmdline);
 922                push(@args, '-value', $value);
 923                push(@args, '-outputref', $outputref);
 924
 925                $self->SUPER::new(-text => 'command returned error', @args);
 926        }
 927
 928        sub stringify {
 929                my $self = shift;
 930                my $text = $self->SUPER::stringify;
 931                $self->cmdline() . ': ' . $text . ': ' . $self->value() . "\n";
 932        }
 933
 934        sub cmdline {
 935                my $self = shift;
 936                $self->{'-cmdline'};
 937        }
 938
 939        sub cmd_output {
 940                my $self = shift;
 941                my $ref = $self->{'-outputref'};
 942                defined $ref or undef;
 943                if (ref $ref eq 'ARRAY') {
 944                        return @$ref;
 945                } else { # SCALAR
 946                        return $$ref;
 947                }
 948        }
 949}
 950
 951=over 4
 952
 953=item git_cmd_try { CODE } ERRMSG
 954
 955This magical statement will automatically catch any C<Git::Error::Command>
 956exceptions thrown by C<CODE> and make your program die with C<ERRMSG>
 957on its lips; the message will have %s substituted for the command line
 958and %d for the exit status. This statement is useful mostly for producing
 959more user-friendly error messages.
 960
 961In case of no exception caught the statement returns C<CODE>'s return value.
 962
 963Note that this is the only auto-exported function.
 964
 965=cut
 966
 967sub git_cmd_try(&$) {
 968        my ($code, $errmsg) = @_;
 969        my @result;
 970        my $err;
 971        my $array = wantarray;
 972        try {
 973                if ($array) {
 974                        @result = &$code;
 975                } else {
 976                        $result[0] = &$code;
 977                }
 978        } catch Git::Error::Command with {
 979                my $E = shift;
 980                $err = $errmsg;
 981                $err =~ s/\%s/$E->cmdline()/ge;
 982                $err =~ s/\%d/$E->value()/ge;
 983                # We can't croak here since Error.pm would mangle
 984                # that to Error::Simple.
 985        };
 986        $err and croak $err;
 987        return $array ? @result : $result[0];
 988}
 989
 990
 991=back
 992
 993=head1 COPYRIGHT
 994
 995Copyright 2006 by Petr Baudis E<lt>pasky@suse.czE<gt>.
 996
 997This module is free software; it may be used, copied, modified
 998and distributed under the terms of the GNU General Public Licence,
 999either version 2, or (at your option) any later version.
1000
1001=cut
1002
1003
1004# Take raw method argument list and return ($obj, @args) in case
1005# the method was called upon an instance and (undef, @args) if
1006# it was called directly.
1007sub _maybe_self {
1008        # This breaks inheritance. Oh well.
1009        ref $_[0] eq 'Git' ? @_ : (undef, @_);
1010}
1011
1012# Check if the command id is something reasonable.
1013sub _check_valid_cmd {
1014        my ($cmd) = @_;
1015        $cmd =~ /^[a-z0-9A-Z_-]+$/ or throw Error::Simple("bad command: $cmd");
1016}
1017
1018# Common backend for the pipe creators.
1019sub _command_common_pipe {
1020        my $direction = shift;
1021        my ($self, @p) = _maybe_self(@_);
1022        my (%opts, $cmd, @args);
1023        if (ref $p[0]) {
1024                ($cmd, @args) = @{shift @p};
1025                %opts = ref $p[0] ? %{$p[0]} : @p;
1026        } else {
1027                ($cmd, @args) = @p;
1028        }
1029        _check_valid_cmd($cmd);
1030
1031        my $fh;
1032        if ($^O eq 'MSWin32') {
1033                # ActiveState Perl
1034                #defined $opts{STDERR} and
1035                #       warn 'ignoring STDERR option - running w/ ActiveState';
1036                $direction eq '-|' or
1037                        die 'input pipe for ActiveState not implemented';
1038                # the strange construction with *ACPIPE is just to
1039                # explain the tie below that we want to bind to
1040                # a handle class, not scalar. It is not known if
1041                # it is something specific to ActiveState Perl or
1042                # just a Perl quirk.
1043                tie (*ACPIPE, 'Git::activestate_pipe', $cmd, @args);
1044                $fh = *ACPIPE;
1045
1046        } else {
1047                my $pid = open($fh, $direction);
1048                if (not defined $pid) {
1049                        throw Error::Simple("open failed: $!");
1050                } elsif ($pid == 0) {
1051                        if (defined $opts{STDERR}) {
1052                                close STDERR;
1053                        }
1054                        if ($opts{STDERR}) {
1055                                open (STDERR, '>&', $opts{STDERR})
1056                                        or die "dup failed: $!";
1057                        }
1058                        _cmd_exec($self, $cmd, @args);
1059                }
1060        }
1061        return wantarray ? ($fh, join(' ', $cmd, @args)) : $fh;
1062}
1063
1064# When already in the subprocess, set up the appropriate state
1065# for the given repository and execute the git command.
1066sub _cmd_exec {
1067        my ($self, @args) = @_;
1068        if ($self) {
1069                $self->repo_path() and $ENV{'GIT_DIR'} = $self->repo_path();
1070                $self->wc_path() and chdir($self->wc_path());
1071                $self->wc_subdir() and chdir($self->wc_subdir());
1072        }
1073        _execv_git_cmd(@args);
1074        die qq[exec "@args" failed: $!];
1075}
1076
1077# Execute the given Git command ($_[0]) with arguments ($_[1..])
1078# by searching for it at proper places.
1079sub _execv_git_cmd { exec('git', @_); }
1080
1081# Close pipe to a subprocess.
1082sub _cmd_close {
1083        my ($fh, $ctx) = @_;
1084        if (not close $fh) {
1085                if ($!) {
1086                        # It's just close, no point in fatalities
1087                        carp "error closing pipe: $!";
1088                } elsif ($? >> 8) {
1089                        # The caller should pepper this.
1090                        throw Git::Error::Command($ctx, $? >> 8);
1091                }
1092                # else we might e.g. closed a live stream; the command
1093                # dying of SIGPIPE would drive us here.
1094        }
1095}
1096
1097
1098sub DESTROY {
1099        my ($self) = @_;
1100        $self->_close_hash_and_insert_object();
1101        $self->_close_cat_blob();
1102}
1103
1104
1105# Pipe implementation for ActiveState Perl.
1106
1107package Git::activestate_pipe;
1108use strict;
1109
1110sub TIEHANDLE {
1111        my ($class, @params) = @_;
1112        # FIXME: This is probably horrible idea and the thing will explode
1113        # at the moment you give it arguments that require some quoting,
1114        # but I have no ActiveState clue... --pasky
1115        # Let's just hope ActiveState Perl does at least the quoting
1116        # correctly.
1117        my @data = qx{git @params};
1118        bless { i => 0, data => \@data }, $class;
1119}
1120
1121sub READLINE {
1122        my $self = shift;
1123        if ($self->{i} >= scalar @{$self->{data}}) {
1124                return undef;
1125        }
1126        my $i = $self->{i};
1127        if (wantarray) {
1128                $self->{i} = $#{$self->{'data'}} + 1;
1129                return splice(@{$self->{'data'}}, $i);
1130        }
1131        $self->{i} = $i + 1;
1132        return $self->{'data'}->[ $i ];
1133}
1134
1135sub CLOSE {
1136        my $self = shift;
1137        delete $self->{data};
1138        delete $self->{i};
1139}
1140
1141sub EOF {
1142        my $self = shift;
1143        return ($self->{i} >= scalar @{$self->{data}});
1144}
1145
1146
11471; # Famous last words