=head1 NAME

Git - Perl interface to the Git version control system

=cut


package Git;

# NOTE(review): only `use strict` is enabled here; `use warnings` is absent.
# Confirm whether that is deliberate before turning it on.
use strict;


# Everything in this BEGIN block runs at compile time: the package
# globals are declared and filled in, the Exporter interface is set up,
# helper modules are imported and finally the XS part is loaded.
BEGIN {

our ($VERSION, @ISA, @EXPORT, @EXPORT_OK);

# Totally unstable API.
$VERSION = '0.01';


=head1 SYNOPSIS

  use Git;

  my $version = Git::command_oneline('version');

  git_cmd_try { Git::command_noisy('update-server-info') }
              '%s failed w/ code %d';

  my $repo = Git->repository (Directory => '/srv/git/cogito.git');


  my @revs = $repo->command('rev-list', '--since=last monday', '--all');

  my ($fh, $c) = $repo->command_output_pipe('rev-list', '--since=last monday', '--all');
  my $lastrev = <$fh>; chomp $lastrev;
  $repo->command_close_pipe($fh, $c);

  my $lastrev = $repo->command_oneline( [ 'rev-list', '--all' ],
                                        STDERR => 0 );

=cut


require Exporter;

@ISA = qw(Exporter);

# git_cmd_try is the only function exported by default.
@EXPORT = qw(git_cmd_try);

# Methods which can be called as standalone functions as well:
@EXPORT_OK = qw(command command_oneline command_noisy
                command_output_pipe command_input_pipe command_close_pipe
                version exec_path hash_object git_cmd_try);


=head1 DESCRIPTION

This module provides Perl scripts an easy way to interface the Git version
control system. The modules have an easy and well-tested way to call arbitrary
Git commands; in the future, the interface will also provide specialized
methods for easily performing operations which are not totally trivial to do
over the generic command interface.

While some commands can be executed outside of any context (e.g. 'version'
or 'init-db'), most operations require a repository context, which in practice
means getting an instance of the Git object using the repository() constructor.
(In the future, we will also get a new_repository() constructor.) All commands
called as methods of the object are then executed in the context of the
repository.

Part of the "repository state" is also information about path to the attached
working copy (unless you work with a bare repository). You can also navigate
inside of the working copy using the C<wc_chdir()> method. (Note that
the repository object is self-contained and will not change working directory
of your process.)

TODO: In the future, we might also do

	my $remoterepo = $repo->remote_repository (Name => 'cogito', Branch => 'master');
	$remoterepo ||= Git->remote_repository ('http://git.or.cz/cogito.git/');
	my @refs = $remoterepo->refs();

Currently, the module merely wraps calls to external Git tools. In the future,
it will provide a much faster way to interact with Git by linking directly
to libgit. This should be completely opaque to the user, though (performance
increase notwithstanding).

=cut


use Carp qw(carp croak); # but croak is bad - throw instead
use Error qw(:try);
use Cwd qw(abs_path);

# Load the compiled (XS) half of the module.
require XSLoader;
XSLoader::load('Git', $VERSION);

}


=head1 CONSTRUCTORS

=over 4

=item repository ( OPTIONS )

=item repository ( DIRECTORY )

=item repository ()

Construct a new repository object.
C<OPTIONS> are passed in a hash like fashion, using key and value pairs.
Possible options are:

B<Repository> - Path to the Git repository.

B<WorkingCopy> - Path to the associated working copy; not strictly required
as many commands will happily crunch on a bare repository.

B<WorkingSubdir> - Subdirectory in the working copy to work inside.
Just left undefined if you do not want to limit the scope of operations.

B<Directory> - Path to the Git working directory in its usual setup.
The C<.git> directory is searched in the directory and all the parent
directories; if found, C<WorkingCopy> is set to the directory containing
it and C<Repository> to the C<.git> directory itself.
If no C<.git>
directory was found, the C<Directory> is assumed to be a bare repository,
C<Repository> is set to point at it and C<WorkingCopy> is left undefined.
If the C<$GIT_DIR> environment variable is set, things behave as expected
as well.

You should not use both C<Directory> and either of C<Repository> and
C<WorkingCopy> - the results of that are undefined.

Alternatively, a directory path may be passed as a single scalar argument
to the constructor; it is equivalent to setting only the C<Directory> option
field.

Calling the constructor with no options whatsoever is equivalent to
calling it with C<< Directory => '.' >>. In general, if you are building
a standard porcelain command, simply doing C<< Git->repository() >> should
do the right thing and setup the object to reflect exactly where the user
is right now.

=cut

sub repository {
    my $class = shift;
    my @args = @_;
    my %opts = ();
    my $self;

    # Accept either a single directory path or a key/value option list.
    if (defined $args[0]) {
        if ($#args % 2 != 1) {
            # Not a hash.
            $#args == 0 or throw Error::Simple("bad usage");
            %opts = ( Directory => $args[0] );
        } else {
            %opts = @args;
        }
    }

    # With neither Repository nor WorkingCopy given, start the lookup
    # from the Directory option, defaulting to the current directory.
    if (not defined $opts{Repository} and not defined $opts{WorkingCopy}) {
        $opts{Directory} ||= '.';
    }

    if ($opts{Directory}) {
        -d $opts{Directory} or throw Error::Simple("Directory not found:$!");

        # Ask git itself where the repository is; a failing rev-parse
        # simply leaves $dir undefined and we try the bare layout below.
        my $search = Git->repository(WorkingCopy => $opts{Directory});
        my $dir;
        try {
            $dir = $search->command_oneline(['rev-parse', '--git-dir'],
                                            STDERR => 0);
        } catch Git::Error::Command with {
            $dir = undef;
        };

        if ($dir) {
            # A relative --git-dir is relative to the directory we ran in.
            $dir =~ m#^/# or $dir = $opts{Directory} . '/' . $dir;
            $opts{Repository} = $dir;

            # If --git-dir went ok, this shouldn't die either.
            my $prefix = $search->command_oneline('rev-parse', '--show-prefix');
            $dir = abs_path($opts{Directory}) . '/';
            if ($prefix) {
                if (substr($dir, -length($prefix)) ne $prefix) {
                    throw Error::Simple("rev-parse confused me - $dir does not have trailing $prefix");
                }
                # Strip the prefix to get the working copy root.
                substr($dir, -length($prefix)) = '';
            }
            $opts{WorkingCopy} = $dir;
            $opts{WorkingSubdir} = $prefix;

        } else {
            # A bare repository? Let's see...
            $dir = $opts{Directory};

            unless (-d "$dir/refs" and -d "$dir/objects" and -e "$dir/HEAD") {
                # Mimic git-rev-parse --git-dir error message:
                throw Error::Simple('fatal: Not a git repository');
            }
            my $search = Git->repository(Repository => $dir);
            try {
                $search->command('symbolic-ref', 'HEAD');
            } catch Git::Error::Command with {
                # Mimic git-rev-parse --git-dir error message:
                throw Error::Simple('fatal: Not a git repository');
            };
            # The semicolon above is required: try/catch from Error.pm is
            # an ordinary expression, and without the terminator the
            # assignment below is not parsed as a statement of its own.

            $opts{Repository} = abs_path($dir);
        }

        delete $opts{Directory};
    }

    $self = { opts => \%opts };
    bless $self, $class;
}


=back

=head1 METHODS

=over 4

=item command ( COMMAND [, ARGUMENTS... ] )

=item command ( [ COMMAND, ARGUMENTS... ], { Opt => Val ... } )

Execute the given Git C<COMMAND> (specify it without the 'git-'
prefix), optionally with the specified extra C<ARGUMENTS>.

The second more elaborate form can be used if you want to further adjust
the command execution. Currently, only one option is supported:

B<STDERR> - How to deal with the command's error output. By default (C<undef>)
it is delivered to the caller's C<STDERR>. A false value (0 or '') will cause
it to be thrown away. If you want to process it, you can get it in a filehandle
you specify, but you must be extremely careful; if the error output is not
very short and you want to read it in the same process as where you called
C<command()>, you are set up for a nice deadlock!

The method can be called without any instance or on a specified Git repository
(in that case the command will be run in the repository context).

In scalar context, it returns all the command output in a single string
(verbatim).

In array context, it returns an array containing lines printed to the
command's stdout (without trailing newlines).

In both cases, the command's stdin and stderr are the same as the caller's.

=cut

sub command {
    my ($pipe, $ctx) = command_output_pipe(@_);
    my $want = wantarray;

    if (not defined $want) {
        # Void context: no output was collected, so there is nothing
        # to attach to a possible exception.
        _cmd_close($pipe, $ctx);

    } elsif ($want) {
        # List context: one chomped element per output line.
        my @output = <$pipe>;
        chomp @output;
        try {
            _cmd_close($pipe, $ctx);
        } catch Git::Error::Command with {
            # Attach what we have read so far and pass the error on.
            my $failure = shift;
            $failure->{'-outputref'} = \@output;
            $failure->throw;
        };
        return @output;

    } else {
        # Scalar context: slurp the whole output verbatim.
        local $/;
        my $output = <$pipe>;
        try {
            _cmd_close($pipe, $ctx);
        } catch Git::Error::Command with {
            # Attach what we have read so far and pass the error on.
            my $failure = shift;
            $failure->{'-outputref'} = \$output;
            $failure->throw;
        };
        return $output;
    }
}


=item command_oneline ( COMMAND [, ARGUMENTS... ] )

=item command_oneline ( [ COMMAND, ARGUMENTS... ], { Opt => Val ... } )

Execute the given C<COMMAND> in the same way as command()
does but always return a scalar string containing the first line
of the command's standard output.

=cut

sub command_oneline {
    my ($pipe, $ctx) = command_output_pipe(@_);

    # Only the first line is of interest; it stays undef when the
    # command printed nothing.
    my $first = <$pipe>;
    chomp $first if defined $first;
    try {
        _cmd_close($pipe, $ctx);
    } catch Git::Error::Command with {
        # Attach the line we have read and pass the error on.
        my $failure = shift;
        $failure->{'-outputref'} = \$first;
        $failure->throw;
    };
    return $first;
}


=item command_output_pipe ( COMMAND [, ARGUMENTS... ] )

=item command_output_pipe ( [ COMMAND, ARGUMENTS... ], { Opt => Val ... } )

Execute the given C<COMMAND> in the same way as command()
does but return a pipe filehandle from which the command output can be
read.

The function can return C<($pipe, $ctx)> in array context.
See C<command_close_pipe()> for details.

=cut

sub command_output_pipe {
    # '-|' makes the shared backend open a pipe we read from.
    return _command_common_pipe('-|', @_);
}


=item command_input_pipe ( COMMAND [, ARGUMENTS... ] )

=item command_input_pipe ( [ COMMAND, ARGUMENTS... ], { Opt => Val ... } )

Execute the given C<COMMAND> in the same way as command_output_pipe()
does but return an input pipe filehandle instead; the command output
is not captured.

The function can return C<($pipe, $ctx)> in array context.
See C<command_close_pipe()> for details.

=cut

sub command_input_pipe {
    # '|-' makes the shared backend open a pipe we write to.
    return _command_common_pipe('|-', @_);
}


=item command_close_pipe ( PIPE [, CTX ] )

Close the C<PIPE> as returned from C<command_*_pipe()>, checking
whether the command finished successfully. The optional C<CTX> argument
is required if you want to see the command name in the error message,
and it is the second value returned by C<command_*_pipe()> when
called in array context. The call idiom is:

	my ($fh, $ctx) = $r->command_output_pipe('status');
	while (<$fh>) { ... }
	$r->command_close_pipe($fh, $ctx);

Note that you should not rely on whatever actually is in C<CTX>;
currently it is simply the command name but in future the context might
have more complicated structure.

=cut

sub command_close_pipe {
    # The instance (if any) is not needed for closing the pipe.
    my (undef, $pipe, $ctx) = _maybe_self(@_);
    return _cmd_close($pipe, $ctx || '<unknown>');
}


=item command_noisy ( COMMAND [, ARGUMENTS... ] )

Execute the given C<COMMAND> in the same way as command() does but do not
capture the command output - the standard output is not redirected and goes
to the standard output of the caller application.

While the method is called command_noisy(), you might want to as well use
it for the most silent Git commands which you know will never pollute your
stdout but you want to avoid the overhead of the pipe setup when calling them.

The function returns only after the command has finished running.

=cut

sub command_noisy {
    my ($self, $cmd, @args) = _maybe_self(@_);
    _check_valid_cmd($cmd);

    my $child = fork;
    defined $child
        or throw Error::Simple("fork failed:$!");

    # In the child: turn into the git command.
    _cmd_exec($self, $cmd, @args) if $child == 0;

    # In the parent: wait for the child and report a non-zero exit code.
    if (waitpid($child, 0) > 0 and ($? >> 8) != 0) {
        throw Git::Error::Command(join(' ', $cmd, @args), $? >> 8);
    }
}


=item version ()

Return the Git version in use.

Implementation of this function is very fast; no external command calls
are involved.

=cut

# Implemented in Git.xs.


=item exec_path ()

Return path to the Git sub-command executables (the same as
C<git --exec-path>). Useful mostly only internally.

Implementation of this function is very fast; no external command calls
are involved.

=cut

# Implemented in Git.xs.


=item repo_path ()

Return path to the git repository. Must be called on a repository instance.

=cut

sub repo_path {
    my ($self) = @_;
    return $self->{opts}->{Repository};
}


=item wc_path ()

Return path to the working copy. Must be called on a repository instance.

=cut

sub wc_path {
    my ($self) = @_;
    return $self->{opts}->{WorkingCopy};
}


=item wc_subdir ()

Return path to the subdirectory inside of a working copy. Must be called
on a repository instance.

=cut

sub wc_subdir {
    my ($self) = @_;
    my $opts = $self->{opts} ||= {};

    # A missing (or otherwise false) subdirectory is stored as ''.
    $opts->{WorkingSubdir} = '' unless $opts->{WorkingSubdir};
    return $opts->{WorkingSubdir};
}


=item wc_chdir ( SUBDIR )

Change the working copy subdirectory to work within. The C<SUBDIR> is
relative to the working copy root directory (not the current subdirectory).
Must be called on a repository instance attached to a working copy
and the directory must exist.

=cut

sub wc_chdir {
    my ($self, $subdir) = @_;

    # Without a working copy there is nothing to navigate in.
    my $root = $self->wc_path();
    $root or throw Error::Simple("bare repository");

    unless (-d "$root/$subdir") {
        throw Error::Simple("subdir not found:$!");
    }
    # Of course we will not "hold" the subdirectory so anyone
    # can delete it now and we will never know. But at least we tried.

    $self->{opts}->{WorkingSubdir} = $subdir;
}


=item hash_object ( TYPE, FILENAME )

=item hash_object ( TYPE, FILEHANDLE )

Compute the SHA1 object id of the given C<FILENAME> (or data waiting in
C<FILEHANDLE>) considering it is of the C<TYPE> object type (C<blob>,
C<commit>, C<tree>).

In case of C<FILEHANDLE> passed instead of file name, all the data
available are read and hashed, and the filehandle is automatically
closed. The file handle should be freshly opened - if you have already
read anything from the file handle, the results are undefined (since
this function works directly with the file descriptor and internal
PerlIO buffering might have messed things up).

The method can be called without any instance or on a specified Git repository,
it makes zero difference.

The function returns the SHA1 hash.

Implementation of this function is very fast; no external command calls
are involved.

=cut

# Implemented in Git.xs.



=back

=head1 ERROR HANDLING

All functions are supposed to throw Perl exceptions in case of errors.
See the L<Error> module on how to catch those. Most exceptions are mere
L<Error::Simple> instances.

However, the C<command()>, C<command_oneline()> and C<command_noisy()>
function suite can throw C<Git::Error::Command> exceptions as well: those are
thrown when the external command returns an error code and contain the error
code as well as access to the captured command's output. The exception class
provides the usual C<stringify> and C<value> (command's exit code) methods and
in addition also a C<cmd_output> method that returns either an array or a
string with the captured command output (depending on the original function
call context; C<command_noisy()> returns C<undef>) and C<cmdline> which
returns the command and its arguments (but without proper quoting).

Note that the C<command_*_pipe()> functions cannot throw this exception since
they have no idea whether the command failed or not. You will only find out
at the time you C<close> the pipe; if you want to have that automated,
use C<command_close_pipe()>, which can throw the exception.

=cut

{
    package Git::Error::Command;

    @Git::Error::Command::ISA = qw(Error);

    # Construct the exception.
    #   CMDLINE   - the command and its arguments as a single string
    #   VALUE     - the exit code of the command (coerced to a number)
    #   OUTPUTREF - optional reference to the captured output: an array
    #               reference (list of lines) or a scalar reference
    sub new {
        my $self = shift;
        my $cmdline = '' . shift;
        my $value = 0 + shift;
        my $outputref = shift;
        my (@args) = ();

        # Skip this frame when Error.pm records where the error came from.
        local $Error::Depth = $Error::Depth + 1;

        push(@args, '-cmdline', $cmdline);
        push(@args, '-value', $value);
        push(@args, '-outputref', $outputref);

        $self->SUPER::new(-text => 'command returned error', @args);
    }

    # "<cmdline>: <error text>: <exit code>\n"
    sub stringify {
        my $self = shift;
        my $text = $self->SUPER::stringify;
        $self->cmdline() . ': ' . $text . ': ' . $self->value() . "\n";
    }

    # The command and its arguments (without proper quoting).
    sub cmdline {
        my $self = shift;
        $self->{'-cmdline'};
    }

    # The output captured before the command failed: the list of lines
    # when an array was attached, the string when a scalar was attached.
    # When no output was attached at all (e.g. command_noisy()) return
    # undef (an empty list in list context) instead of dereferencing
    # an undefined value.
    sub cmd_output {
        my $self = shift;
        my $ref = $self->{'-outputref'};
        defined $ref or return;
        if (ref $ref eq 'ARRAY') {
            return @$ref;
        } else { # SCALAR
            return $$ref;
        }
    }
}

=over 4

=item git_cmd_try { CODE } ERRMSG

This magical statement will automatically catch any C<Git::Error::Command>
exceptions thrown by C<CODE> and make your program die with C<ERRMSG>
on its lips; the message will have %s substituted for the command line
and %d for the exit status. This statement is useful mostly for producing
more user-friendly error messages.

In case of no exception caught the statement returns C<CODE>'s return value.

Note that this is the only auto-exported function.

=cut

sub git_cmd_try(&$) {
    my ($code, $errmsg) = @_;
    my @result;
    my $err;
    my $failed;
    my $array = wantarray;
    try {
        # Run CODE in the context git_cmd_try itself was called in.
        if ($array) {
            @result = $code->();
        } else {
            $result[0] = $code->();
        }
    } catch Git::Error::Command with {
        my $E = shift;
        $failed = 1;
        $err = $errmsg;
        # Expand both placeholders in a single pass so that a literal
        # "%d" inside the command line (think --pretty=format:%d) is
        # not mistaken for the exit status placeholder.
        $err =~ s/\%([sd])/$1 eq 's' ? $E->cmdline() : $E->value()/ge;
        # We can't croak here since Error.pm would mangle
        # that to Error::Simple.
    };
    # Decide on the flag, not on the message: a message that happens to
    # be false ('' or '0') must not swallow the error.
    $failed and croak $err;
    return $array ? @result : $result[0];
}


=back

=head1 COPYRIGHT

Copyright 2006 by Petr Baudis E<lt>pasky@suse.czE<gt>.

This module is free software; it may be used, copied, modified
and distributed under the terms of the GNU General Public Licence,
either version 2, or (at your option) any later version.

=cut


# Take raw method argument list and return ($obj, @args) in case
# the method was called upon an instance and (undef, @args) if
# it was called directly.
sub _maybe_self {
    require Scalar::Util;

    # Any blessed object that is-a Git counts as an instance, so
    # subclasses work as well. Plain strings (including class names)
    # are always treated as ordinary arguments.
    my $first = $_[0];
    return (Scalar::Util::blessed($first) && $first->isa('Git'))
        ? @_
        : (undef, @_);
}

# Check if the command id is something reasonable: a non-empty run of
# letters, digits, '_' and '-'. Throws Error::Simple otherwise.
sub _check_valid_cmd {
    my ($cmd) = @_;
    # \A...\z rather than ^...$ so that a trailing newline is rejected.
    return if defined $cmd and $cmd =~ /\A[a-z0-9A-Z_-]+\z/;

    $cmd = '' unless defined $cmd;
    throw Error::Simple("bad command:$cmd");
}

# Common backend for the pipe creators.
#   DIRECTION - '-|' to read the command's output, '|-' to feed its input
#   then the caller's raw argument list: an optional instance followed by
#   either (COMMAND, ARGUMENTS...) or ([COMMAND, ARGUMENTS...], OPTIONS)
#   where OPTIONS is a hash reference or a flat key/value list.
# Returns the pipe filehandle; in list context also the context string
# (the command joined with its arguments) for _cmd_close().
sub _command_common_pipe {
    my $direction = shift;
    my ($self, @p) = _maybe_self(@_);
    my (%opts, $cmd, @args);
    if (ref $p[0]) {
        ($cmd, @args) = @{shift @p};
        %opts = ref $p[0] ? %{$p[0]} : @p;
    } else {
        ($cmd, @args) = @p;
    }
    _check_valid_cmd($cmd);

    my $fh;
    if ($^O eq '##INSERT_ACTIVESTATE_STRING_HERE##') {
        # ActiveState Perl
        #defined $opts{STDERR} and
        #    warn 'ignoring STDERR option - running w/ ActiveState';
        $direction eq '-|' or
            die 'input pipe for ActiveState not implemented';
        # NOTE(review): tie() on a plain scalar normally dispatches to
        # TIESCALAR while the class only provides TIEHANDLE - confirm
        # before enabling this branch.
        tie ($fh, 'Git::activestate_pipe', $cmd, @args);

    } else {
        # Forking open: returns the child's pid in the parent and 0 in
        # the child, whose STDOUT/STDIN is connected to $fh.
        my $pid = open($fh, $direction);
        if (not defined $pid) {
            throw Error::Simple("open failed:$!");
        } elsif ($pid == 0) {
            # Child. A defined STDERR option replaces our STDERR:
            # a false value discards it, a true one is dup'ed onto it.
            if (defined $opts{STDERR}) {
                close STDERR;
            }
            if ($opts{STDERR}) {
                open (STDERR, '>&', $opts{STDERR})
                    or die "dup failed:$!";
            }
            _cmd_exec($self, $cmd, @args);
        }
    }
    return wantarray ? ($fh, join(' ', $cmd, @args)) : $fh;
}

# When already in the subprocess, set up the appropriate state
# for the given repository and execute the git command.
sub _cmd_exec {
    # Arguments: the repository instance (or undef) followed by the git
    # command and its arguments. Never returns: either the process image
    # is replaced or we die.
    # NOTE(review): the chdir() results are not checked, so a vanished
    # working copy lets the command run in the current directory.
    my ($self, @args) = @_;
    if ($self) {
        $self->repo_path() and $ENV{'GIT_DIR'} = $self->repo_path();
        $self->wc_path() and chdir($self->wc_path());
        $self->wc_subdir() and chdir($self->wc_subdir());
    }
    _execv_git_cmd(@args);
    die "exec failed:$!";
}

# Execute the given Git command ($_[0]) with arguments ($_[1..])
# by searching for it at proper places.
# _execv_git_cmd(), implemented in Git.xs.

# Close pipe to a subprocess.
# A failing close with $! set is only warned about; a non-zero exit
# code of the command is thrown as Git::Error::Command carrying CTX.
sub _cmd_close {
    my ($fh, $ctx) = @_;
    if (not close $fh) {
        if ($!) {
            # It's just close, no point in fatalities
            carp "error closing pipe:$!";
        } elsif ($? >> 8) {
            # The caller should pepper this.
            throw Git::Error::Command($ctx, $? >> 8);
        }
        # else we might e.g. closed a live stream; the command
        # dying of SIGPIPE would drive us here.
    }
}


# Trickery for .xs routines: In order to avoid having some horrid
# C code trying to do stuff with undefs and hashes, we gate all
# xs calls through the following and in case we are being ran upon
# an instance call a C part of the gate which will set up the
# environment properly.
sub _call_gate {
    my $xsfunc = shift;
    my ($self, @args) = _maybe_self(@_);

    if (defined $self) {
        # XXX: We ignore the WorkingCopy! To properly support
        # that will require heavy changes in libgit.

        # XXX: And we ignore everything else as well. libgit
        # at least needs to be extended to let us specify
        # the $GIT_DIR instead of looking it up in environment.
        #xs_call_gate($self->{opts}->{Repository});
    }

    # Having to call throw from the C code is a sure path to insanity.
    local $SIG{__DIE__} = sub { throw Error::Simple("@_"); };
    $xsfunc->(@args);
}

# Route calls to undefined Git::foo() to the XS routine Git::xs_foo()
# through _call_gate(). A missing xs_* routine is reported instead of
# being looked up again.
sub AUTOLOAD {
    my $xsname;
    our $AUTOLOAD;
    ($xsname = $AUTOLOAD) =~ s/.*:://;
    throw Error::Simple("&Git::$xsname not defined") if $xsname =~ /^xs_/;
    $xsname = 'xs_' . $xsname;
    _call_gate(\&$xsname, @_);
}

# Defined explicitly so that object destruction never reaches AUTOLOAD.
sub DESTROY { }


# Pipe implementation for ActiveState Perl.

package Git::activestate_pipe;
use strict;

# Run the command right away and keep all of its output lines in memory.
sub TIEHANDLE {
    my ($class, @params) = @_;
    # FIXME: This is probably horrible idea and the thing will explode
    # at the moment you give it arguments that require some quoting,
    # but I have no ActiveState clue... --pasky
    # NOTE(review): the arguments reach the shell unquoted via qx{}.
    my $cmdline = join " ", @params;
    my @data = qx{$cmdline};
    bless { i => 0, data => \@data }, $class;
}

# Scalar context: return the next line, or undef at end of data.
# List context: return all the remaining lines (an empty list at end
# of data), which is what "my @lines = <$fh>" expects.
sub READLINE {
    my $self = shift;
    my $data = $self->{data} || [];   # empty once the handle is closed
    my $pos = $self->{i} || 0;

    return if $pos >= scalar @$data;

    if (wantarray) {
        $self->{i} = scalar @$data;
        return @{$data}[ $pos .. $#{$data} ];
    }
    $self->{i} = $pos + 1;
    return $data->[$pos];
}

# Drop the buffered output.
sub CLOSE {
    my $self = shift;
    delete $self->{data};
    delete $self->{i};
}

# True once every buffered line has been handed out (or after CLOSE).
sub EOF {
    my $self = shift;
    my $data = $self->{data} || [];
    return (($self->{i} || 0) >= scalar @$data);
}


1; # Famous last words