gitweb / gitweb.perlon commit Allow passing of configuration parameters in the command line (8b1fa77)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use strict;
  11use warnings;
  12use CGI qw(:standard :escapeHTML -nosticky);
  13use CGI::Util qw(unescape);
  14use CGI::Carp qw(fatalsToBrowser);
  15use Encode;
  16use Fcntl ':mode';
  17use File::Find qw();
  18use File::Basename qw(basename);
  19binmode STDOUT, ':utf8';
  20
  21our $t0;
  22if (eval { require Time::HiRes; 1; }) {
  23        $t0 = [Time::HiRes::gettimeofday()];
  24}
  25our $number_of_git_cmds = 0;
  26
  27BEGIN {
  28        CGI->compile() if $ENV{'MOD_PERL'};
  29}
  30
  31our $cgi = new CGI;
  32our $version = "++GIT_VERSION++";
  33our $my_url = $cgi->url();
  34our $my_uri = $cgi->url(-absolute => 1);
  35
  36# Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  37# needed and used only for URLs with nonempty PATH_INFO
  38our $base_url = $my_url;
  39
  40# When the script is used as DirectoryIndex, the URL does not contain the name
  41# of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  42# have to do it ourselves. We make $path_info global because it's also used
  43# later on.
  44#
  45# Another issue with the script being the DirectoryIndex is that the resulting
  46# $my_url data is not the full script URL: this is good, because we want
  47# generated links to keep implying the script name if it wasn't explicitly
  48# indicated in the URL we're handling, but it means that $my_url cannot be used
  49# as base URL.
  50# Therefore, if we needed to strip PATH_INFO, then we know that we have
  51# to build the base URL ourselves:
  52our $path_info = $ENV{"PATH_INFO"};
  53if ($path_info) {
  54        if ($my_url =~ s,\Q$path_info\E$,, &&
  55            $my_uri =~ s,\Q$path_info\E$,, &&
  56            defined $ENV{'SCRIPT_NAME'}) {
  57                $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  58        }
  59}
  60
  61# core git executable to use
  62# this can just be "git" if your webserver has a sensible PATH
  63our $GIT = "++GIT_BINDIR++/git";
  64
  65# absolute fs-path which will be prepended to the project path
  66#our $projectroot = "/pub/scm";
  67our $projectroot = "++GITWEB_PROJECTROOT++";
  68
  69# fs traversing limit for getting project list
  70# the number is relative to the projectroot
  71our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  72
  73# target of the home link on top of all pages
  74our $home_link = $my_uri || "/";
  75
  76# string of the home link on top of all pages
  77our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  78
  79# name of your site or organization to appear in page titles
  80# replace this with something more descriptive for clearer bookmarks
  81our $site_name = "++GITWEB_SITENAME++"
  82                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  83
  84# filename of html text to include at top of each page
  85our $site_header = "++GITWEB_SITE_HEADER++";
  86# html text to include at home page
  87our $home_text = "++GITWEB_HOMETEXT++";
  88# filename of html text to include at bottom of each page
  89our $site_footer = "++GITWEB_SITE_FOOTER++";
  90
  91# URI of stylesheets
  92our @stylesheets = ("++GITWEB_CSS++");
  93# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
  94our $stylesheet = undef;
  95# URI of GIT logo (72x27 size)
  96our $logo = "++GITWEB_LOGO++";
  97# URI of GIT favicon, assumed to be image/png type
  98our $favicon = "++GITWEB_FAVICON++";
  99# URI of gitweb.js (JavaScript code for gitweb)
 100our $javascript = "++GITWEB_JS++";
 101
 102# URI and label (title) of GIT logo link
 103#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 104#our $logo_label = "git documentation";
 105our $logo_url = "http://git-scm.com/";
 106our $logo_label = "git homepage";
 107
 108# source of projects list
 109our $projects_list = "++GITWEB_LIST++";
 110
 111# the width (in characters) of the projects list "Description" column
 112our $projects_list_description_width = 25;
 113
 114# default order of projects list
 115# valid values are none, project, descr, owner, and age
 116our $default_projects_order = "project";
 117
 118# show repository only if this file exists
 119# (only effective if this variable evaluates to true)
 120our $export_ok = "++GITWEB_EXPORT_OK++";
 121
 122# show repository only if this subroutine returns true
 123# when given the path to the project, for example:
 124#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 125our $export_auth_hook = undef;
 126
 127# only allow viewing of repositories also shown on the overview page
 128our $strict_export = "++GITWEB_STRICT_EXPORT++";
 129
 130# list of git base URLs used for URL to where fetch project from,
 131# i.e. full URL is "$git_base_url/$project"
 132our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 133
 134# default blob_plain mimetype and default charset for text/plain blob
 135our $default_blob_plain_mimetype = 'text/plain';
 136our $default_text_plain_charset  = undef;
 137
 138# file to use for guessing MIME types before trying /etc/mime.types
 139# (relative to the current git repository)
 140our $mimetypes_file = undef;
 141
 142# assume this charset if line contains non-UTF-8 characters;
 143# it should be valid encoding (see Encoding::Supported(3pm) for list),
 144# for which encoding all byte sequences are valid, for example
 145# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 146# could be even 'utf-8' for the old behavior)
 147our $fallback_encoding = 'latin1';
 148
 149# rename detection options for git-diff and git-diff-tree
 150# - default is '-M', with the cost proportional to
 151#   (number of removed files) * (number of new files).
 152# - more costly is '-C' (which implies '-M'), with the cost proportional to
 153#   (number of changed files + number of removed files) * (number of new files)
 154# - even more costly is '-C', '--find-copies-harder' with cost
 155#   (number of files in the original tree) * (number of new files)
 156# - one might want to include '-B' option, e.g. '-B', '-M'
 157our @diff_opts = ('-M'); # taken from git_commit
 158
 159# Disables features that would allow repository owners to inject script into
 160# the gitweb domain.
 161our $prevent_xss = 0;
 162
 163# information about snapshot formats that gitweb is capable of serving
 164our %known_snapshot_formats = (
 165        # name => {
 166        #       'display' => display name,
 167        #       'type' => mime type,
 168        #       'suffix' => filename suffix,
 169        #       'format' => --format for git-archive,
 170        #       'compressor' => [compressor command and arguments]
 171        #                       (array reference, optional)
 172        #       'disabled' => boolean (optional)}
 173        #
 174        'tgz' => {
 175                'display' => 'tar.gz',
 176                'type' => 'application/x-gzip',
 177                'suffix' => '.tar.gz',
 178                'format' => 'tar',
 179                'compressor' => ['gzip']},
 180
 181        'tbz2' => {
 182                'display' => 'tar.bz2',
 183                'type' => 'application/x-bzip2',
 184                'suffix' => '.tar.bz2',
 185                'format' => 'tar',
 186                'compressor' => ['bzip2']},
 187
 188        'txz' => {
 189                'display' => 'tar.xz',
 190                'type' => 'application/x-xz',
 191                'suffix' => '.tar.xz',
 192                'format' => 'tar',
 193                'compressor' => ['xz'],
 194                'disabled' => 1},
 195
 196        'zip' => {
 197                'display' => 'zip',
 198                'type' => 'application/x-zip',
 199                'suffix' => '.zip',
 200                'format' => 'zip'},
 201);
 202
 203# Aliases so we understand old gitweb.snapshot values in repository
 204# configuration.
 205our %known_snapshot_format_aliases = (
 206        'gzip'  => 'tgz',
 207        'bzip2' => 'tbz2',
 208        'xz'    => 'txz',
 209
 210        # backward compatibility: legacy gitweb config support
 211        'x-gzip' => undef, 'gz' => undef,
 212        'x-bzip2' => undef, 'bz2' => undef,
 213        'x-zip' => undef, '' => undef,
 214);
 215
 216# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 217# are changed, it may be appropriate to change these values too via
 218# $GITWEB_CONFIG.
 219our %avatar_size = (
 220        'default' => 16,
 221        'double'  => 32
 222);
 223
 224# Used to set the maximum load that we will still respond to gitweb queries.
 225# If server load exceed this value then return "503 server busy" error.
 226# If gitweb cannot determined server load, it is taken to be 0.
 227# Leave it undefined (or set to 'undef') to turn off load checking.
 228our $maxload = 300;
 229
 230# You define site-wide feature defaults here; override them with
 231# $GITWEB_CONFIG as necessary.
 232our %feature = (
 233        # feature => {
 234        #       'sub' => feature-sub (subroutine),
 235        #       'override' => allow-override (boolean),
 236        #       'default' => [ default options...] (array reference)}
 237        #
 238        # if feature is overridable (it means that allow-override has true value),
 239        # then feature-sub will be called with default options as parameters;
 240        # return value of feature-sub indicates if to enable specified feature
 241        #
 242        # if there is no 'sub' key (no feature-sub), then feature cannot be
 243        # overriden
 244        #
 245        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 246        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 247        # is enabled
 248
 249        # Enable the 'blame' blob view, showing the last commit that modified
 250        # each line in the file. This can be very CPU-intensive.
 251
 252        # To enable system wide have in $GITWEB_CONFIG
 253        # $feature{'blame'}{'default'} = [1];
 254        # To have project specific config enable override in $GITWEB_CONFIG
 255        # $feature{'blame'}{'override'} = 1;
 256        # and in project config gitweb.blame = 0|1;
 257        'blame' => {
 258                'sub' => sub { feature_bool('blame', @_) },
 259                'override' => 0,
 260                'default' => [0]},
 261
 262        # Enable the 'snapshot' link, providing a compressed archive of any
 263        # tree. This can potentially generate high traffic if you have large
 264        # project.
 265
 266        # Value is a list of formats defined in %known_snapshot_formats that
 267        # you wish to offer.
 268        # To disable system wide have in $GITWEB_CONFIG
 269        # $feature{'snapshot'}{'default'} = [];
 270        # To have project specific config enable override in $GITWEB_CONFIG
 271        # $feature{'snapshot'}{'override'} = 1;
 272        # and in project config, a comma-separated list of formats or "none"
 273        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 274        'snapshot' => {
 275                'sub' => \&feature_snapshot,
 276                'override' => 0,
 277                'default' => ['tgz']},
 278
 279        # Enable text search, which will list the commits which match author,
 280        # committer or commit text to a given string.  Enabled by default.
 281        # Project specific override is not supported.
 282        'search' => {
 283                'override' => 0,
 284                'default' => [1]},
 285
 286        # Enable grep search, which will list the files in currently selected
 287        # tree containing the given string. Enabled by default. This can be
 288        # potentially CPU-intensive, of course.
 289
 290        # To enable system wide have in $GITWEB_CONFIG
 291        # $feature{'grep'}{'default'} = [1];
 292        # To have project specific config enable override in $GITWEB_CONFIG
 293        # $feature{'grep'}{'override'} = 1;
 294        # and in project config gitweb.grep = 0|1;
 295        'grep' => {
 296                'sub' => sub { feature_bool('grep', @_) },
 297                'override' => 0,
 298                'default' => [1]},
 299
 300        # Enable the pickaxe search, which will list the commits that modified
 301        # a given string in a file. This can be practical and quite faster
 302        # alternative to 'blame', but still potentially CPU-intensive.
 303
 304        # To enable system wide have in $GITWEB_CONFIG
 305        # $feature{'pickaxe'}{'default'} = [1];
 306        # To have project specific config enable override in $GITWEB_CONFIG
 307        # $feature{'pickaxe'}{'override'} = 1;
 308        # and in project config gitweb.pickaxe = 0|1;
 309        'pickaxe' => {
 310                'sub' => sub { feature_bool('pickaxe', @_) },
 311                'override' => 0,
 312                'default' => [1]},
 313
 314        # Enable showing size of blobs in a 'tree' view, in a separate
 315        # column, similar to what 'ls -l' does.  This cost a bit of IO.
 316
 317        # To disable system wide have in $GITWEB_CONFIG
 318        # $feature{'show-sizes'}{'default'} = [0];
 319        # To have project specific config enable override in $GITWEB_CONFIG
 320        # $feature{'show-sizes'}{'override'} = 1;
 321        # and in project config gitweb.showsizes = 0|1;
 322        'show-sizes' => {
 323                'sub' => sub { feature_bool('showsizes', @_) },
 324                'override' => 0,
 325                'default' => [1]},
 326
 327        # Make gitweb use an alternative format of the URLs which can be
 328        # more readable and natural-looking: project name is embedded
 329        # directly in the path and the query string contains other
 330        # auxiliary information. All gitweb installations recognize
 331        # URL in either format; this configures in which formats gitweb
 332        # generates links.
 333
 334        # To enable system wide have in $GITWEB_CONFIG
 335        # $feature{'pathinfo'}{'default'} = [1];
 336        # Project specific override is not supported.
 337
 338        # Note that you will need to change the default location of CSS,
 339        # favicon, logo and possibly other files to an absolute URL. Also,
 340        # if gitweb.cgi serves as your indexfile, you will need to force
 341        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 342        'pathinfo' => {
 343                'override' => 0,
 344                'default' => [0]},
 345
 346        # Make gitweb consider projects in project root subdirectories
 347        # to be forks of existing projects. Given project $projname.git,
 348        # projects matching $projname/*.git will not be shown in the main
 349        # projects list, instead a '+' mark will be added to $projname
 350        # there and a 'forks' view will be enabled for the project, listing
 351        # all the forks. If project list is taken from a file, forks have
 352        # to be listed after the main project.
 353
 354        # To enable system wide have in $GITWEB_CONFIG
 355        # $feature{'forks'}{'default'} = [1];
 356        # Project specific override is not supported.
 357        'forks' => {
 358                'override' => 0,
 359                'default' => [0]},
 360
 361        # Insert custom links to the action bar of all project pages.
 362        # This enables you mainly to link to third-party scripts integrating
 363        # into gitweb; e.g. git-browser for graphical history representation
 364        # or custom web-based repository administration interface.
 365
 366        # The 'default' value consists of a list of triplets in the form
 367        # (label, link, position) where position is the label after which
 368        # to insert the link and link is a format string where %n expands
 369        # to the project name, %f to the project path within the filesystem,
 370        # %h to the current hash (h gitweb parameter) and %b to the current
 371        # hash base (hb gitweb parameter); %% expands to %.
 372
 373        # To enable system wide have in $GITWEB_CONFIG e.g.
 374        # $feature{'actions'}{'default'} = [('graphiclog',
 375        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 376        # Project specific override is not supported.
 377        'actions' => {
 378                'override' => 0,
 379                'default' => []},
 380
 381        # Allow gitweb scan project content tags described in ctags/
 382        # of project repository, and display the popular Web 2.0-ish
 383        # "tag cloud" near the project list. Note that this is something
 384        # COMPLETELY different from the normal Git tags.
 385
 386        # gitweb by itself can show existing tags, but it does not handle
 387        # tagging itself; you need an external application for that.
 388        # For an example script, check Girocco's cgi/tagproj.cgi.
 389        # You may want to install the HTML::TagCloud Perl module to get
 390        # a pretty tag cloud instead of just a list of tags.
 391
 392        # To enable system wide have in $GITWEB_CONFIG
 393        # $feature{'ctags'}{'default'} = ['path_to_tag_script'];
 394        # Project specific override is not supported.
 395        'ctags' => {
 396                'override' => 0,
 397                'default' => [0]},
 398
 399        # The maximum number of patches in a patchset generated in patch
 400        # view. Set this to 0 or undef to disable patch view, or to a
 401        # negative number to remove any limit.
 402
 403        # To disable system wide have in $GITWEB_CONFIG
 404        # $feature{'patches'}{'default'} = [0];
 405        # To have project specific config enable override in $GITWEB_CONFIG
 406        # $feature{'patches'}{'override'} = 1;
 407        # and in project config gitweb.patches = 0|n;
 408        # where n is the maximum number of patches allowed in a patchset.
 409        'patches' => {
 410                'sub' => \&feature_patches,
 411                'override' => 0,
 412                'default' => [16]},
 413
 414        # Avatar support. When this feature is enabled, views such as
 415        # shortlog or commit will display an avatar associated with
 416        # the email of the committer(s) and/or author(s).
 417
 418        # Currently available providers are gravatar and picon.
 419        # If an unknown provider is specified, the feature is disabled.
 420
 421        # Gravatar depends on Digest::MD5.
 422        # Picon currently relies on the indiana.edu database.
 423
 424        # To enable system wide have in $GITWEB_CONFIG
 425        # $feature{'avatar'}{'default'} = ['<provider>'];
 426        # where <provider> is either gravatar or picon.
 427        # To have project specific config enable override in $GITWEB_CONFIG
 428        # $feature{'avatar'}{'override'} = 1;
 429        # and in project config gitweb.avatar = <provider>;
 430        'avatar' => {
 431                'sub' => \&feature_avatar,
 432                'override' => 0,
 433                'default' => ['']},
 434
 435        # Enable displaying how much time and how many git commands
 436        # it took to generate and display page.  Disabled by default.
 437        # Project specific override is not supported.
 438        'timed' => {
 439                'override' => 0,
 440                'default' => [0]},
 441
 442        # Enable turning some links into links to actions which require
 443        # JavaScript to run (like 'blame_incremental').  Not enabled by
 444        # default.  Project specific override is currently not supported.
 445        'javascript-actions' => {
 446                'override' => 0,
 447                'default' => [0]},
 448);
 449
 450sub gitweb_get_feature {
 451        my ($name) = @_;
 452        return unless exists $feature{$name};
 453        my ($sub, $override, @defaults) = (
 454                $feature{$name}{'sub'},
 455                $feature{$name}{'override'},
 456                @{$feature{$name}{'default'}});
 457        # project specific override is possible only if we have project
 458        our $git_dir; # global variable, declared later
 459        if (!$override || !defined $git_dir) {
 460                return @defaults;
 461        }
 462        if (!defined $sub) {
 463                warn "feature $name is not overridable";
 464                return @defaults;
 465        }
 466        return $sub->(@defaults);
 467}
 468
 469# A wrapper to check if a given feature is enabled.
 470# With this, you can say
 471#
 472#   my $bool_feat = gitweb_check_feature('bool_feat');
 473#   gitweb_check_feature('bool_feat') or somecode;
 474#
 475# instead of
 476#
 477#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 478#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 479#
 480sub gitweb_check_feature {
 481        return (gitweb_get_feature(@_))[0];
 482}
 483
 484
 485sub feature_bool {
 486        my $key = shift;
 487        my ($val) = git_get_project_config($key, '--bool');
 488
 489        if (!defined $val) {
 490                return ($_[0]);
 491        } elsif ($val eq 'true') {
 492                return (1);
 493        } elsif ($val eq 'false') {
 494                return (0);
 495        }
 496}
 497
 498sub feature_snapshot {
 499        my (@fmts) = @_;
 500
 501        my ($val) = git_get_project_config('snapshot');
 502
 503        if ($val) {
 504                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 505        }
 506
 507        return @fmts;
 508}
 509
 510sub feature_patches {
 511        my @val = (git_get_project_config('patches', '--int'));
 512
 513        if (@val) {
 514                return @val;
 515        }
 516
 517        return ($_[0]);
 518}
 519
 520sub feature_avatar {
 521        my @val = (git_get_project_config('avatar'));
 522
 523        return @val ? @val : @_;
 524}
 525
 526# checking HEAD file with -e is fragile if the repository was
 527# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 528# and then pruned.
 529sub check_head_link {
 530        my ($dir) = @_;
 531        my $headfile = "$dir/HEAD";
 532        return ((-e $headfile) ||
 533                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 534}
 535
 536sub check_export_ok {
 537        my ($dir) = @_;
 538        return (check_head_link($dir) &&
 539                (!$export_ok || -e "$dir/$export_ok") &&
 540                (!$export_auth_hook || $export_auth_hook->($dir)));
 541}
 542
 543# process alternate names for backward compatibility
 544# filter out unsupported (unknown) snapshot formats
 545sub filter_snapshot_fmts {
 546        my @fmts = @_;
 547
 548        @fmts = map {
 549                exists $known_snapshot_format_aliases{$_} ?
 550                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 551        @fmts = grep {
 552                exists $known_snapshot_formats{$_} &&
 553                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 554}
 555
 556our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 557our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 558# die if there are errors parsing config file
 559if (-e $GITWEB_CONFIG) {
 560        do $GITWEB_CONFIG;
 561        die $@ if $@;
 562} elsif (-e $GITWEB_CONFIG_SYSTEM) {
 563        do $GITWEB_CONFIG_SYSTEM;
 564        die $@ if $@;
 565}
 566
 567# Get loadavg of system, to compare against $maxload.
 568# Currently it requires '/proc/loadavg' present to get loadavg;
 569# if it is not present it returns 0, which means no load checking.
 570sub get_loadavg {
 571        if( -e '/proc/loadavg' ){
 572                open my $fd, '<', '/proc/loadavg'
 573                        or return 0;
 574                my @load = split(/\s+/, scalar <$fd>);
 575                close $fd;
 576
 577                # The first three columns measure CPU and IO utilization of the last one,
 578                # five, and 10 minute periods.  The fourth column shows the number of
 579                # currently running processes and the total number of processes in the m/n
 580                # format.  The last column displays the last process ID used.
 581                return $load[0] || 0;
 582        }
 583        # additional checks for load average should go here for things that don't export
 584        # /proc/loadavg
 585
 586        return 0;
 587}
 588
 589# version of the core git binary
 590our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 591$number_of_git_cmds++;
 592
 593$projects_list ||= $projectroot;
 594
 595if (defined $maxload && get_loadavg() > $maxload) {
 596        die_error(503, "The load average on the server is too high");
 597}
 598
 599# ======================================================================
 600# input validation and dispatch
 601
 602# input parameters can be collected from a variety of sources (presently, CGI
 603# and PATH_INFO), so we define an %input_params hash that collects them all
 604# together during validation: this allows subsequent uses (e.g. href()) to be
 605# agnostic of the parameter origin
 606
 607our %input_params = ();
 608
 609# input parameters are stored with the long parameter name as key. This will
 610# also be used in the href subroutine to convert parameters to their CGI
 611# equivalent, and since the href() usage is the most frequent one, we store
 612# the name -> CGI key mapping here, instead of the reverse.
 613#
 614# XXX: Warning: If you touch this, check the search form for updating,
 615# too.
 616
 617our @cgi_param_mapping = (
 618        project => "p",
 619        action => "a",
 620        file_name => "f",
 621        file_parent => "fp",
 622        hash => "h",
 623        hash_parent => "hp",
 624        hash_base => "hb",
 625        hash_parent_base => "hpb",
 626        page => "pg",
 627        order => "o",
 628        searchtext => "s",
 629        searchtype => "st",
 630        snapshot_format => "sf",
 631        extra_options => "opt",
 632        search_use_regexp => "sr",
 633        # this must be last entry (for manipulation from JavaScript)
 634        javascript => "js"
 635);
 636our %cgi_param_mapping = @cgi_param_mapping;
 637
 638# we will also need to know the possible actions, for validation
 639our %actions = (
 640        "blame" => \&git_blame,
 641        "blame_incremental" => \&git_blame_incremental,
 642        "blame_data" => \&git_blame_data,
 643        "blobdiff" => \&git_blobdiff,
 644        "blobdiff_plain" => \&git_blobdiff_plain,
 645        "blob" => \&git_blob,
 646        "blob_plain" => \&git_blob_plain,
 647        "commitdiff" => \&git_commitdiff,
 648        "commitdiff_plain" => \&git_commitdiff_plain,
 649        "commit" => \&git_commit,
 650        "forks" => \&git_forks,
 651        "heads" => \&git_heads,
 652        "history" => \&git_history,
 653        "log" => \&git_log,
 654        "patch" => \&git_patch,
 655        "patches" => \&git_patches,
 656        "rss" => \&git_rss,
 657        "atom" => \&git_atom,
 658        "search" => \&git_search,
 659        "search_help" => \&git_search_help,
 660        "shortlog" => \&git_shortlog,
 661        "summary" => \&git_summary,
 662        "tag" => \&git_tag,
 663        "tags" => \&git_tags,
 664        "tree" => \&git_tree,
 665        "snapshot" => \&git_snapshot,
 666        "object" => \&git_object,
 667        # those below don't need $project
 668        "opml" => \&git_opml,
 669        "project_list" => \&git_project_list,
 670        "project_index" => \&git_project_index,
 671);
 672
 673# finally, we have the hash of allowed extra_options for the commands that
 674# allow them
 675our %allowed_options = (
 676        "--no-merges" => [ qw(rss atom log shortlog history) ],
 677);
 678
 679# fill %input_params with the CGI parameters. All values except for 'opt'
 680# should be single values, but opt can be an array. We should probably
 681# build an array of parameters that can be multi-valued, but since for the time
 682# being it's only this one, we just single it out
 683while (my ($name, $symbol) = each %cgi_param_mapping) {
 684        if ($symbol eq 'opt') {
 685                $input_params{$name} = [ $cgi->param($symbol) ];
 686        } else {
 687                $input_params{$name} = $cgi->param($symbol);
 688        }
 689}
 690
 691# now read PATH_INFO and update the parameter list for missing parameters
 692sub evaluate_path_info {
 693        return if defined $input_params{'project'};
 694        return if !$path_info;
 695        $path_info =~ s,^/+,,;
 696        return if !$path_info;
 697
 698        # find which part of PATH_INFO is project
 699        my $project = $path_info;
 700        $project =~ s,/+$,,;
 701        while ($project && !check_head_link("$projectroot/$project")) {
 702                $project =~ s,/*[^/]*$,,;
 703        }
 704        return unless $project;
 705        $input_params{'project'} = $project;
 706
 707        # do not change any parameters if an action is given using the query string
 708        return if $input_params{'action'};
 709        $path_info =~ s,^\Q$project\E/*,,;
 710
 711        # next, check if we have an action
 712        my $action = $path_info;
 713        $action =~ s,/.*$,,;
 714        if (exists $actions{$action}) {
 715                $path_info =~ s,^$action/*,,;
 716                $input_params{'action'} = $action;
 717        }
 718
 719        # list of actions that want hash_base instead of hash, but can have no
 720        # pathname (f) parameter
 721        my @wants_base = (
 722                'tree',
 723                'history',
 724        );
 725
 726        # we want to catch
 727        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 728        my ($parentrefname, $parentpathname, $refname, $pathname) =
 729                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?(.+?)(?::(.+))?$/);
 730
 731        # first, analyze the 'current' part
 732        if (defined $pathname) {
 733                # we got "branch:filename" or "branch:dir/"
 734                # we could use git_get_type(branch:pathname), but:
 735                # - it needs $git_dir
 736                # - it does a git() call
 737                # - the convention of terminating directories with a slash
 738                #   makes it superfluous
 739                # - embedding the action in the PATH_INFO would make it even
 740                #   more superfluous
 741                $pathname =~ s,^/+,,;
 742                if (!$pathname || substr($pathname, -1) eq "/") {
 743                        $input_params{'action'} ||= "tree";
 744                        $pathname =~ s,/$,,;
 745                } else {
 746                        # the default action depends on whether we had parent info
 747                        # or not
 748                        if ($parentrefname) {
 749                                $input_params{'action'} ||= "blobdiff_plain";
 750                        } else {
 751                                $input_params{'action'} ||= "blob_plain";
 752                        }
 753                }
 754                $input_params{'hash_base'} ||= $refname;
 755                $input_params{'file_name'} ||= $pathname;
 756        } elsif (defined $refname) {
 757                # we got "branch". In this case we have to choose if we have to
 758                # set hash or hash_base.
 759                #
 760                # Most of the actions without a pathname only want hash to be
 761                # set, except for the ones specified in @wants_base that want
 762                # hash_base instead. It should also be noted that hand-crafted
 763                # links having 'history' as an action and no pathname or hash
 764                # set will fail, but that happens regardless of PATH_INFO.
 765                $input_params{'action'} ||= "shortlog";
 766                if (grep { $_ eq $input_params{'action'} } @wants_base) {
 767                        $input_params{'hash_base'} ||= $refname;
 768                } else {
 769                        $input_params{'hash'} ||= $refname;
 770                }
 771        }
 772
 773        # next, handle the 'parent' part, if present
 774        if (defined $parentrefname) {
 775                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 776                # someproject/blobdiff/oldrev..newrev:/filename
 777                if ($parentpathname) {
 778                        $parentpathname =~ s,^/+,,;
 779                        $parentpathname =~ s,/$,,;
 780                        $input_params{'file_parent'} ||= $parentpathname;
 781                } else {
 782                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 783                }
 784                # we assume that hash_parent_base is wanted if a path was specified,
 785                # or if the action wants hash_base instead of hash
 786                if (defined $input_params{'file_parent'} ||
 787                        grep { $_ eq $input_params{'action'} } @wants_base) {
 788                        $input_params{'hash_parent_base'} ||= $parentrefname;
 789                } else {
 790                        $input_params{'hash_parent'} ||= $parentrefname;
 791                }
 792        }
 793
 794        # for the snapshot action, we allow URLs in the form
 795        # $project/snapshot/$hash.ext
 796        # where .ext determines the snapshot and gets removed from the
 797        # passed $refname to provide the $hash.
 798        #
 799        # To be able to tell that $refname includes the format extension, we
 800        # require the following two conditions to be satisfied:
 801        # - the hash input parameter MUST have been set from the $refname part
 802        #   of the URL (i.e. they must be equal)
 803        # - the snapshot format MUST NOT have been defined already (e.g. from
 804        #   CGI parameter sf)
 805        # It's also useless to try any matching unless $refname has a dot,
 806        # so we check for that too
 807        if (defined $input_params{'action'} &&
 808                $input_params{'action'} eq 'snapshot' &&
 809                defined $refname && index($refname, '.') != -1 &&
 810                $refname eq $input_params{'hash'} &&
 811                !defined $input_params{'snapshot_format'}) {
 812                # We loop over the known snapshot formats, checking for
 813                # extensions. Allowed extensions are both the defined suffix
 814                # (which includes the initial dot already) and the snapshot
 815                # format key itself, with a prepended dot
 816                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 817                        my $hash = $refname;
 818                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 819                                next;
 820                        }
 821                        my $sfx = $1;
 822                        # a valid suffix was found, so set the snapshot format
 823                        # and reset the hash parameter
 824                        $input_params{'snapshot_format'} = $fmt;
 825                        $input_params{'hash'} = $hash;
 826                        # we also set the format suffix to the one requested
 827                        # in the URL: this way a request for e.g. .tgz returns
 828                        # a .tgz instead of a .tar.gz
 829                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 830                        last;
 831                }
 832        }
 833}
 834evaluate_path_info();
 835
 836our $action = $input_params{'action'};
 837if (defined $action) {
 838        if (!validate_action($action)) {
 839                die_error(400, "Invalid action parameter");
 840        }
 841}
 842
 843# parameters which are pathnames
 844our $project = $input_params{'project'};
 845if (defined $project) {
 846        if (!validate_project($project)) {
 847                undef $project;
 848                die_error(404, "No such project");
 849        }
 850}
 851
 852our $file_name = $input_params{'file_name'};
 853if (defined $file_name) {
 854        if (!validate_pathname($file_name)) {
 855                die_error(400, "Invalid file parameter");
 856        }
 857}
 858
 859our $file_parent = $input_params{'file_parent'};
 860if (defined $file_parent) {
 861        if (!validate_pathname($file_parent)) {
 862                die_error(400, "Invalid file parent parameter");
 863        }
 864}
 865
 866# parameters which are refnames
 867our $hash = $input_params{'hash'};
 868if (defined $hash) {
 869        if (!validate_refname($hash)) {
 870                die_error(400, "Invalid hash parameter");
 871        }
 872}
 873
 874our $hash_parent = $input_params{'hash_parent'};
 875if (defined $hash_parent) {
 876        if (!validate_refname($hash_parent)) {
 877                die_error(400, "Invalid hash parent parameter");
 878        }
 879}
 880
 881our $hash_base = $input_params{'hash_base'};
 882if (defined $hash_base) {
 883        if (!validate_refname($hash_base)) {
 884                die_error(400, "Invalid hash base parameter");
 885        }
 886}
 887
 888our @extra_options = @{$input_params{'extra_options'}};
 889# @extra_options is always defined, since it can only be (currently) set from
 890# CGI, and $cgi->param() returns the empty array in array context if the param
 891# is not set
 892foreach my $opt (@extra_options) {
 893        if (not exists $allowed_options{$opt}) {
 894                die_error(400, "Invalid option parameter");
 895        }
 896        if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
 897                die_error(400, "Invalid option parameter for this action");
 898        }
 899}
 900
 901our $hash_parent_base = $input_params{'hash_parent_base'};
 902if (defined $hash_parent_base) {
 903        if (!validate_refname($hash_parent_base)) {
 904                die_error(400, "Invalid hash parent base parameter");
 905        }
 906}
 907
 908# other parameters
 909our $page = $input_params{'page'};
 910if (defined $page) {
 911        if ($page =~ m/[^0-9]/) {
 912                die_error(400, "Invalid page parameter");
 913        }
 914}
 915
 916our $searchtype = $input_params{'searchtype'};
 917if (defined $searchtype) {
 918        if ($searchtype =~ m/[^a-z]/) {
 919                die_error(400, "Invalid searchtype parameter");
 920        }
 921}
 922
 923our $search_use_regexp = $input_params{'search_use_regexp'};
 924
 925our $searchtext = $input_params{'searchtext'};
 926our $search_regexp;
 927if (defined $searchtext) {
 928        if (length($searchtext) < 2) {
 929                die_error(403, "At least two characters are required for search parameter");
 930        }
 931        $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
 932}
 933
 934# path to the current git repository
 935our $git_dir;
 936$git_dir = "$projectroot/$project" if $project;
 937
 938# list of supported snapshot formats
 939our @snapshot_fmts = gitweb_get_feature('snapshot');
 940@snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);
 941
 942# check that the avatar feature is set to a known provider name,
 943# and for each provider check if the dependencies are satisfied.
 944# if the provider name is invalid or the dependencies are not met,
 945# reset $git_avatar to the empty string.
 946our ($git_avatar) = gitweb_get_feature('avatar');
 947if ($git_avatar eq 'gravatar') {
 948        $git_avatar = '' unless (eval { require Digest::MD5; 1; });
 949} elsif ($git_avatar eq 'picon') {
 950        # no dependencies
 951} else {
 952        $git_avatar = '';
 953}
 954
 955# dispatch
 956if (!defined $action) {
 957        if (defined $hash) {
 958                $action = git_get_type($hash);
 959        } elsif (defined $hash_base && defined $file_name) {
 960                $action = git_get_type("$hash_base:$file_name");
 961        } elsif (defined $project) {
 962                $action = 'summary';
 963        } else {
 964                $action = 'project_list';
 965        }
 966}
 967if (!defined($actions{$action})) {
 968        die_error(400, "Unknown action");
 969}
 970if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
 971    !$project) {
 972        die_error(400, "Project needed");
 973}
 974$actions{$action}->();
 975exit;
 976
 977## ======================================================================
 978## action links
 979
 980sub href {
 981        my %params = @_;
 982        # default is to use -absolute url() i.e. $my_uri
 983        my $href = $params{-full} ? $my_url : $my_uri;
 984
 985        $params{'project'} = $project unless exists $params{'project'};
 986
 987        if ($params{-replay}) {
 988                while (my ($name, $symbol) = each %cgi_param_mapping) {
 989                        if (!exists $params{$name}) {
 990                                $params{$name} = $input_params{$name};
 991                        }
 992                }
 993        }
 994
 995        my $use_pathinfo = gitweb_check_feature('pathinfo');
 996        if ($use_pathinfo and defined $params{'project'}) {
 997                # try to put as many parameters as possible in PATH_INFO:
 998                #   - project name
 999                #   - action
1000                #   - hash_parent or hash_parent_base:/file_parent
1001                #   - hash or hash_base:/filename
1002                #   - the snapshot_format as an appropriate suffix
1003
1004                # When the script is the root DirectoryIndex for the domain,
1005                # $href here would be something like http://gitweb.example.com/
1006                # Thus, we strip any trailing / from $href, to spare us double
1007                # slashes in the final URL
1008                $href =~ s,/$,,;
1009
1010                # Then add the project name, if present
1011                $href .= "/".esc_url($params{'project'});
1012                delete $params{'project'};
1013
1014                # since we destructively absorb parameters, we keep this
1015                # boolean that remembers if we're handling a snapshot
1016                my $is_snapshot = $params{'action'} eq 'snapshot';
1017
1018                # Summary just uses the project path URL, any other action is
1019                # added to the URL
1020                if (defined $params{'action'}) {
1021                        $href .= "/".esc_url($params{'action'}) unless $params{'action'} eq 'summary';
1022                        delete $params{'action'};
1023                }
1024
1025                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
1026                # stripping nonexistent or useless pieces
1027                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
1028                        || $params{'hash_parent'} || $params{'hash'});
1029                if (defined $params{'hash_base'}) {
1030                        if (defined $params{'hash_parent_base'}) {
1031                                $href .= esc_url($params{'hash_parent_base'});
1032                                # skip the file_parent if it's the same as the file_name
1033                                if (defined $params{'file_parent'}) {
1034                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
1035                                                delete $params{'file_parent'};
1036                                        } elsif ($params{'file_parent'} !~ /\.\./) {
1037                                                $href .= ":/".esc_url($params{'file_parent'});
1038                                                delete $params{'file_parent'};
1039                                        }
1040                                }
1041                                $href .= "..";
1042                                delete $params{'hash_parent'};
1043                                delete $params{'hash_parent_base'};
1044                        } elsif (defined $params{'hash_parent'}) {
1045                                $href .= esc_url($params{'hash_parent'}). "..";
1046                                delete $params{'hash_parent'};
1047                        }
1048
1049                        $href .= esc_url($params{'hash_base'});
1050                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
1051                                $href .= ":/".esc_url($params{'file_name'});
1052                                delete $params{'file_name'};
1053                        }
1054                        delete $params{'hash'};
1055                        delete $params{'hash_base'};
1056                } elsif (defined $params{'hash'}) {
1057                        $href .= esc_url($params{'hash'});
1058                        delete $params{'hash'};
1059                }
1060
1061                # If the action was a snapshot, we can absorb the
1062                # snapshot_format parameter too
1063                if ($is_snapshot) {
1064                        my $fmt = $params{'snapshot_format'};
1065                        # snapshot_format should always be defined when href()
1066                        # is called, but just in case some code forgets, we
1067                        # fall back to the default
1068                        $fmt ||= $snapshot_fmts[0];
1069                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
1070                        delete $params{'snapshot_format'};
1071                }
1072        }
1073
1074        # now encode the parameters explicitly
1075        my @result = ();
1076        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
1077                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
1078                if (defined $params{$name}) {
1079                        if (ref($params{$name}) eq "ARRAY") {
1080                                foreach my $par (@{$params{$name}}) {
1081                                        push @result, $symbol . "=" . esc_param($par);
1082                                }
1083                        } else {
1084                                push @result, $symbol . "=" . esc_param($params{$name});
1085                        }
1086                }
1087        }
1088        $href .= "?" . join(';', @result) if scalar @result;
1089
1090        return $href;
1091}
1092
1093
1094## ======================================================================
1095## validation, quoting/unquoting and escaping
1096
1097sub validate_action {
1098        my $input = shift || return undef;
1099        return undef unless exists $actions{$input};
1100        return $input;
1101}
1102
1103sub validate_project {
1104        my $input = shift || return undef;
1105        if (!validate_pathname($input) ||
1106                !(-d "$projectroot/$input") ||
1107                !check_export_ok("$projectroot/$input") ||
1108                ($strict_export && !project_in_list($input))) {
1109                return undef;
1110        } else {
1111                return $input;
1112        }
1113}
1114
1115sub validate_pathname {
1116        my $input = shift || return undef;
1117
1118        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
1119        # at the beginning, at the end, and between slashes.
1120        # also this catches doubled slashes
1121        if ($input =~ m!(^|/)(|\.|\.\.)(/|$)!) {
1122                return undef;
1123        }
1124        # no null characters
1125        if ($input =~ m!\0!) {
1126                return undef;
1127        }
1128        return $input;
1129}
1130
1131sub validate_refname {
1132        my $input = shift || return undef;
1133
1134        # textual hashes are O.K.
1135        if ($input =~ m/^[0-9a-fA-F]{40}$/) {
1136                return $input;
1137        }
1138        # it must be correct pathname
1139        $input = validate_pathname($input)
1140                or return undef;
1141        # restrictions on ref name according to git-check-ref-format
1142        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
1143                return undef;
1144        }
1145        return $input;
1146}
1147
1148# decode sequences of octets in utf8 into Perl's internal form,
1149# which is utf-8 with utf8 flag set if needed.  gitweb writes out
1150# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
1151sub to_utf8 {
1152        my $str = shift;
1153        return undef unless defined $str;
1154        if (utf8::valid($str)) {
1155                utf8::decode($str);
1156                return $str;
1157        } else {
1158                return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
1159        }
1160}
1161
1162# quote unsafe chars, but keep the slash, even when it's not
1163# correct, but quoted slashes look too horrible in bookmarks
1164sub esc_param {
1165        my $str = shift;
1166        return undef unless defined $str;
1167        $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
1168        $str =~ s/ /\+/g;
1169        return $str;
1170}
1171
1172# quote unsafe chars in whole URL, so some charactrs cannot be quoted
1173sub esc_url {
1174        my $str = shift;
1175        return undef unless defined $str;
1176        $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&=])/sprintf("%%%02X", ord($1))/eg;
1177        $str =~ s/\+/%2B/g;
1178        $str =~ s/ /\+/g;
1179        return $str;
1180}
1181
1182# replace invalid utf8 character with SUBSTITUTION sequence
1183sub esc_html {
1184        my $str = shift;
1185        my %opts = @_;
1186
1187        return undef unless defined $str;
1188
1189        $str = to_utf8($str);
1190        $str = $cgi->escapeHTML($str);
1191        if ($opts{'-nbsp'}) {
1192                $str =~ s/ /&nbsp;/g;
1193        }
1194        $str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
1195        return $str;
1196}
1197
1198# quote control characters and escape filename to HTML
1199sub esc_path {
1200        my $str = shift;
1201        my %opts = @_;
1202
1203        return undef unless defined $str;
1204
1205        $str = to_utf8($str);
1206        $str = $cgi->escapeHTML($str);
1207        if ($opts{'-nbsp'}) {
1208                $str =~ s/ /&nbsp;/g;
1209        }
1210        $str =~ s|([[:cntrl:]])|quot_cec($1)|eg;
1211        return $str;
1212}
1213
1214# Make control characters "printable", using character escape codes (CEC)
1215sub quot_cec {
1216        my $cntrl = shift;
1217        my %opts = @_;
1218        my %es = ( # character escape codes, aka escape sequences
1219                "\t" => '\t',   # tab            (HT)
1220                "\n" => '\n',   # line feed      (LF)
1221                "\r" => '\r',   # carrige return (CR)
1222                "\f" => '\f',   # form feed      (FF)
1223                "\b" => '\b',   # backspace      (BS)
1224                "\a" => '\a',   # alarm (bell)   (BEL)
1225                "\e" => '\e',   # escape         (ESC)
1226                "\013" => '\v', # vertical tab   (VT)
1227                "\000" => '\0', # nul character  (NUL)
1228        );
1229        my $chr = ( (exists $es{$cntrl})
1230                    ? $es{$cntrl}
1231                    : sprintf('\%2x', ord($cntrl)) );
1232        if ($opts{-nohtml}) {
1233                return $chr;
1234        } else {
1235                return "<span class=\"cntrl\">$chr</span>";
1236        }
1237}
1238
1239# Alternatively use unicode control pictures codepoints,
1240# Unicode "printable representation" (PR)
1241sub quot_upr {
1242        my $cntrl = shift;
1243        my %opts = @_;
1244
1245        my $chr = sprintf('&#%04d;', 0x2400+ord($cntrl));
1246        if ($opts{-nohtml}) {
1247                return $chr;
1248        } else {
1249                return "<span class=\"cntrl\">$chr</span>";
1250        }
1251}
1252
1253# git may return quoted and escaped filenames
1254sub unquote {
1255        my $str = shift;
1256
1257        sub unq {
1258                my $seq = shift;
1259                my %es = ( # character escape codes, aka escape sequences
1260                        't' => "\t",   # tab            (HT, TAB)
1261                        'n' => "\n",   # newline        (NL)
1262                        'r' => "\r",   # return         (CR)
1263                        'f' => "\f",   # form feed      (FF)
1264                        'b' => "\b",   # backspace      (BS)
1265                        'a' => "\a",   # alarm (bell)   (BEL)
1266                        'e' => "\e",   # escape         (ESC)
1267                        'v' => "\013", # vertical tab   (VT)
1268                );
1269
1270                if ($seq =~ m/^[0-7]{1,3}$/) {
1271                        # octal char sequence
1272                        return chr(oct($seq));
1273                } elsif (exists $es{$seq}) {
1274                        # C escape sequence, aka character escape code
1275                        return $es{$seq};
1276                }
1277                # quoted ordinary character
1278                return $seq;
1279        }
1280
1281        if ($str =~ m/^"(.*)"$/) {
1282                # needs unquoting
1283                $str = $1;
1284                $str =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
1285        }
1286        return $str;
1287}
1288
1289# escape tabs (convert tabs to spaces)
1290sub untabify {
1291        my $line = shift;
1292
1293        while ((my $pos = index($line, "\t")) != -1) {
1294                if (my $count = (8 - ($pos % 8))) {
1295                        my $spaces = ' ' x $count;
1296                        $line =~ s/\t/$spaces/;
1297                }
1298        }
1299
1300        return $line;
1301}
1302
1303sub project_in_list {
1304        my $project = shift;
1305        my @list = git_get_projects_list();
1306        return @list && scalar(grep { $_->{'path'} eq $project } @list);
1307}
1308
1309## ----------------------------------------------------------------------
1310## HTML aware string manipulation
1311
1312# Try to chop given string on a word boundary between position
1313# $len and $len+$add_len. If there is no word boundary there,
1314# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
1315# (marking chopped part) would be longer than given string.
1316sub chop_str {
1317        my $str = shift;
1318        my $len = shift;
1319        my $add_len = shift || 10;
1320        my $where = shift || 'right'; # 'left' | 'center' | 'right'
1321
1322        # Make sure perl knows it is utf8 encoded so we don't
1323        # cut in the middle of a utf8 multibyte char.
1324        $str = to_utf8($str);
1325
1326        # allow only $len chars, but don't cut a word if it would fit in $add_len
1327        # if it doesn't fit, cut it if it's still longer than the dots we would add
1328        # remove chopped character entities entirely
1329
1330        # when chopping in the middle, distribute $len into left and right part
1331        # return early if chopping wouldn't make string shorter
1332        if ($where eq 'center') {
1333                return $str if ($len + 5 >= length($str)); # filler is length 5
1334                $len = int($len/2);
1335        } else {
1336                return $str if ($len + 4 >= length($str)); # filler is length 4
1337        }
1338
1339        # regexps: ending and beginning with word part up to $add_len
1340        my $endre = qr/.{$len}\w{0,$add_len}/;
1341        my $begre = qr/\w{0,$add_len}.{$len}/;
1342
1343        if ($where eq 'left') {
1344                $str =~ m/^(.*?)($begre)$/;
1345                my ($lead, $body) = ($1, $2);
1346                if (length($lead) > 4) {
1347                        $lead = " ...";
1348                }
1349                return "$lead$body";
1350
1351        } elsif ($where eq 'center') {
1352                $str =~ m/^($endre)(.*)$/;
1353                my ($left, $str)  = ($1, $2);
1354                $str =~ m/^(.*?)($begre)$/;
1355                my ($mid, $right) = ($1, $2);
1356                if (length($mid) > 5) {
1357                        $mid = " ... ";
1358                }
1359                return "$left$mid$right";
1360
1361        } else {
1362                $str =~ m/^($endre)(.*)$/;
1363                my $body = $1;
1364                my $tail = $2;
1365                if (length($tail) > 4) {
1366                        $tail = "... ";
1367                }
1368                return "$body$tail";
1369        }
1370}
1371
1372# takes the same arguments as chop_str, but also wraps a <span> around the
1373# result with a title attribute if it does get chopped. Additionally, the
1374# string is HTML-escaped.
1375sub chop_and_escape_str {
1376        my ($str) = @_;
1377
1378        my $chopped = chop_str(@_);
1379        if ($chopped eq $str) {
1380                return esc_html($chopped);
1381        } else {
1382                $str =~ s/[[:cntrl:]]/?/g;
1383                return $cgi->span({-title=>$str}, esc_html($chopped));
1384        }
1385}
1386
1387## ----------------------------------------------------------------------
1388## functions returning short strings
1389
1390# CSS class for given age value (in seconds)
1391sub age_class {
1392        my $age = shift;
1393
1394        if (!defined $age) {
1395                return "noage";
1396        } elsif ($age < 60*60*2) {
1397                return "age0";
1398        } elsif ($age < 60*60*24*2) {
1399                return "age1";
1400        } else {
1401                return "age2";
1402        }
1403}
1404
1405# convert age in seconds to "nn units ago" string
1406sub age_string {
1407        my $age = shift;
1408        my $age_str;
1409
1410        if ($age > 60*60*24*365*2) {
1411                $age_str = (int $age/60/60/24/365);
1412                $age_str .= " years ago";
1413        } elsif ($age > 60*60*24*(365/12)*2) {
1414                $age_str = int $age/60/60/24/(365/12);
1415                $age_str .= " months ago";
1416        } elsif ($age > 60*60*24*7*2) {
1417                $age_str = int $age/60/60/24/7;
1418                $age_str .= " weeks ago";
1419        } elsif ($age > 60*60*24*2) {
1420                $age_str = int $age/60/60/24;
1421                $age_str .= " days ago";
1422        } elsif ($age > 60*60*2) {
1423                $age_str = int $age/60/60;
1424                $age_str .= " hours ago";
1425        } elsif ($age > 60*2) {
1426                $age_str = int $age/60;
1427                $age_str .= " min ago";
1428        } elsif ($age > 2) {
1429                $age_str = int $age;
1430                $age_str .= " sec ago";
1431        } else {
1432                $age_str .= " right now";
1433        }
1434        return $age_str;
1435}
1436
1437use constant {
1438        S_IFINVALID => 0030000,
1439        S_IFGITLINK => 0160000,
1440};
1441
1442# submodule/subproject, a commit object reference
1443sub S_ISGITLINK {
1444        my $mode = shift;
1445
1446        return (($mode & S_IFMT) == S_IFGITLINK)
1447}
1448
1449# convert file mode in octal to symbolic file mode string
1450sub mode_str {
1451        my $mode = oct shift;
1452
1453        if (S_ISGITLINK($mode)) {
1454                return 'm---------';
1455        } elsif (S_ISDIR($mode & S_IFMT)) {
1456                return 'drwxr-xr-x';
1457        } elsif (S_ISLNK($mode)) {
1458                return 'lrwxrwxrwx';
1459        } elsif (S_ISREG($mode)) {
1460                # git cares only about the executable bit
1461                if ($mode & S_IXUSR) {
1462                        return '-rwxr-xr-x';
1463                } else {
1464                        return '-rw-r--r--';
1465                };
1466        } else {
1467                return '----------';
1468        }
1469}
1470
1471# convert file mode in octal to file type string
1472sub file_type {
1473        my $mode = shift;
1474
1475        if ($mode !~ m/^[0-7]+$/) {
1476                return $mode;
1477        } else {
1478                $mode = oct $mode;
1479        }
1480
1481        if (S_ISGITLINK($mode)) {
1482                return "submodule";
1483        } elsif (S_ISDIR($mode & S_IFMT)) {
1484                return "directory";
1485        } elsif (S_ISLNK($mode)) {
1486                return "symlink";
1487        } elsif (S_ISREG($mode)) {
1488                return "file";
1489        } else {
1490                return "unknown";
1491        }
1492}
1493
1494# convert file mode in octal to file type description string
1495sub file_type_long {
1496        my $mode = shift;
1497
1498        if ($mode !~ m/^[0-7]+$/) {
1499                return $mode;
1500        } else {
1501                $mode = oct $mode;
1502        }
1503
1504        if (S_ISGITLINK($mode)) {
1505                return "submodule";
1506        } elsif (S_ISDIR($mode & S_IFMT)) {
1507                return "directory";
1508        } elsif (S_ISLNK($mode)) {
1509                return "symlink";
1510        } elsif (S_ISREG($mode)) {
1511                if ($mode & S_IXUSR) {
1512                        return "executable";
1513                } else {
1514                        return "file";
1515                };
1516        } else {
1517                return "unknown";
1518        }
1519}
1520
1521
1522## ----------------------------------------------------------------------
1523## functions returning short HTML fragments, or transforming HTML fragments
1524## which don't belong to other sections
1525
1526# format line of commit message.
1527sub format_log_line_html {
1528        my $line = shift;
1529
1530        $line = esc_html($line, -nbsp=>1);
1531        $line =~ s{\b([0-9a-fA-F]{8,40})\b}{
1532                $cgi->a({-href => href(action=>"object", hash=>$1),
1533                                        -class => "text"}, $1);
1534        }eg;
1535
1536        return $line;
1537}
1538
1539# format marker of refs pointing to given object
1540
1541# the destination action is chosen based on object type and current context:
1542# - for annotated tags, we choose the tag view unless it's the current view
1543#   already, in which case we go to shortlog view
1544# - for other refs, we keep the current view if we're in history, shortlog or
1545#   log view, and select shortlog otherwise
1546sub format_ref_marker {
1547        my ($refs, $id) = @_;
1548        my $markers = '';
1549
1550        if (defined $refs->{$id}) {
1551                foreach my $ref (@{$refs->{$id}}) {
1552                        # this code exploits the fact that non-lightweight tags are the
1553                        # only indirect objects, and that they are the only objects for which
1554                        # we want to use tag instead of shortlog as action
1555                        my ($type, $name) = qw();
1556                        my $indirect = ($ref =~ s/\^\{\}$//);
1557                        # e.g. tags/v2.6.11 or heads/next
1558                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
1559                                $type = $1;
1560                                $name = $2;
1561                        } else {
1562                                $type = "ref";
1563                                $name = $ref;
1564                        }
1565
1566                        my $class = $type;
1567                        $class .= " indirect" if $indirect;
1568
1569                        my $dest_action = "shortlog";
1570
1571                        if ($indirect) {
1572                                $dest_action = "tag" unless $action eq "tag";
1573                        } elsif ($action =~ /^(history|(short)?log)$/) {
1574                                $dest_action = $action;
1575                        }
1576
1577                        my $dest = "";
1578                        $dest .= "refs/" unless $ref =~ m!^refs/!;
1579                        $dest .= $ref;
1580
1581                        my $link = $cgi->a({
1582                                -href => href(
1583                                        action=>$dest_action,
1584                                        hash=>$dest
1585                                )}, $name);
1586
1587                        $markers .= " <span class=\"$class\" title=\"$ref\">" .
1588                                $link . "</span>";
1589                }
1590        }
1591
1592        if ($markers) {
1593                return ' <span class="refs">'. $markers . '</span>';
1594        } else {
1595                return "";
1596        }
1597}
1598
1599# format, perhaps shortened and with markers, title line
1600sub format_subject_html {
1601        my ($long, $short, $href, $extra) = @_;
1602        $extra = '' unless defined($extra);
1603
1604        if (length($short) < length($long)) {
1605                $long =~ s/[[:cntrl:]]/?/g;
1606                return $cgi->a({-href => $href, -class => "list subject",
1607                                -title => to_utf8($long)},
1608                       esc_html($short)) . $extra;
1609        } else {
1610                return $cgi->a({-href => $href, -class => "list subject"},
1611                       esc_html($long)) . $extra;
1612        }
1613}
1614
1615# Rather than recomputing the url for an email multiple times, we cache it
1616# after the first hit. This gives a visible benefit in views where the avatar
1617# for the same email is used repeatedly (e.g. shortlog).
1618# The cache is shared by all avatar engines (currently gravatar only), which
1619# are free to use it as preferred. Since only one avatar engine is used for any
1620# given page, there's no risk for cache conflicts.
1621our %avatar_cache = ();
1622
1623# Compute the picon url for a given email, by using the picon search service over at
1624# http://www.cs.indiana.edu/picons/search.html
1625sub picon_url {
1626        my $email = lc shift;
1627        if (!$avatar_cache{$email}) {
1628                my ($user, $domain) = split('@', $email);
1629                $avatar_cache{$email} =
1630                        "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
1631                        "$domain/$user/" .
1632                        "users+domains+unknown/up/single";
1633        }
1634        return $avatar_cache{$email};
1635}
1636
1637# Compute the gravatar url for a given email, if it's not in the cache already.
1638# Gravatar stores only the part of the URL before the size, since that's the
1639# one computationally more expensive. This also allows reuse of the cache for
1640# different sizes (for this particular engine).
1641sub gravatar_url {
1642        my $email = lc shift;
1643        my $size = shift;
1644        $avatar_cache{$email} ||=
1645                "http://www.gravatar.com/avatar/" .
1646                        Digest::MD5::md5_hex($email) . "?s=";
1647        return $avatar_cache{$email} . $size;
1648}
1649
1650# Insert an avatar for the given $email at the given $size if the feature
1651# is enabled.
1652sub git_get_avatar {
1653        my ($email, %opts) = @_;
1654        my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
1655        my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
1656        $opts{-size} ||= 'default';
1657        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};
1658        my $url = "";
1659        if ($git_avatar eq 'gravatar') {
1660                $url = gravatar_url($email, $size);
1661        } elsif ($git_avatar eq 'picon') {
1662                $url = picon_url($email);
1663        }
1664        # Other providers can be added by extending the if chain, defining $url
1665        # as needed. If no variant puts something in $url, we assume avatars
1666        # are completely disabled/unavailable.
1667        if ($url) {
1668                return $pre_white .
1669                       "<img width=\"$size\" " .
1670                            "class=\"avatar\" " .
1671                            "src=\"$url\" " .
1672                            "alt=\"\" " .
1673                       "/>" . $post_white;
1674        } else {
1675                return "";
1676        }
1677}
1678
1679sub format_search_author {
1680        my ($author, $searchtype, $displaytext) = @_;
1681        my $have_search = gitweb_check_feature('search');
1682
1683        if ($have_search) {
1684                my $performed = "";
1685                if ($searchtype eq 'author') {
1686                        $performed = "authored";
1687                } elsif ($searchtype eq 'committer') {
1688                        $performed = "committed";
1689                }
1690
1691                return $cgi->a({-href => href(action=>"search", hash=>$hash,
1692                                searchtext=>$author,
1693                                searchtype=>$searchtype), class=>"list",
1694                                title=>"Search for commits $performed by $author"},
1695                                $displaytext);
1696
1697        } else {
1698                return $displaytext;
1699        }
1700}
1701
1702# format the author name of the given commit with the given tag
1703# the author name is chopped and escaped according to the other
1704# optional parameters (see chop_str).
1705sub format_author_html {
1706        my $tag = shift;
1707        my $co = shift;
1708        my $author = chop_and_escape_str($co->{'author_name'}, @_);
1709        return "<$tag class=\"author\">" .
1710               format_search_author($co->{'author_name'}, "author",
1711                       git_get_avatar($co->{'author_email'}, -pad_after => 1) .
1712                       $author) .
1713               "</$tag>";
1714}
1715
1716# format git diff header line, i.e. "diff --(git|combined|cc) ..."
1717sub format_git_diff_header_line {
1718        my $line = shift;
1719        my $diffinfo = shift;
1720        my ($from, $to) = @_;
1721
1722        if ($diffinfo->{'nparents'}) {
1723                # combined diff
1724                $line =~ s!^(diff (.*?) )"?.*$!$1!;
1725                if ($to->{'href'}) {
1726                        $line .= $cgi->a({-href => $to->{'href'}, -class => "path"},
1727                                         esc_path($to->{'file'}));
1728                } else { # file was deleted (no href)
1729                        $line .= esc_path($to->{'file'});
1730                }
1731        } else {
1732                # "ordinary" diff
1733                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
1734                if ($from->{'href'}) {
1735                        $line .= $cgi->a({-href => $from->{'href'}, -class => "path"},
1736                                         'a/' . esc_path($from->{'file'}));
1737                } else { # file was added (no href)
1738                        $line .= 'a/' . esc_path($from->{'file'});
1739                }
1740                $line .= ' ';
1741                if ($to->{'href'}) {
1742                        $line .= $cgi->a({-href => $to->{'href'}, -class => "path"},
1743                                         'b/' . esc_path($to->{'file'}));
1744                } else { # file was deleted
1745                        $line .= 'b/' . esc_path($to->{'file'});
1746                }
1747        }
1748
1749        return "<div class=\"diff header\">$line</div>\n";
1750}
1751
1752# format extended diff header line, before patch itself
1753sub format_extended_diff_header_line {
1754        my $line = shift;
1755        my $diffinfo = shift;
1756        my ($from, $to) = @_;
1757
1758        # match <path>
1759        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
1760                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
1761                                       esc_path($from->{'file'}));
1762        }
1763        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
1764                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
1765                                 esc_path($to->{'file'}));
1766        }
1767        # match single <mode>
1768        if ($line =~ m/\s(\d{6})$/) {
1769                $line .= '<span class="info"> (' .
1770                         file_type_long($1) .
1771                         ')</span>';
1772        }
1773        # match <hash>
1774        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
1775                # can match only for combined diff
1776                $line = 'index ';
1777                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
1778                        if ($from->{'href'}[$i]) {
1779                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
1780                                                  -class=>"hash"},
1781                                                 substr($diffinfo->{'from_id'}[$i],0,7));
1782                        } else {
1783                                $line .= '0' x 7;
1784                        }
1785                        # separator
1786                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
1787                }
1788                $line .= '..';
1789                if ($to->{'href'}) {
1790                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
1791                                         substr($diffinfo->{'to_id'},0,7));
1792                } else {
1793                        $line .= '0' x 7;
1794                }
1795
1796        } elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
1797                # can match only for ordinary diff
1798                my ($from_link, $to_link);
1799                if ($from->{'href'}) {
1800                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
1801                                             substr($diffinfo->{'from_id'},0,7));
1802                } else {
1803                        $from_link = '0' x 7;
1804                }
1805                if ($to->{'href'}) {
1806                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
1807                                           substr($diffinfo->{'to_id'},0,7));
1808                } else {
1809                        $to_link = '0' x 7;
1810                }
1811                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
1812                $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
1813        }
1814
1815        return $line . "<br/>\n";
1816}
1817
1818# format from-file/to-file diff header
1819sub format_diff_from_to_header {
1820        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
1821        my $line;
1822        my $result = '';
1823
1824        $line = $from_line;
1825        #assert($line =~ m/^---/) if DEBUG;
1826        # no extra formatting for "^--- /dev/null"
1827        if (! $diffinfo->{'nparents'}) {
1828                # ordinary (single parent) diff
1829                if ($line =~ m!^--- "?a/!) {
1830                        if ($from->{'href'}) {
1831                                $line = '--- a/' .
1832                                        $cgi->a({-href=>$from->{'href'}, -class=>"path"},
1833                                                esc_path($from->{'file'}));
1834                        } else {
1835                                $line = '--- a/' .
1836                                        esc_path($from->{'file'});
1837                        }
1838                }
1839                $result .= qq!<div class="diff from_file">$line</div>\n!;
1840
1841        } else {
1842                # combined diff (merge commit)
1843                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
1844                        if ($from->{'href'}[$i]) {
1845                                $line = '--- ' .
1846                                        $cgi->a({-href=>href(action=>"blobdiff",
1847                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
1848                                                             hash_parent_base=>$parents[$i],
1849                                                             file_parent=>$from->{'file'}[$i],
1850                                                             hash=>$diffinfo->{'to_id'},
1851                                                             hash_base=>$hash,
1852                                                             file_name=>$to->{'file'}),
1853                                                 -class=>"path",
1854                                                 -title=>"diff" . ($i+1)},
1855                                                $i+1) .
1856                                        '/' .
1857                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
1858                                                esc_path($from->{'file'}[$i]));
1859                        } else {
1860                                $line = '--- /dev/null';
1861                        }
1862                        $result .= qq!<div class="diff from_file">$line</div>\n!;
1863                }
1864        }
1865
1866        $line = $to_line;
1867        #assert($line =~ m/^\+\+\+/) if DEBUG;
1868        # no extra formatting for "^+++ /dev/null"
1869        if ($line =~ m!^\+\+\+ "?b/!) {
1870                if ($to->{'href'}) {
1871                        $line = '+++ b/' .
1872                                $cgi->a({-href=>$to->{'href'}, -class=>"path"},
1873                                        esc_path($to->{'file'}));
1874                } else {
1875                        $line = '+++ b/' .
1876                                esc_path($to->{'file'});
1877                }
1878        }
1879        $result .= qq!<div class="diff to_file">$line</div>\n!;
1880
1881        return $result;
1882}
1883
1884# create note for patch simplified by combined diff
1885sub format_diff_cc_simplified {
1886        my ($diffinfo, @parents) = @_;
1887        my $result = '';
1888
1889        $result .= "<div class=\"diff header\">" .
1890                   "diff --cc ";
1891        if (!is_deleted($diffinfo)) {
1892                $result .= $cgi->a({-href => href(action=>"blob",
1893                                                  hash_base=>$hash,
1894                                                  hash=>$diffinfo->{'to_id'},
1895                                                  file_name=>$diffinfo->{'to_file'}),
1896                                    -class => "path"},
1897                                   esc_path($diffinfo->{'to_file'}));
1898        } else {
1899                $result .= esc_path($diffinfo->{'to_file'});
1900        }
1901        $result .= "</div>\n" . # class="diff header"
1902                   "<div class=\"diff nodifferences\">" .
1903                   "Simple merge" .
1904                   "</div>\n"; # class="diff nodifferences"
1905
1906        return $result;
1907}
1908
1909# format patch (diff) line (not to be used for diff headers)
1910sub format_diff_line {
1911        my $line = shift;
1912        my ($from, $to) = @_;
1913        my $diff_class = "";
1914
1915        chomp $line;
1916
1917        if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
1918                # combined diff
1919                my $prefix = substr($line, 0, scalar @{$from->{'href'}});
1920                if ($line =~ m/^\@{3}/) {
1921                        $diff_class = " chunk_header";
1922                } elsif ($line =~ m/^\\/) {
1923                        $diff_class = " incomplete";
1924                } elsif ($prefix =~ tr/+/+/) {
1925                        $diff_class = " add";
1926                } elsif ($prefix =~ tr/-/-/) {
1927                        $diff_class = " rem";
1928                }
1929        } else {
1930                # assume ordinary diff
1931                my $char = substr($line, 0, 1);
1932                if ($char eq '+') {
1933                        $diff_class = " add";
1934                } elsif ($char eq '-') {
1935                        $diff_class = " rem";
1936                } elsif ($char eq '@') {
1937                        $diff_class = " chunk_header";
1938                } elsif ($char eq "\\") {
1939                        $diff_class = " incomplete";
1940                }
1941        }
1942        $line = untabify($line);
1943        if ($from && $to && $line =~ m/^\@{2} /) {
1944                my ($from_text, $from_start, $from_lines, $to_text, $to_start, $to_lines, $section) =
1945                        $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;
1946
1947                $from_lines = 0 unless defined $from_lines;
1948                $to_lines   = 0 unless defined $to_lines;
1949
1950                if ($from->{'href'}) {
1951                        $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
1952                                             -class=>"list"}, $from_text);
1953                }
1954                if ($to->{'href'}) {
1955                        $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
1956                                             -class=>"list"}, $to_text);
1957                }
1958                $line = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
1959                        "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
1960                return "<div class=\"diff$diff_class\">$line</div>\n";
1961        } elsif ($from && $to && $line =~ m/^\@{3}/) {
1962                my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;
1963                my (@from_text, @from_start, @from_nlines, $to_text, $to_start, $to_nlines);
1964
1965                @from_text = split(' ', $ranges);
1966                for (my $i = 0; $i < @from_text; ++$i) {
1967                        ($from_start[$i], $from_nlines[$i]) =
1968                                (split(',', substr($from_text[$i], 1)), 0);
1969                }
1970
1971                $to_text   = pop @from_text;
1972                $to_start  = pop @from_start;
1973                $to_nlines = pop @from_nlines;
1974
1975                $line = "<span class=\"chunk_info\">$prefix ";
1976                for (my $i = 0; $i < @from_text; ++$i) {
1977                        if ($from->{'href'}[$i]) {
1978                                $line .= $cgi->a({-href=>"$from->{'href'}[$i]#l$from_start[$i]",
1979                                                  -class=>"list"}, $from_text[$i]);
1980                        } else {
1981                                $line .= $from_text[$i];
1982                        }
1983                        $line .= " ";
1984                }
1985                if ($to->{'href'}) {
1986                        $line .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
1987                                          -class=>"list"}, $to_text);
1988                } else {
1989                        $line .= $to_text;
1990                }
1991                $line .= " $prefix</span>" .
1992                         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
1993                return "<div class=\"diff$diff_class\">$line</div>\n";
1994        }
1995        return "<div class=\"diff$diff_class\">" . esc_html($line, -nbsp=>1) . "</div>\n";
1996}
1997
1998# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
1999# linked.  Pass the hash of the tree/commit to snapshot.
2000sub format_snapshot_links {
2001        my ($hash) = @_;
2002        my $num_fmts = @snapshot_fmts;
2003        if ($num_fmts > 1) {
2004                # A parenthesized list of links bearing format names.
2005                # e.g. "snapshot (_tar.gz_ _zip_)"
2006                return "snapshot (" . join(' ', map
2007                        $cgi->a({
2008                                -href => href(
2009                                        action=>"snapshot",
2010                                        hash=>$hash,
2011                                        snapshot_format=>$_
2012                                )
2013                        }, $known_snapshot_formats{$_}{'display'})
2014                , @snapshot_fmts) . ")";
2015        } elsif ($num_fmts == 1) {
2016                # A single "snapshot" link whose tooltip bears the format name.
2017                # i.e. "_snapshot_"
2018                my ($fmt) = @snapshot_fmts;
2019                return
2020                        $cgi->a({
2021                                -href => href(
2022                                        action=>"snapshot",
2023                                        hash=>$hash,
2024                                        snapshot_format=>$fmt
2025                                ),
2026                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
2027                        }, "snapshot");
2028        } else { # $num_fmts == 0
2029                return undef;
2030        }
2031}
2032
2033## ......................................................................
2034## functions returning values to be passed, perhaps after some
2035## transformation, to other functions; e.g. returning arguments to href()
2036
2037# returns hash to be passed to href to generate gitweb URL
2038# in -title key it returns description of link
2039sub get_feed_info {
2040        my $format = shift || 'Atom';
2041        my %res = (action => lc($format));
2042
2043        # feed links are possible only for project views
2044        return unless (defined $project);
2045        # some views should link to OPML, or to generic project feed,
2046        # or don't have specific feed yet (so they should use generic)
2047        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);
2048
2049        my $branch;
2050        # branches refs uses 'refs/heads/' prefix (fullname) to differentiate
2051        # from tag links; this also makes possible to detect branch links
2052        if ((defined $hash_base && $hash_base =~ m!^refs/heads/(.*)$!) ||
2053            (defined $hash      && $hash      =~ m!^refs/heads/(.*)$!)) {
2054                $branch = $1;
2055        }
2056        # find log type for feed description (title)
2057        my $type = 'log';
2058        if (defined $file_name) {
2059                $type  = "history of $file_name";
2060                $type .= "/" if ($action eq 'tree');
2061                $type .= " on '$branch'" if (defined $branch);
2062        } else {
2063                $type = "log of $branch" if (defined $branch);
2064        }
2065
2066        $res{-title} = $type;
2067        $res{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
2068        $res{'file_name'} = $file_name;
2069
2070        return %res;
2071}
2072
2073## ----------------------------------------------------------------------
2074## git utility subroutines, invoking git commands
2075
2076# returns path to the core git executable and the --git-dir parameter as list
2077sub git_cmd {
2078        $number_of_git_cmds++;
2079        return $GIT, '--git-dir='.$git_dir;
2080}
2081
2082# quote the given arguments for passing them to the shell
2083# quote_command("command", "arg 1", "arg with ' and ! characters")
2084# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
2085# Try to avoid using this function wherever possible.
2086sub quote_command {
2087        return join(' ',
2088                map { my $a = $_; $a =~ s/(['!])/'\\$1'/g; "'$a'" } @_ );
2089}
2090
2091# get HEAD ref of given project as hash
2092sub git_get_head_hash {
2093        return git_get_full_hash(shift, 'HEAD');
2094}
2095
2096sub git_get_full_hash {
2097        return git_get_hash(@_);
2098}
2099
2100sub git_get_short_hash {
2101        return git_get_hash(@_, '--short=7');
2102}
2103
2104sub git_get_hash {
2105        my ($project, $hash, @options) = @_;
2106        my $o_git_dir = $git_dir;
2107        my $retval = undef;
2108        $git_dir = "$projectroot/$project";
2109        if (open my $fd, '-|', git_cmd(), 'rev-parse',
2110            '--verify', '-q', @options, $hash) {
2111                $retval = <$fd>;
2112                chomp $retval if defined $retval;
2113                close $fd;
2114        }
2115        if (defined $o_git_dir) {
2116                $git_dir = $o_git_dir;
2117        }
2118        return $retval;
2119}
2120
2121# get type of given object
2122sub git_get_type {
2123        my $hash = shift;
2124
2125        open my $fd, "-|", git_cmd(), "cat-file", '-t', $hash or return;
2126        my $type = <$fd>;
2127        close $fd or return;
2128        chomp $type;
2129        return $type;
2130}
2131
2132# repository configuration
2133our $config_file = '';
2134our %config;
2135
2136# store multiple values for single key as anonymous array reference
2137# single values stored directly in the hash, not as [ <value> ]
2138sub hash_set_multi {
2139        my ($hash, $key, $value) = @_;
2140
2141        if (!exists $hash->{$key}) {
2142                $hash->{$key} = $value;
2143        } elsif (!ref $hash->{$key}) {
2144                $hash->{$key} = [ $hash->{$key}, $value ];
2145        } else {
2146                push @{$hash->{$key}}, $value;
2147        }
2148}
2149
2150# return hash of git project configuration
2151# optionally limited to some section, e.g. 'gitweb'
2152sub git_parse_project_config {
2153        my $section_regexp = shift;
2154        my %config;
2155
2156        local $/ = "\0";
2157
2158        open my $fh, "-|", git_cmd(), "config", '-z', '-l',
2159                or return;
2160
2161        while (my $keyval = <$fh>) {
2162                chomp $keyval;
2163                my ($key, $value) = split(/\n/, $keyval, 2);
2164
2165                hash_set_multi(\%config, $key, $value)
2166                        if (!defined $section_regexp || $key =~ /^(?:$section_regexp)\./o);
2167        }
2168        close $fh;
2169
2170        return %config;
2171}
2172
2173# convert config value to boolean: 'true' or 'false'
2174# no value, number > 0, 'true' and 'yes' values are true
2175# rest of values are treated as false (never as error)
2176sub config_to_bool {
2177        my $val = shift;
2178
2179        return 1 if !defined $val;             # section.key
2180
2181        # strip leading and trailing whitespace
2182        $val =~ s/^\s+//;
2183        $val =~ s/\s+$//;
2184
2185        return (($val =~ /^\d+$/ && $val) ||   # section.key = 1
2186                ($val =~ /^(?:true|yes)$/i));  # section.key = true
2187}
2188
2189# convert config value to simple decimal number
2190# an optional value suffix of 'k', 'm', or 'g' will cause the value
2191# to be multiplied by 1024, 1048576, or 1073741824
2192sub config_to_int {
2193        my $val = shift;
2194
2195        # strip leading and trailing whitespace
2196        $val =~ s/^\s+//;
2197        $val =~ s/\s+$//;
2198
2199        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
2200                $unit = lc($unit);
2201                # unknown unit is treated as 1
2202                return $num * ($unit eq 'g' ? 1073741824 :
2203                               $unit eq 'm' ?    1048576 :
2204                               $unit eq 'k' ?       1024 : 1);
2205        }
2206        return $val;
2207}
2208
2209# convert config value to array reference, if needed
2210sub config_to_multi {
2211        my $val = shift;
2212
2213        return ref($val) ? $val : (defined($val) ? [ $val ] : []);
2214}
2215
2216sub git_get_project_config {
2217        my ($key, $type) = @_;
2218
2219        # do we have project
2220        return unless (defined $project && defined $git_dir);
2221
2222        # key sanity check
2223        return unless ($key);
2224        $key =~ s/^gitweb\.//;
2225        return if ($key =~ m/\W/);
2226
2227        # type sanity check
2228        if (defined $type) {
2229                $type =~ s/^--//;
2230                $type = undef
2231                        unless ($type eq 'bool' || $type eq 'int');
2232        }
2233
2234        # get config
2235        if (!defined $config_file ||
2236            $config_file ne "$git_dir/config") {
2237                %config = git_parse_project_config('gitweb');
2238                $config_file = "$git_dir/config";
2239        }
2240
2241        # check if config variable (key) exists
2242        return unless exists $config{"gitweb.$key"};
2243
2244        # ensure given type
2245        if (!defined $type) {
2246                return $config{"gitweb.$key"};
2247        } elsif ($type eq 'bool') {
2248                # backward compatibility: 'git config --bool' returns true/false
2249                return config_to_bool($config{"gitweb.$key"}) ? 'true' : 'false';
2250        } elsif ($type eq 'int') {
2251                return config_to_int($config{"gitweb.$key"});
2252        }
2253        return $config{"gitweb.$key"};
2254}
2255
2256# get hash of given path at given ref
2257sub git_get_hash_by_path {
2258        my $base = shift;
2259        my $path = shift || return undef;
2260        my $type = shift;
2261
2262        $path =~ s,/+$,,;
2263
2264        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
2265                or die_error(500, "Open git-ls-tree failed");
2266        my $line = <$fd>;
2267        close $fd or return undef;
2268
2269        if (!defined $line) {
2270                # there is no tree or hash given by $path at $base
2271                return undef;
2272        }
2273
2274        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
2275        $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/;
2276        if (defined $type && $type ne $2) {
2277                # type doesn't match
2278                return undef;
2279        }
2280        return $3;
2281}
2282
2283# get path of entry with given hash at given tree-ish (ref)
2284# used to get 'from' filename for combined diff (merge commit) for renames
2285sub git_get_path_by_hash {
2286        my $base = shift || return;
2287        my $hash = shift || return;
2288
2289        local $/ = "\0";
2290
2291        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
2292                or return undef;
2293        while (my $line = <$fd>) {
2294                chomp $line;
2295
2296                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
2297                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
2298                if ($line =~ m/(?:[0-9]+) (?:.+) $hash\t(.+)$/) {
2299                        close $fd;
2300                        return $1;
2301                }
2302        }
2303        close $fd;
2304        return undef;
2305}
2306
2307## ......................................................................
2308## git utility functions, directly accessing git repository
2309
2310sub git_get_project_description {
2311        my $path = shift;
2312
2313        $git_dir = "$projectroot/$path";
2314        open my $fd, '<', "$git_dir/description"
2315                or return git_get_project_config('description');
2316        my $descr = <$fd>;
2317        close $fd;
2318        if (defined $descr) {
2319                chomp $descr;
2320        }
2321        return $descr;
2322}
2323
2324sub git_get_project_ctags {
2325        my $path = shift;
2326        my $ctags = {};
2327
2328        $git_dir = "$projectroot/$path";
2329        opendir my $dh, "$git_dir/ctags"
2330                or return $ctags;
2331        foreach (grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh)) {
2332                open my $ct, '<', $_ or next;
2333                my $val = <$ct>;
2334                chomp $val;
2335                close $ct;
2336                my $ctag = $_; $ctag =~ s#.*/##;
2337                $ctags->{$ctag} = $val;
2338        }
2339        closedir $dh;
2340        $ctags;
2341}
2342
2343sub git_populate_project_tagcloud {
2344        my $ctags = shift;
2345
2346        # First, merge different-cased tags; tags vote on casing
2347        my %ctags_lc;
2348        foreach (keys %$ctags) {
2349                $ctags_lc{lc $_}->{count} += $ctags->{$_};
2350                if (not $ctags_lc{lc $_}->{topcount}
2351                    or $ctags_lc{lc $_}->{topcount} < $ctags->{$_}) {
2352                        $ctags_lc{lc $_}->{topcount} = $ctags->{$_};
2353                        $ctags_lc{lc $_}->{topname} = $_;
2354                }
2355        }
2356
2357        my $cloud;
2358        if (eval { require HTML::TagCloud; 1; }) {
2359                $cloud = HTML::TagCloud->new;
2360                foreach (sort keys %ctags_lc) {
2361                        # Pad the title with spaces so that the cloud looks
2362                        # less crammed.
2363                        my $title = $ctags_lc{$_}->{topname};
2364                        $title =~ s/ /&nbsp;/g;
2365                        $title =~ s/^/&nbsp;/g;
2366                        $title =~ s/$/&nbsp;/g;
2367                        $cloud->add($title, $home_link."?by_tag=".$_, $ctags_lc{$_}->{count});
2368                }
2369        } else {
2370                $cloud = \%ctags_lc;
2371        }
2372        $cloud;
2373}
2374
2375sub git_show_project_tagcloud {
2376        my ($cloud, $count) = @_;
2377        print STDERR ref($cloud)."..\n";
2378        if (ref $cloud eq 'HTML::TagCloud') {
2379                return $cloud->html_and_css($count);
2380        } else {
2381                my @tags = sort { $cloud->{$a}->{count} <=> $cloud->{$b}->{count} } keys %$cloud;
2382                return '<p align="center">' . join (', ', map {
2383                        "<a href=\"$home_link?by_tag=$_\">$cloud->{$_}->{topname}</a>"
2384                } splice(@tags, 0, $count)) . '</p>';
2385        }
2386}
2387
2388sub git_get_project_url_list {
2389        my $path = shift;
2390
2391        $git_dir = "$projectroot/$path";
2392        open my $fd, '<', "$git_dir/cloneurl"
2393                or return wantarray ?
2394                @{ config_to_multi(git_get_project_config('url')) } :
2395                   config_to_multi(git_get_project_config('url'));
2396        my @git_project_url_list = map { chomp; $_ } <$fd>;
2397        close $fd;
2398
2399        return wantarray ? @git_project_url_list : \@git_project_url_list;
2400}
2401
2402sub git_get_projects_list {
2403        my ($filter) = @_;
2404        my @list;
2405
2406        $filter ||= '';
2407        $filter =~ s/\.git$//;
2408
2409        my $check_forks = gitweb_check_feature('forks');
2410
2411        if (-d $projects_list) {
2412                # search in directory
2413                my $dir = $projects_list . ($filter ? "/$filter" : '');
2414                # remove the trailing "/"
2415                $dir =~ s!/+$!!;
2416                my $pfxlen = length("$dir");
2417                my $pfxdepth = ($dir =~ tr!/!!);
2418
2419                File::Find::find({
2420                        follow_fast => 1, # follow symbolic links
2421                        follow_skip => 2, # ignore duplicates
2422                        dangling_symlinks => 0, # ignore dangling symlinks, silently
2423                        wanted => sub {
2424                                # skip project-list toplevel, if we get it.
2425                                return if (m!^[/.]$!);
2426                                # only directories can be git repositories
2427                                return unless (-d $_);
2428                                # don't traverse too deep (Find is super slow on os x)
2429                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
2430                                        $File::Find::prune = 1;
2431                                        return;
2432                                }
2433
2434                                my $subdir = substr($File::Find::name, $pfxlen + 1);
2435                                # we check related file in $projectroot
2436                                my $path = ($filter ? "$filter/" : '') . $subdir;
2437                                if (check_export_ok("$projectroot/$path")) {
2438                                        push @list, { path => $path };
2439                                        $File::Find::prune = 1;
2440                                }
2441                        },
2442                }, "$dir");
2443
2444        } elsif (-f $projects_list) {
2445                # read from file(url-encoded):
2446                # 'git%2Fgit.git Linus+Torvalds'
2447                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
2448                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
2449                my %paths;
2450                open my $fd, '<', $projects_list or return;
2451        PROJECT:
2452                while (my $line = <$fd>) {
2453                        chomp $line;
2454                        my ($path, $owner) = split ' ', $line;
2455                        $path = unescape($path);
2456                        $owner = unescape($owner);
2457                        if (!defined $path) {
2458                                next;
2459                        }
2460                        if ($filter ne '') {
2461                                # looking for forks;
2462                                my $pfx = substr($path, 0, length($filter));
2463                                if ($pfx ne $filter) {
2464                                        next PROJECT;
2465                                }
2466                                my $sfx = substr($path, length($filter));
2467                                if ($sfx !~ /^\/.*\.git$/) {
2468                                        next PROJECT;
2469                                }
2470                        } elsif ($check_forks) {
2471                        PATH:
2472                                foreach my $filter (keys %paths) {
2473                                        # looking for forks;
2474                                        my $pfx = substr($path, 0, length($filter));
2475                                        if ($pfx ne $filter) {
2476                                                next PATH;
2477                                        }
2478                                        my $sfx = substr($path, length($filter));
2479                                        if ($sfx !~ /^\/.*\.git$/) {
2480                                                next PATH;
2481                                        }
2482                                        # is a fork, don't include it in
2483                                        # the list
2484                                        next PROJECT;
2485                                }
2486                        }
2487                        if (check_export_ok("$projectroot/$path")) {
2488                                my $pr = {
2489                                        path => $path,
2490                                        owner => to_utf8($owner),
2491                                };
2492                                push @list, $pr;
2493                                (my $forks_path = $path) =~ s/\.git$//;
2494                                $paths{$forks_path}++;
2495                        }
2496                }
2497                close $fd;
2498        }
2499        return @list;
2500}
2501
2502our $gitweb_project_owner = undef;
2503sub git_get_project_list_from_file {
2504
2505        return if (defined $gitweb_project_owner);
2506
2507        $gitweb_project_owner = {};
2508        # read from file (url-encoded):
2509        # 'git%2Fgit.git Linus+Torvalds'
2510        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
2511        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
2512        if (-f $projects_list) {
2513                open(my $fd, '<', $projects_list);
2514                while (my $line = <$fd>) {
2515                        chomp $line;
2516                        my ($pr, $ow) = split ' ', $line;
2517                        $pr = unescape($pr);
2518                        $ow = unescape($ow);
2519                        $gitweb_project_owner->{$pr} = to_utf8($ow);
2520                }
2521                close $fd;
2522        }
2523}
2524
2525sub git_get_project_owner {
2526        my $project = shift;
2527        my $owner;
2528
2529        return undef unless $project;
2530        $git_dir = "$projectroot/$project";
2531
2532        if (!defined $gitweb_project_owner) {
2533                git_get_project_list_from_file();
2534        }
2535
2536        if (exists $gitweb_project_owner->{$project}) {
2537                $owner = $gitweb_project_owner->{$project};
2538        }
2539        if (!defined $owner){
2540                $owner = git_get_project_config('owner');
2541        }
2542        if (!defined $owner) {
2543                $owner = get_file_owner("$git_dir");
2544        }
2545
2546        return $owner;
2547}
2548
2549sub git_get_last_activity {
2550        my ($path) = @_;
2551        my $fd;
2552
2553        $git_dir = "$projectroot/$path";
2554        open($fd, "-|", git_cmd(), 'for-each-ref',
2555             '--format=%(committer)',
2556             '--sort=-committerdate',
2557             '--count=1',
2558             'refs/heads') or return;
2559        my $most_recent = <$fd>;
2560        close $fd or return;
2561        if (defined $most_recent &&
2562            $most_recent =~ / (\d+) [-+][01]\d\d\d$/) {
2563                my $timestamp = $1;
2564                my $age = time - $timestamp;
2565                return ($age, age_string($age));
2566        }
2567        return (undef, undef);
2568}
2569
2570sub git_get_references {
2571        my $type = shift || "";
2572        my %refs;
2573        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
2574        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
2575        open my $fd, "-|", git_cmd(), "show-ref", "--dereference",
2576                ($type ? ("--", "refs/$type") : ()) # use -- <pattern> if $type
2577                or return;
2578
2579        while (my $line = <$fd>) {
2580                chomp $line;
2581                if ($line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!) {
2582                        if (defined $refs{$1}) {
2583                                push @{$refs{$1}}, $2;
2584                        } else {
2585                                $refs{$1} = [ $2 ];
2586                        }
2587                }
2588        }
2589        close $fd or return;
2590        return \%refs;
2591}
2592
2593sub git_get_rev_name_tags {
2594        my $hash = shift || return undef;
2595
2596        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
2597                or return;
2598        my $name_rev = <$fd>;
2599        close $fd;
2600
2601        if ($name_rev =~ m|^$hash tags/(.*)$|) {
2602                return $1;
2603        } else {
2604                # catches also '$hash undefined' output
2605                return undef;
2606        }
2607}
2608
2609## ----------------------------------------------------------------------
2610## parse to hash functions
2611
2612sub parse_date {
2613        my $epoch = shift;
2614        my $tz = shift || "-0000";
2615
2616        my %date;
2617        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
2618        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
2619        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
2620        $date{'hour'} = $hour;
2621        $date{'minute'} = $min;
2622        $date{'mday'} = $mday;
2623        $date{'day'} = $days[$wday];
2624        $date{'month'} = $months[$mon];
2625        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
2626                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
2627        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
2628                             $mday, $months[$mon], $hour ,$min;
2629        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
2630                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;
2631
2632        $tz =~ m/^([+\-][0-9][0-9])([0-9][0-9])$/;
2633        my $local = $epoch + ((int $1 + ($2/60)) * 3600);
2634        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
2635        $date{'hour_local'} = $hour;
2636        $date{'minute_local'} = $min;
2637        $date{'tz_local'} = $tz;
2638        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
2639                                  1900+$year, $mon+1, $mday,
2640                                  $hour, $min, $sec, $tz);
2641        return %date;
2642}
2643
2644sub parse_tag {
2645        my $tag_id = shift;
2646        my %tag;
2647        my @comment;
2648
2649        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
2650        $tag{'id'} = $tag_id;
2651        while (my $line = <$fd>) {
2652                chomp $line;
2653                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
2654                        $tag{'object'} = $1;
2655                } elsif ($line =~ m/^type (.+)$/) {
2656                        $tag{'type'} = $1;
2657                } elsif ($line =~ m/^tag (.+)$/) {
2658                        $tag{'name'} = $1;
2659                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
2660                        $tag{'author'} = $1;
2661                        $tag{'author_epoch'} = $2;
2662                        $tag{'author_tz'} = $3;
2663                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
2664                                $tag{'author_name'}  = $1;
2665                                $tag{'author_email'} = $2;
2666                        } else {
2667                                $tag{'author_name'} = $tag{'author'};
2668                        }
2669                } elsif ($line =~ m/--BEGIN/) {
2670                        push @comment, $line;
2671                        last;
2672                } elsif ($line eq "") {
2673                        last;
2674                }
2675        }
2676        push @comment, <$fd>;
2677        $tag{'comment'} = \@comment;
2678        close $fd or return;
2679        if (!defined $tag{'name'}) {
2680                return
2681        };
2682        return %tag
2683}
2684
2685sub parse_commit_text {
2686        my ($commit_text, $withparents) = @_;
2687        my @commit_lines = split '\n', $commit_text;
2688        my %co;
2689
2690        pop @commit_lines; # Remove '\0'
2691
2692        if (! @commit_lines) {
2693                return;
2694        }
2695
2696        my $header = shift @commit_lines;
2697        if ($header !~ m/^[0-9a-fA-F]{40}/) {
2698                return;
2699        }
2700        ($co{'id'}, my @parents) = split ' ', $header;
2701        while (my $line = shift @commit_lines) {
2702                last if $line eq "\n";
2703                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
2704                        $co{'tree'} = $1;
2705                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
2706                        push @parents, $1;
2707                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
2708                        $co{'author'} = to_utf8($1);
2709                        $co{'author_epoch'} = $2;
2710                        $co{'author_tz'} = $3;
2711                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
2712                                $co{'author_name'}  = $1;
2713                                $co{'author_email'} = $2;
2714                        } else {
2715                                $co{'author_name'} = $co{'author'};
2716                        }
2717                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
2718                        $co{'committer'} = to_utf8($1);
2719                        $co{'committer_epoch'} = $2;
2720                        $co{'committer_tz'} = $3;
2721                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
2722                                $co{'committer_name'}  = $1;
2723                                $co{'committer_email'} = $2;
2724                        } else {
2725                                $co{'committer_name'} = $co{'committer'};
2726                        }
2727                }
2728        }
2729        if (!defined $co{'tree'}) {
2730                return;
2731        };
2732        $co{'parents'} = \@parents;
2733        $co{'parent'} = $parents[0];
2734
2735        foreach my $title (@commit_lines) {
2736                $title =~ s/^    //;
2737                if ($title ne "") {
2738                        $co{'title'} = chop_str($title, 80, 5);
2739                        # remove leading stuff of merges to make the interesting part visible
2740                        if (length($title) > 50) {
2741                                $title =~ s/^Automatic //;
2742                                $title =~ s/^merge (of|with) /Merge ... /i;
2743                                if (length($title) > 50) {
2744                                        $title =~ s/(http|rsync):\/\///;
2745                                }
2746                                if (length($title) > 50) {
2747                                        $title =~ s/(master|www|rsync)\.//;
2748                                }
2749                                if (length($title) > 50) {
2750                                        $title =~ s/kernel.org:?//;
2751                                }
2752                                if (length($title) > 50) {
2753                                        $title =~ s/\/pub\/scm//;
2754                                }
2755                        }
2756                        $co{'title_short'} = chop_str($title, 50, 5);
2757                        last;
2758                }
2759        }
2760        if (! defined $co{'title'} || $co{'title'} eq "") {
2761                $co{'title'} = $co{'title_short'} = '(no commit message)';
2762        }
2763        # remove added spaces
2764        foreach my $line (@commit_lines) {
2765                $line =~ s/^    //;
2766        }
2767        $co{'comment'} = \@commit_lines;
2768
2769        my $age = time - $co{'committer_epoch'};
2770        $co{'age'} = $age;
2771        $co{'age_string'} = age_string($age);
2772        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
2773        if ($age > 60*60*24*7*2) {
2774                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
2775                $co{'age_string_age'} = $co{'age_string'};
2776        } else {
2777                $co{'age_string_date'} = $co{'age_string'};
2778                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
2779        }
2780        return %co;
2781}
2782
2783sub parse_commit {
2784        my ($commit_id) = @_;
2785        my %co;
2786
2787        local $/ = "\0";
2788
2789        open my $fd, "-|", git_cmd(), "rev-list",
2790                "--parents",
2791                "--header",
2792                "--max-count=1",
2793                $commit_id,
2794                "--",
2795                or die_error(500, "Open git-rev-list failed");
2796        %co = parse_commit_text(<$fd>, 1);
2797        close $fd;
2798
2799        return %co;
2800}
2801
2802sub parse_commits {
2803        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
2804        my @cos;
2805
2806        $maxcount ||= 1;
2807        $skip ||= 0;
2808
2809        local $/ = "\0";
2810
2811        open my $fd, "-|", git_cmd(), "rev-list",
2812                "--header",
2813                @args,
2814                ("--max-count=" . $maxcount),
2815                ("--skip=" . $skip),
2816                @extra_options,
2817                $commit_id,
2818                "--",
2819                ($filename ? ($filename) : ())
2820                or die_error(500, "Open git-rev-list failed");
2821        while (my $line = <$fd>) {
2822                my %co = parse_commit_text($line);
2823                push @cos, \%co;
2824        }
2825        close $fd;
2826
2827        return wantarray ? @cos : \@cos;
2828}
2829
2830# parse line of git-diff-tree "raw" output
2831sub parse_difftree_raw_line {
2832        my $line = shift;
2833        my %res;
2834
2835        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
2836        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
2837        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
2838                $res{'from_mode'} = $1;
2839                $res{'to_mode'} = $2;
2840                $res{'from_id'} = $3;
2841                $res{'to_id'} = $4;
2842                $res{'status'} = $5;
2843                $res{'similarity'} = $6;
2844                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
2845                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $7);
2846                } else {
2847                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($7);
2848                }
2849        }
2850        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
2851        # combined diff (for merge commit)
2852        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
2853                $res{'nparents'}  = length($1);
2854                $res{'from_mode'} = [ split(' ', $2) ];
2855                $res{'to_mode'} = pop @{$res{'from_mode'}};
2856                $res{'from_id'} = [ split(' ', $3) ];
2857                $res{'to_id'} = pop @{$res{'from_id'}};
2858                $res{'status'} = [ split('', $4) ];
2859                $res{'to_file'} = unquote($5);
2860        }
2861        # 'c512b523472485aef4fff9e57b229d9d243c967f'
2862        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
2863                $res{'commit'} = $1;
2864        }
2865
2866        return wantarray ? %res : \%res;
2867}
2868
2869# wrapper: return parsed line of git-diff-tree "raw" output
2870# (the argument might be raw line, or parsed info)
2871sub parsed_difftree_line {
2872        my $line_or_ref = shift;
2873
2874        if (ref($line_or_ref) eq "HASH") {
2875                # pre-parsed (or generated by hand)
2876                return $line_or_ref;
2877        } else {
2878                return parse_difftree_raw_line($line_or_ref);
2879        }
2880}
2881
2882# parse line of git-ls-tree output
2883sub parse_ls_tree_line {
2884        my $line = shift;
2885        my %opts = @_;
2886        my %res;
2887
2888        if ($opts{'-l'}) {
2889                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
2890                $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;
2891
2892                $res{'mode'} = $1;
2893                $res{'type'} = $2;
2894                $res{'hash'} = $3;
2895                $res{'size'} = $4;
2896                if ($opts{'-z'}) {
2897                        $res{'name'} = $5;
2898                } else {
2899                        $res{'name'} = unquote($5);
2900                }
2901        } else {
2902                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
2903                $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;
2904
2905                $res{'mode'} = $1;
2906                $res{'type'} = $2;
2907                $res{'hash'} = $3;
2908                if ($opts{'-z'}) {
2909                        $res{'name'} = $4;
2910                } else {
2911                        $res{'name'} = unquote($4);
2912                }
2913        }
2914
2915        return wantarray ? %res : \%res;
2916}
2917
2918# generates _two_ hashes, references to which are passed as 2 and 3 argument
2919sub parse_from_to_diffinfo {
2920        my ($diffinfo, $from, $to, @parents) = @_;
2921
2922        if ($diffinfo->{'nparents'}) {
2923                # combined diff
2924                $from->{'file'} = [];
2925                $from->{'href'} = [];
2926                fill_from_file_info($diffinfo, @parents)
2927                        unless exists $diffinfo->{'from_file'};
2928                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
2929                        $from->{'file'}[$i] =
2930                                defined $diffinfo->{'from_file'}[$i] ?
2931                                        $diffinfo->{'from_file'}[$i] :
2932                                        $diffinfo->{'to_file'};
2933                        if ($diffinfo->{'status'}[$i] ne "A") { # not new (added) file
2934                                $from->{'href'}[$i] = href(action=>"blob",
2935                                                           hash_base=>$parents[$i],
2936                                                           hash=>$diffinfo->{'from_id'}[$i],
2937                                                           file_name=>$from->{'file'}[$i]);
2938                        } else {
2939                                $from->{'href'}[$i] = undef;
2940                        }
2941                }
2942        } else {
2943                # ordinary (not combined) diff
2944                $from->{'file'} = $diffinfo->{'from_file'};
2945                if ($diffinfo->{'status'} ne "A") { # not new (added) file
2946                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
2947                                               hash=>$diffinfo->{'from_id'},
2948                                               file_name=>$from->{'file'});
2949                } else {
2950                        delete $from->{'href'};
2951                }
2952        }
2953
2954        $to->{'file'} = $diffinfo->{'to_file'};
2955        if (!is_deleted($diffinfo)) { # file exists in result
2956                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
2957                                     hash=>$diffinfo->{'to_id'},
2958                                     file_name=>$to->{'file'});
2959        } else {
2960                delete $to->{'href'};
2961        }
2962}
2963
2964## ......................................................................
2965## parse to array of hashes functions
2966
2967sub git_get_heads_list {
2968        my $limit = shift;
2969        my @headslist;
2970
2971        open my $fd, '-|', git_cmd(), 'for-each-ref',
2972                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
2973                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
2974                'refs/heads'
2975                or return;
2976        while (my $line = <$fd>) {
2977                my %ref_item;
2978
2979                chomp $line;
2980                my ($refinfo, $committerinfo) = split(/\0/, $line);
2981                my ($hash, $name, $title) = split(' ', $refinfo, 3);
2982                my ($committer, $epoch, $tz) =
2983                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
2984                $ref_item{'fullname'}  = $name;
2985                $name =~ s!^refs/heads/!!;
2986
2987                $ref_item{'name'}  = $name;
2988                $ref_item{'id'}    = $hash;
2989                $ref_item{'title'} = $title || '(no commit message)';
2990                $ref_item{'epoch'} = $epoch;
2991                if ($epoch) {
2992                        $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
2993                } else {
2994                        $ref_item{'age'} = "unknown";
2995                }
2996
2997                push @headslist, \%ref_item;
2998        }
2999        close $fd;
3000
3001        return wantarray ? @headslist : \@headslist;
3002}
3003
3004sub git_get_tags_list {
3005        my $limit = shift;
3006        my @tagslist;
3007
3008        open my $fd, '-|', git_cmd(), 'for-each-ref',
3009                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
3010                '--format=%(objectname) %(objecttype) %(refname) '.
3011                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
3012                'refs/tags'
3013                or return;
3014        while (my $line = <$fd>) {
3015                my %ref_item;
3016
3017                chomp $line;
3018                my ($refinfo, $creatorinfo) = split(/\0/, $line);
3019                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
3020                my ($creator, $epoch, $tz) =
3021                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
3022                $ref_item{'fullname'} = $name;
3023                $name =~ s!^refs/tags/!!;
3024
3025                $ref_item{'type'} = $type;
3026                $ref_item{'id'} = $id;
3027                $ref_item{'name'} = $name;
3028                if ($type eq "tag") {
3029                        $ref_item{'subject'} = $title;
3030                        $ref_item{'reftype'} = $reftype;
3031                        $ref_item{'refid'}   = $refid;
3032                } else {
3033                        $ref_item{'reftype'} = $type;
3034                        $ref_item{'refid'}   = $id;
3035                }
3036
3037                if ($type eq "tag" || $type eq "commit") {
3038                        $ref_item{'epoch'} = $epoch;
3039                        if ($epoch) {
3040                                $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
3041                        } else {
3042                                $ref_item{'age'} = "unknown";
3043                        }
3044                }
3045
3046                push @tagslist, \%ref_item;
3047        }
3048        close $fd;
3049
3050        return wantarray ? @tagslist : \@tagslist;
3051}
3052
3053## ----------------------------------------------------------------------
3054## filesystem-related functions
3055
3056sub get_file_owner {
3057        my $path = shift;
3058
3059        my ($dev, $ino, $mode, $nlink, $st_uid, $st_gid, $rdev, $size) = stat($path);
3060        my ($name, $passwd, $uid, $gid, $quota, $comment, $gcos, $dir, $shell) = getpwuid($st_uid);
3061        if (!defined $gcos) {
3062                return undef;
3063        }
3064        my $owner = $gcos;
3065        $owner =~ s/[,;].*$//;
3066        return to_utf8($owner);
3067}
3068
3069# assume that file exists
3070sub insert_file {
3071        my $filename = shift;
3072
3073        open my $fd, '<', $filename;
3074        print map { to_utf8($_) } <$fd>;
3075        close $fd;
3076}
3077
3078## ......................................................................
3079## mimetype related functions
3080
3081sub mimetype_guess_file {
3082        my $filename = shift;
3083        my $mimemap = shift;
3084        -r $mimemap or return undef;
3085
3086        my %mimemap;
3087        open(my $mh, '<', $mimemap) or return undef;
3088        while (<$mh>) {
3089                next if m/^#/; # skip comments
3090                my ($mimetype, $exts) = split(/\t+/);
3091                if (defined $exts) {
3092                        my @exts = split(/\s+/, $exts);
3093                        foreach my $ext (@exts) {
3094                                $mimemap{$ext} = $mimetype;
3095                        }
3096                }
3097        }
3098        close($mh);
3099
3100        $filename =~ /\.([^.]*)$/;
3101        return $mimemap{$1};
3102}
3103
3104sub mimetype_guess {
3105        my $filename = shift;
3106        my $mime;
3107        $filename =~ /\./ or return undef;
3108
3109        if ($mimetypes_file) {
3110                my $file = $mimetypes_file;
3111                if ($file !~ m!^/!) { # if it is relative path
3112                        # it is relative to project
3113                        $file = "$projectroot/$project/$file";
3114                }
3115                $mime = mimetype_guess_file($filename, $file);
3116        }
3117        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');
3118        return $mime;
3119}
3120
3121sub blob_mimetype {
3122        my $fd = shift;
3123        my $filename = shift;
3124
3125        if ($filename) {
3126                my $mime = mimetype_guess($filename);
3127                $mime and return $mime;
3128        }
3129
3130        # just in case
3131        return $default_blob_plain_mimetype unless $fd;
3132
3133        if (-T $fd) {
3134                return 'text/plain';
3135        } elsif (! $filename) {
3136                return 'application/octet-stream';
3137        } elsif ($filename =~ m/\.png$/i) {
3138                return 'image/png';
3139        } elsif ($filename =~ m/\.gif$/i) {
3140                return 'image/gif';
3141        } elsif ($filename =~ m/\.jpe?g$/i) {
3142                return 'image/jpeg';
3143        } else {
3144                return 'application/octet-stream';
3145        }
3146}
3147
3148sub blob_contenttype {
3149        my ($fd, $file_name, $type) = @_;
3150
3151        $type ||= blob_mimetype($fd, $file_name);
3152        if ($type eq 'text/plain' && defined $default_text_plain_charset) {
3153                $type .= "; charset=$default_text_plain_charset";
3154        }
3155
3156        return $type;
3157}
3158
3159## ======================================================================
3160## functions printing HTML: header, footer, error page
3161
3162sub git_header_html {
3163        my $status = shift || "200 OK";
3164        my $expires = shift;
3165
3166        my $title = "$site_name";
3167        if (defined $project) {
3168                $title .= " - " . to_utf8($project);
3169                if (defined $action) {
3170                        $title .= "/$action";
3171                        if (defined $file_name) {
3172                                $title .= " - " . esc_path($file_name);
3173                                if ($action eq "tree" && $file_name !~ m|/$|) {
3174                                        $title .= "/";
3175                                }
3176                        }
3177                }
3178        }
3179        my $content_type;
3180        # require explicit support from the UA if we are to send the page as
3181        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
3182        # we have to do this because MSIE sometimes globs '*/*', pretending to
3183        # support xhtml+xml but choking when it gets what it asked for.
3184        if (defined $cgi->http('HTTP_ACCEPT') &&
3185            $cgi->http('HTTP_ACCEPT') =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
3186            $cgi->Accept('application/xhtml+xml') != 0) {
3187                $content_type = 'application/xhtml+xml';
3188        } else {
3189                $content_type = 'text/html';
3190        }
3191        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
3192                           -status=> $status, -expires => $expires);
3193        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
3194        print <<EOF;
3195<?xml version="1.0" encoding="utf-8"?>
3196<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
3197<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
3198<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
3199<!-- git core binaries version $git_version -->
3200<head>
3201<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
3202<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
3203<meta name="robots" content="index, nofollow"/>
3204<title>$title</title>
3205EOF
3206        # the stylesheet, favicon etc urls won't work correctly with path_info
3207        # unless we set the appropriate base URL
3208        if ($ENV{'PATH_INFO'}) {
3209                print "<base href=\"".esc_url($base_url)."\" />\n";
3210        }
3211        # print out each stylesheet that exist, providing backwards capability
3212        # for those people who defined $stylesheet in a config file
3213        if (defined $stylesheet) {
3214                print '<link rel="stylesheet" type="text/css" href="'.$stylesheet.'"/>'."\n";
3215        } else {
3216                foreach my $stylesheet (@stylesheets) {
3217                        next unless $stylesheet;
3218                        print '<link rel="stylesheet" type="text/css" href="'.$stylesheet.'"/>'."\n";
3219                }
3220        }
3221        if (defined $project) {
3222                my %href_params = get_feed_info();
3223                if (!exists $href_params{'-title'}) {
3224                        $href_params{'-title'} = 'log';
3225                }
3226
3227                foreach my $format qw(RSS Atom) {
3228                        my $type = lc($format);
3229                        my %link_attr = (
3230                                '-rel' => 'alternate',
3231                                '-title' => "$project - $href_params{'-title'} - $format feed",
3232                                '-type' => "application/$type+xml"
3233                        );
3234
3235                        $href_params{'action'} = $type;
3236                        $link_attr{'-href'} = href(%href_params);
3237                        print "<link ".
3238                              "rel=\"$link_attr{'-rel'}\" ".
3239                              "title=\"$link_attr{'-title'}\" ".
3240                              "href=\"$link_attr{'-href'}\" ".
3241                              "type=\"$link_attr{'-type'}\" ".
3242                              "/>\n";
3243
3244                        $href_params{'extra_options'} = '--no-merges';
3245                        $link_attr{'-href'} = href(%href_params);
3246                        $link_attr{'-title'} .= ' (no merges)';
3247                        print "<link ".
3248                              "rel=\"$link_attr{'-rel'}\" ".
3249                              "title=\"$link_attr{'-title'}\" ".
3250                              "href=\"$link_attr{'-href'}\" ".
3251                              "type=\"$link_attr{'-type'}\" ".
3252                              "/>\n";
3253                }
3254
3255        } else {
3256                printf('<link rel="alternate" title="%s projects list" '.
3257                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
3258                       $site_name, href(project=>undef, action=>"project_index"));
3259                printf('<link rel="alternate" title="%s projects feeds" '.
3260                       'href="%s" type="text/x-opml" />'."\n",
3261                       $site_name, href(project=>undef, action=>"opml"));
3262        }
3263        if (defined $favicon) {
3264                print qq(<link rel="shortcut icon" href="$favicon" type="image/png" />\n);
3265        }
3266
3267        print "</head>\n" .
3268              "<body>\n";
3269
3270        if (defined $site_header && -f $site_header) {
3271                insert_file($site_header);
3272        }
3273
3274        print "<div class=\"page_header\">\n" .
3275              $cgi->a({-href => esc_url($logo_url),
3276                       -title => $logo_label},
3277                      qq(<img src="$logo" width="72" height="27" alt="git" class="logo"/>));
3278        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
3279        if (defined $project) {
3280                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
3281                if (defined $action) {
3282                        print " / $action";
3283                }
3284                print "\n";
3285        }
3286        print "</div>\n";
3287
3288        my $have_search = gitweb_check_feature('search');
3289        if (defined $project && $have_search) {
3290                if (!defined $searchtext) {
3291                        $searchtext = "";
3292                }
3293                my $search_hash;
3294                if (defined $hash_base) {
3295                        $search_hash = $hash_base;
3296                } elsif (defined $hash) {
3297                        $search_hash = $hash;
3298                } else {
3299                        $search_hash = "HEAD";
3300                }
3301                my $action = $my_uri;
3302                my $use_pathinfo = gitweb_check_feature('pathinfo');
3303                if ($use_pathinfo) {
3304                        $action .= "/".esc_url($project);
3305                }
3306                print $cgi->startform(-method => "get", -action => $action) .
3307                      "<div class=\"search\">\n" .
3308                      (!$use_pathinfo &&
3309                      $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
3310                      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
3311                      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
3312                      $cgi->popup_menu(-name => 'st', -default => 'commit',
3313                                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
3314                      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
3315                      " search:\n",
3316                      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
3317                      "<span title=\"Extended regular expression\">" .
3318                      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
3319                                     -checked => $search_use_regexp) .
3320                      "</span>" .
3321                      "</div>" .
3322                      $cgi->end_form() . "\n";
3323        }
3324}
3325
3326sub git_footer_html {
3327        my $feed_class = 'rss_logo';
3328
3329        print "<div class=\"page_footer\">\n";
3330        if (defined $project) {
3331                my $descr = git_get_project_description($project);
3332                if (defined $descr) {
3333                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
3334                }
3335
3336                my %href_params = get_feed_info();
3337                if (!%href_params) {
3338                        $feed_class .= ' generic';
3339                }
3340                $href_params{'-title'} ||= 'log';
3341
3342                foreach my $format qw(RSS Atom) {
3343                        $href_params{'action'} = lc($format);
3344                        print $cgi->a({-href => href(%href_params),
3345                                      -title => "$href_params{'-title'} $format feed",
3346                                      -class => $feed_class}, $format)."\n";
3347                }
3348
3349        } else {
3350                print $cgi->a({-href => href(project=>undef, action=>"opml"),
3351                              -class => $feed_class}, "OPML") . " ";
3352                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
3353                              -class => $feed_class}, "TXT") . "\n";
3354        }
3355        print "</div>\n"; # class="page_footer"
3356
3357        if (defined $t0 && gitweb_check_feature('timed')) {
3358                print "<div id=\"generating_info\">\n";
3359                print 'This page took '.
3360                      '<span id="generating_time" class="time_span">'.
3361                      Time::HiRes::tv_interval($t0, [Time::HiRes::gettimeofday()]).
3362                      ' seconds </span>'.
3363                      ' and '.
3364                      '<span id="generating_cmd">'.
3365                      $number_of_git_cmds.
3366                      '</span> git commands '.
3367                      " to generate.\n";
3368                print "</div>\n"; # class="page_footer"
3369        }
3370
3371        if (defined $site_footer && -f $site_footer) {
3372                insert_file($site_footer);
3373        }
3374
3375        print qq!<script type="text/javascript" src="$javascript"></script>\n!;
3376        if (defined $action &&
3377            $action eq 'blame_incremental') {
3378                print qq!<script type="text/javascript">\n!.
3379                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
3380                      qq!           "!. href() .qq!");\n!.
3381                      qq!</script>\n!;
3382        } elsif (gitweb_check_feature('javascript-actions')) {
3383                print qq!<script type="text/javascript">\n!.
3384                      qq!window.onload = fixLinks;\n!.
3385                      qq!</script>\n!;
3386        }
3387
3388        print "</body>\n" .
3389              "</html>";
3390}
3391
3392# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
3393# Example: die_error(404, 'Hash not found')
3394# By convention, use the following status codes (as defined in RFC 2616):
3395# 400: Invalid or missing CGI parameters, or
3396#      requested object exists but has wrong type.
3397# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
3398#      this server or project.
3399# 404: Requested object/revision/project doesn't exist.
3400# 500: The server isn't configured properly, or
3401#      an internal error occurred (e.g. failed assertions caused by bugs), or
3402#      an unknown error occurred (e.g. the git binary died unexpectedly).
3403# 503: The server is currently unavailable (because it is overloaded,
3404#      or down for maintenance).  Generally, this is a temporary state.
3405sub die_error {
3406        my $status = shift || 500;
3407        my $error = esc_html(shift) || "Internal Server Error";
3408        my $extra = shift;
3409
3410        my %http_responses = (
3411                400 => '400 Bad Request',
3412                403 => '403 Forbidden',
3413                404 => '404 Not Found',
3414                500 => '500 Internal Server Error',
3415                503 => '503 Service Unavailable',
3416        );
3417        git_header_html($http_responses{$status});
3418        print <<EOF;
3419<div class="page_body">
3420<br /><br />
3421$status - $error
3422<br />
3423EOF
3424        if (defined $extra) {
3425                print "<hr />\n" .
3426                      "$extra\n";
3427        }
3428        print "</div>\n";
3429
3430        git_footer_html();
3431        exit;
3432}
3433
3434## ----------------------------------------------------------------------
3435## functions printing or outputting HTML: navigation
3436
3437sub git_print_page_nav {
3438        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
3439        $extra = '' if !defined $extra; # pager or formats
3440
3441        my @navs = qw(summary shortlog log commit commitdiff tree);
3442        if ($suppress) {
3443                @navs = grep { $_ ne $suppress } @navs;
3444        }
3445
3446        my %arg = map { $_ => {action=>$_} } @navs;
3447        if (defined $head) {
3448                for (qw(commit commitdiff)) {
3449                        $arg{$_}{'hash'} = $head;
3450                }
3451                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
3452                        for (qw(shortlog log)) {
3453                                $arg{$_}{'hash'} = $head;
3454                        }
3455                }
3456        }
3457
3458        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
3459        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;
3460
3461        my @actions = gitweb_get_feature('actions');
3462        my %repl = (
3463                '%' => '%',
3464                'n' => $project,         # project name
3465                'f' => $git_dir,         # project path within filesystem
3466                'h' => $treehead || '',  # current hash ('h' parameter)
3467                'b' => $treebase || '',  # hash base ('hb' parameter)
3468        );
3469        while (@actions) {
3470                my ($label, $link, $pos) = splice(@actions,0,3);
3471                # insert
3472                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
3473                # munch munch
3474                $link =~ s/%([%nfhb])/$repl{$1}/g;
3475                $arg{$label}{'_href'} = $link;
3476        }
3477
3478        print "<div class=\"page_nav\">\n" .
3479                (join " | ",
3480                 map { $_ eq $current ?
3481                       $_ : $cgi->a({-href => ($arg{$_}{_href} ? $arg{$_}{_href} : href(%{$arg{$_}}))}, "$_")
3482                 } @navs);
3483        print "<br/>\n$extra<br/>\n" .
3484              "</div>\n";
3485}
3486
3487sub format_paging_nav {
3488        my ($action, $page, $has_next_link) = @_;
3489        my $paging_nav;
3490
3491
3492        if ($page > 0) {
3493                $paging_nav .=
3494                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
3495                        " &sdot; " .
3496                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
3497                                 -accesskey => "p", -title => "Alt-p"}, "prev");
3498        } else {
3499                $paging_nav .= "first &sdot; prev";
3500        }
3501
3502        if ($has_next_link) {
3503                $paging_nav .= " &sdot; " .
3504                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
3505                                 -accesskey => "n", -title => "Alt-n"}, "next");
3506        } else {
3507                $paging_nav .= " &sdot; next";
3508        }
3509
3510        return $paging_nav;
3511}
3512
3513## ......................................................................
3514## functions printing or outputting HTML: div
3515
3516sub git_print_header_div {
3517        my ($action, $title, $hash, $hash_base) = @_;
3518        my %args = ();
3519
3520        $args{'action'} = $action;
3521        $args{'hash'} = $hash if $hash;
3522        $args{'hash_base'} = $hash_base if $hash_base;
3523
3524        print "<div class=\"header\">\n" .
3525              $cgi->a({-href => href(%args), -class => "title"},
3526              $title ? $title : $action) .
3527              "\n</div>\n";
3528}
3529
3530sub print_local_time {
3531        print format_local_time(@_);
3532}
3533
3534sub format_local_time {
3535        my $localtime = '';
3536        my %date = @_;
3537        if ($date{'hour_local'} < 6) {
3538                $localtime .= sprintf(" (<span class=\"atnight\">%02d:%02d</span> %s)",
3539                        $date{'hour_local'}, $date{'minute_local'}, $date{'tz_local'});
3540        } else {
3541                $localtime .= sprintf(" (%02d:%02d %s)",
3542                        $date{'hour_local'}, $date{'minute_local'}, $date{'tz_local'});
3543        }
3544
3545        return $localtime;
3546}
3547
3548# Outputs the author name and date in long form
3549sub git_print_authorship {
3550        my $co = shift;
3551        my %opts = @_;
3552        my $tag = $opts{-tag} || 'div';
3553        my $author = $co->{'author_name'};
3554
3555        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
3556        print "<$tag class=\"author_date\">" .
3557              format_search_author($author, "author", esc_html($author)) .
3558              " [$ad{'rfc2822'}";
3559        print_local_time(%ad) if ($opts{-localtime});
3560        print "]" . git_get_avatar($co->{'author_email'}, -pad_before => 1)
3561                  . "</$tag>\n";
3562}
3563
3564# Outputs table rows containing the full author or committer information,
3565# in the format expected for 'commit' view (& similia).
3566# Parameters are a commit hash reference, followed by the list of people
3567# to output information for. If the list is empty it defalts to both
3568# author and committer.
3569sub git_print_authorship_rows {
3570        my $co = shift;
3571        # too bad we can't use @people = @_ || ('author', 'committer')
3572        my @people = @_;
3573        @people = ('author', 'committer') unless @people;
3574        foreach my $who (@people) {
3575                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});
3576                print "<tr><td>$who</td><td>" .
3577                      format_search_author($co->{"${who}_name"}, $who,
3578                               esc_html($co->{"${who}_name"})) . " " .
3579                      format_search_author($co->{"${who}_email"}, $who,
3580                               esc_html("<" . $co->{"${who}_email"} . ">")) .
3581                      "</td><td rowspan=\"2\">" .
3582                      git_get_avatar($co->{"${who}_email"}, -size => 'double') .
3583                      "</td></tr>\n" .
3584                      "<tr>" .
3585                      "<td></td><td> $wd{'rfc2822'}";
3586                print_local_time(%wd);
3587                print "</td>" .
3588                      "</tr>\n";
3589        }
3590}
3591
3592sub git_print_page_path {
3593        my $name = shift;
3594        my $type = shift;
3595        my $hb = shift;
3596
3597
3598        print "<div class=\"page_path\">";
3599        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
3600                      -title => 'tree root'}, to_utf8("[$project]"));
3601        print " / ";
3602        if (defined $name) {
3603                my @dirname = split '/', $name;
3604                my $basename = pop @dirname;
3605                my $fullname = '';
3606
3607                foreach my $dir (@dirname) {
3608                        $fullname .= ($fullname ? '/' : '') . $dir;
3609                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
3610                                                     hash_base=>$hb),
3611                                      -title => $fullname}, esc_path($dir));
3612                        print " / ";
3613                }
3614                if (defined $type && $type eq 'blob') {
3615                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$file_name,
3616                                                     hash_base=>$hb),
3617                                      -title => $name}, esc_path($basename));
3618                } elsif (defined $type && $type eq 'tree') {
3619                        print $cgi->a({-href => href(action=>"tree", file_name=>$file_name,
3620                                                     hash_base=>$hb),
3621                                      -title => $name}, esc_path($basename));
3622                        print " / ";
3623                } else {
3624                        print esc_path($basename);
3625                }
3626        }
3627        print "<br/></div>\n";
3628}
3629
3630sub git_print_log {
3631        my $log = shift;
3632        my %opts = @_;
3633
3634        if ($opts{'-remove_title'}) {
3635                # remove title, i.e. first line of log
3636                shift @$log;
3637        }
3638        # remove leading empty lines
3639        while (defined $log->[0] && $log->[0] eq "") {
3640                shift @$log;
3641        }
3642
3643        # print log
3644        my $signoff = 0;
3645        my $empty = 0;
3646        foreach my $line (@$log) {
3647                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
3648                        $signoff = 1;
3649                        $empty = 0;
3650                        if (! $opts{'-remove_signoff'}) {
3651                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
3652                                next;
3653                        } else {
3654                                # remove signoff lines
3655                                next;
3656                        }
3657                } else {
3658                        $signoff = 0;
3659                }
3660
3661                # print only one empty line
3662                # do not print empty line after signoff
3663                if ($line eq "") {
3664                        next if ($empty || $signoff);
3665                        $empty = 1;
3666                } else {
3667                        $empty = 0;
3668                }
3669
3670                print format_log_line_html($line) . "<br/>\n";
3671        }
3672
3673        if ($opts{'-final_empty_line'}) {
3674                # end with single empty line
3675                print "<br/>\n" unless $empty;
3676        }
3677}
3678
3679# return link target (what link points to)
3680sub git_get_link_target {
3681        my $hash = shift;
3682        my $link_target;
3683
3684        # read link
3685        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
3686                or return;
3687        {
3688                local $/ = undef;
3689                $link_target = <$fd>;
3690        }
3691        close $fd
3692                or return;
3693
3694        return $link_target;
3695}
3696
3697# given link target, and the directory (basedir) the link is in,
3698# return target of link relative to top directory (top tree);
3699# return undef if it is not possible (including absolute links).
3700sub normalize_link_target {
3701        my ($link_target, $basedir) = @_;
3702
3703        # absolute symlinks (beginning with '/') cannot be normalized
3704        return if (substr($link_target, 0, 1) eq '/');
3705
3706        # normalize link target to path from top (root) tree (dir)
3707        my $path;
3708        if ($basedir) {
3709                $path = $basedir . '/' . $link_target;
3710        } else {
3711                # we are in top (root) tree (dir)
3712                $path = $link_target;
3713        }
3714
3715        # remove //, /./, and /../
3716        my @path_parts;
3717        foreach my $part (split('/', $path)) {
3718                # discard '.' and ''
3719                next if (!$part || $part eq '.');
3720                # handle '..'
3721                if ($part eq '..') {
3722                        if (@path_parts) {
3723                                pop @path_parts;
3724                        } else {
3725                                # link leads outside repository (outside top dir)
3726                                return;
3727                        }
3728                } else {
3729                        push @path_parts, $part;
3730                }
3731        }
3732        $path = join('/', @path_parts);
3733
3734        return $path;
3735}
3736
3737# print tree entry (row of git_tree), but without encompassing <tr> element
3738sub git_print_tree_entry {
3739        my ($t, $basedir, $hash_base, $have_blame) = @_;
3740
3741        my %base_key = ();
3742        $base_key{'hash_base'} = $hash_base if defined $hash_base;
3743
3744        # The format of a table row is: mode list link.  Where mode is
3745        # the mode of the entry, list is the name of the entry, an href,
3746        # and link is the action links of the entry.
3747
3748        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
3749        if (exists $t->{'size'}) {
3750                print "<td class=\"size\">$t->{'size'}</td>\n";
3751        }
3752        if ($t->{'type'} eq "blob") {
3753                print "<td class=\"list\">" .
3754                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
3755                                               file_name=>"$basedir$t->{'name'}", %base_key),
3756                                -class => "list"}, esc_path($t->{'name'}));
3757                if (S_ISLNK(oct $t->{'mode'})) {
3758                        my $link_target = git_get_link_target($t->{'hash'});
3759                        if ($link_target) {
3760                                my $norm_target = normalize_link_target($link_target, $basedir);
3761                                if (defined $norm_target) {
3762                                        print " -> " .
3763                                              $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
3764                                                                     file_name=>$norm_target),
3765                                                       -title => $norm_target}, esc_path($link_target));
3766                                } else {
3767                                        print " -> " . esc_path($link_target);
3768                                }
3769                        }
3770                }
3771                print "</td>\n";
3772                print "<td class=\"link\">";
3773                print $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
3774                                             file_name=>"$basedir$t->{'name'}", %base_key)},
3775                              "blob");
3776                if ($have_blame) {
3777                        print " | " .
3778                              $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
3779                                                     file_name=>"$basedir$t->{'name'}", %base_key)},
3780                                      "blame");
3781                }
3782                if (defined $hash_base) {
3783                        print " | " .
3784                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
3785                                                     hash=>$t->{'hash'}, file_name=>"$basedir$t->{'name'}")},
3786                                      "history");
3787                }
3788                print " | " .
3789                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
3790                                               file_name=>"$basedir$t->{'name'}")},
3791                                "raw");
3792                print "</td>\n";
3793
3794        } elsif ($t->{'type'} eq "tree") {
3795                print "<td class=\"list\">";
3796                print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
3797                                             file_name=>"$basedir$t->{'name'}",
3798                                             %base_key)},
3799                              esc_path($t->{'name'}));
3800                print "</td>\n";
3801                print "<td class=\"link\">";
3802                print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
3803                                             file_name=>"$basedir$t->{'name'}",
3804                                             %base_key)},
3805                              "tree");
3806                if (defined $hash_base) {
3807                        print " | " .
3808                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
3809                                                     file_name=>"$basedir$t->{'name'}")},
3810                                      "history");
3811                }
3812                print "</td>\n";
3813        } else {
3814                # unknown object: we can only present history for it
3815                # (this includes 'commit' object, i.e. submodule support)
3816                print "<td class=\"list\">" .
3817                      esc_path($t->{'name'}) .
3818                      "</td>\n";
3819                print "<td class=\"link\">";
3820                if (defined $hash_base) {
3821                        print $cgi->a({-href => href(action=>"history",
3822                                                     hash_base=>$hash_base,
3823                                                     file_name=>"$basedir$t->{'name'}")},
3824                                      "history");
3825                }
3826                print "</td>\n";
3827        }
3828}
3829
3830## ......................................................................
3831## functions printing large fragments of HTML
3832
3833# get pre-image filenames for merge (combined) diff
3834sub fill_from_file_info {
3835        my ($diff, @parents) = @_;
3836
3837        $diff->{'from_file'} = [ ];
3838        $diff->{'from_file'}[$diff->{'nparents'} - 1] = undef;
3839        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
3840                if ($diff->{'status'}[$i] eq 'R' ||
3841                    $diff->{'status'}[$i] eq 'C') {
3842                        $diff->{'from_file'}[$i] =
3843                                git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
3844                }
3845        }
3846
3847        return $diff;
3848}
3849
3850# is current raw difftree line of file deletion
3851sub is_deleted {
3852        my $diffinfo = shift;
3853
3854        return $diffinfo->{'to_id'} eq ('0' x 40);
3855}
3856
3857# does patch correspond to [previous] difftree raw line
3858# $diffinfo  - hashref of parsed raw diff format
3859# $patchinfo - hashref of parsed patch diff format
3860#              (the same keys as in $diffinfo)
3861sub is_patch_split {
3862        my ($diffinfo, $patchinfo) = @_;
3863
3864        return defined $diffinfo && defined $patchinfo
3865                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
3866}
3867
3868
3869sub git_difftree_body {
3870        my ($difftree, $hash, @parents) = @_;
3871        my ($parent) = $parents[0];
3872        my $have_blame = gitweb_check_feature('blame');
3873        print "<div class=\"list_head\">\n";
3874        if ($#{$difftree} > 10) {
3875                print(($#{$difftree} + 1) . " files changed:\n");
3876        }
3877        print "</div>\n";
3878
3879        print "<table class=\"" .
3880              (@parents > 1 ? "combined " : "") .
3881              "diff_tree\">\n";
3882
3883        # header only for combined diff in 'commitdiff' view
3884        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
3885        if ($has_header) {
3886                # table header
3887                print "<thead><tr>\n" .
3888                       "<th></th><th></th>\n"; # filename, patchN link
3889                for (my $i = 0; $i < @parents; $i++) {
3890                        my $par = $parents[$i];
3891                        print "<th>" .
3892                              $cgi->a({-href => href(action=>"commitdiff",
3893                                                     hash=>$hash, hash_parent=>$par),
3894                                       -title => 'commitdiff to parent number ' .
3895                                                  ($i+1) . ': ' . substr($par,0,7)},
3896                                      $i+1) .
3897                              "&nbsp;</th>\n";
3898                }
3899                print "</tr></thead>\n<tbody>\n";
3900        }
3901
3902        my $alternate = 1;
3903        my $patchno = 0;
3904        foreach my $line (@{$difftree}) {
3905                my $diff = parsed_difftree_line($line);
3906
3907                if ($alternate) {
3908                        print "<tr class=\"dark\">\n";
3909                } else {
3910                        print "<tr class=\"light\">\n";
3911                }
3912                $alternate ^= 1;
3913
3914                if (exists $diff->{'nparents'}) { # combined diff
3915
3916                        fill_from_file_info($diff, @parents)
3917                                unless exists $diff->{'from_file'};
3918
3919                        if (!is_deleted($diff)) {
3920                                # file exists in the result (child) commit
3921                                print "<td>" .
3922                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
3923                                                             file_name=>$diff->{'to_file'},
3924                                                             hash_base=>$hash),
3925                                              -class => "list"}, esc_path($diff->{'to_file'})) .
3926                                      "</td>\n";
3927                        } else {
3928                                print "<td>" .
3929                                      esc_path($diff->{'to_file'}) .
3930                                      "</td>\n";
3931                        }
3932
3933                        if ($action eq 'commitdiff') {
3934                                # link to patch
3935                                $patchno++;
3936                                print "<td class=\"link\">" .
3937                                      $cgi->a({-href => "#patch$patchno"}, "patch") .
3938                                      " | " .
3939                                      "</td>\n";
3940                        }
3941
3942                        my $has_history = 0;
3943                        my $not_deleted = 0;
3944                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
3945                                my $hash_parent = $parents[$i];
3946                                my $from_hash = $diff->{'from_id'}[$i];
3947                                my $from_path = $diff->{'from_file'}[$i];
3948                                my $status = $diff->{'status'}[$i];
3949
3950                                $has_history ||= ($status ne 'A');
3951                                $not_deleted ||= ($status ne 'D');
3952
3953                                if ($status eq 'A') {
3954                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
3955                                } elsif ($status eq 'D') {
3956                                        print "<td class=\"link\">" .
3957                                              $cgi->a({-href => href(action=>"blob",
3958                                                                     hash_base=>$hash,
3959                                                                     hash=>$from_hash,
3960                                                                     file_name=>$from_path)},
3961                                                      "blob" . ($i+1)) .
3962                                              " | </td>\n";
3963                                } else {
3964                                        if ($diff->{'to_id'} eq $from_hash) {
3965                                                print "<td class=\"link nochange\">";
3966                                        } else {
3967                                                print "<td class=\"link\">";
3968                                        }
3969                                        print $cgi->a({-href => href(action=>"blobdiff",
3970                                                                     hash=>$diff->{'to_id'},
3971                                                                     hash_parent=>$from_hash,
3972                                                                     hash_base=>$hash,
3973                                                                     hash_parent_base=>$hash_parent,
3974                                                                     file_name=>$diff->{'to_file'},
3975                                                                     file_parent=>$from_path)},
3976                                                      "diff" . ($i+1)) .
3977                                              " | </td>\n";
3978                                }
3979                        }
3980
3981                        print "<td class=\"link\">";
3982                        if ($not_deleted) {
3983                                print $cgi->a({-href => href(action=>"blob",
3984                                                             hash=>$diff->{'to_id'},
3985                                                             file_name=>$diff->{'to_file'},
3986                                                             hash_base=>$hash)},
3987                                              "blob");
3988                                print " | " if ($has_history);
3989                        }
3990                        if ($has_history) {
3991                                print $cgi->a({-href => href(action=>"history",
3992                                                             file_name=>$diff->{'to_file'},
3993                                                             hash_base=>$hash)},
3994                                              "history");
3995                        }
3996                        print "</td>\n";
3997
3998                        print "</tr>\n";
3999                        next; # instead of 'else' clause, to avoid extra indent
4000                }
4001                # else ordinary diff
4002
4003                my ($to_mode_oct, $to_mode_str, $to_file_type);
4004                my ($from_mode_oct, $from_mode_str, $from_file_type);
4005                if ($diff->{'to_mode'} ne ('0' x 6)) {
4006                        $to_mode_oct = oct $diff->{'to_mode'};
4007                        if (S_ISREG($to_mode_oct)) { # only for regular file
4008                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
4009                        }
4010                        $to_file_type = file_type($diff->{'to_mode'});
4011                }
4012                if ($diff->{'from_mode'} ne ('0' x 6)) {
4013                        $from_mode_oct = oct $diff->{'from_mode'};
4014                        if (S_ISREG($to_mode_oct)) { # only for regular file
4015                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
4016                        }
4017                        $from_file_type = file_type($diff->{'from_mode'});
4018                }
4019
4020                if ($diff->{'status'} eq "A") { # created
4021                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
4022                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
4023                        $mode_chng   .= "]</span>";
4024                        print "<td>";
4025                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4026                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
4027                                      -class => "list"}, esc_path($diff->{'file'}));
4028                        print "</td>\n";
4029                        print "<td>$mode_chng</td>\n";
4030                        print "<td class=\"link\">";
4031                        if ($action eq 'commitdiff') {
4032                                # link to patch
4033                                $patchno++;
4034                                print $cgi->a({-href => "#patch$patchno"}, "patch");
4035                                print " | ";
4036                        }
4037                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4038                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
4039                                      "blob");
4040                        print "</td>\n";
4041
4042                } elsif ($diff->{'status'} eq "D") { # deleted
4043                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
4044                        print "<td>";
4045                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4046                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
4047                                       -class => "list"}, esc_path($diff->{'file'}));
4048                        print "</td>\n";
4049                        print "<td>$mode_chng</td>\n";
4050                        print "<td class=\"link\">";
4051                        if ($action eq 'commitdiff') {
4052                                # link to patch
4053                                $patchno++;
4054                                print $cgi->a({-href => "#patch$patchno"}, "patch");
4055                                print " | ";
4056                        }
4057                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4058                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
4059                                      "blob") . " | ";
4060                        if ($have_blame) {
4061                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
4062                                                             file_name=>$diff->{'file'})},
4063                                              "blame") . " | ";
4064                        }
4065                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
4066                                                     file_name=>$diff->{'file'})},
4067                                      "history");
4068                        print "</td>\n";
4069
4070                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
4071                        my $mode_chnge = "";
4072                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4073                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
4074                                if ($from_file_type ne $to_file_type) {
4075                                        $mode_chnge .= " from $from_file_type to $to_file_type";
4076                                }
4077                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
4078                                        if ($from_mode_str && $to_mode_str) {
4079                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
4080                                        } elsif ($to_mode_str) {
4081                                                $mode_chnge .= " mode: $to_mode_str";
4082                                        }
4083                                }
4084                                $mode_chnge .= "]</span>\n";
4085                        }
4086                        print "<td>";
4087                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4088                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
4089                                      -class => "list"}, esc_path($diff->{'file'}));
4090                        print "</td>\n";
4091                        print "<td>$mode_chnge</td>\n";
4092                        print "<td class=\"link\">";
4093                        if ($action eq 'commitdiff') {
4094                                # link to patch
4095                                $patchno++;
4096                                print $cgi->a({-href => "#patch$patchno"}, "patch") .
4097                                      " | ";
4098                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4099                                # "commit" view and modified file (not onlu mode changed)
4100                                print $cgi->a({-href => href(action=>"blobdiff",
4101                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4102                                                             hash_base=>$hash, hash_parent_base=>$parent,
4103                                                             file_name=>$diff->{'file'})},
4104                                              "diff") .
4105                                      " | ";
4106                        }
4107                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4108                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
4109                                       "blob") . " | ";
4110                        if ($have_blame) {
4111                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4112                                                             file_name=>$diff->{'file'})},
4113                                              "blame") . " | ";
4114                        }
4115                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4116                                                     file_name=>$diff->{'file'})},
4117                                      "history");
4118                        print "</td>\n";
4119
4120                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
4121                        my %status_name = ('R' => 'moved', 'C' => 'copied');
4122                        my $nstatus = $status_name{$diff->{'status'}};
4123                        my $mode_chng = "";
4124                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4125                                # mode also for directories, so we cannot use $to_mode_str
4126                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
4127                        }
4128                        print "<td>" .
4129                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
4130                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
4131                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
4132                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
4133                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
4134                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
4135                                      -class => "list"}, esc_path($diff->{'from_file'})) .
4136                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
4137                              "<td class=\"link\">";
4138                        if ($action eq 'commitdiff') {
4139                                # link to patch
4140                                $patchno++;
4141                                print $cgi->a({-href => "#patch$patchno"}, "patch") .
4142                                      " | ";
4143                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4144                                # "commit" view and modified file (not only pure rename or copy)
4145                                print $cgi->a({-href => href(action=>"blobdiff",
4146                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4147                                                             hash_base=>$hash, hash_parent_base=>$parent,
4148                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
4149                                              "diff") .
4150                                      " | ";
4151                        }
4152                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4153                                                     hash_base=>$parent, file_name=>$diff->{'to_file'})},
4154                                      "blob") . " | ";
4155                        if ($have_blame) {
4156                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4157                                                             file_name=>$diff->{'to_file'})},
4158                                              "blame") . " | ";
4159                        }
4160                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4161                                                    file_name=>$diff->{'to_file'})},
4162                                      "history");
4163                        print "</td>\n";
4164
4165                } # we should not encounter Unmerged (U) or Unknown (X) status
4166                print "</tr>\n";
4167        }
4168        print "</tbody>" if $has_header;
4169        print "</table>\n";
4170}
4171
4172sub git_patchset_body {
4173        my ($fd, $difftree, $hash, @hash_parents) = @_;
4174        my ($hash_parent) = $hash_parents[0];
4175
4176        my $is_combined = (@hash_parents > 1);
4177        my $patch_idx = 0;
4178        my $patch_number = 0;
4179        my $patch_line;
4180        my $diffinfo;
4181        my $to_name;
4182        my (%from, %to);
4183
4184        print "<div class=\"patchset\">\n";
4185
4186        # skip to first patch
4187        while ($patch_line = <$fd>) {
4188                chomp $patch_line;
4189
4190                last if ($patch_line =~ m/^diff /);
4191        }
4192
4193 PATCH:
4194        while ($patch_line) {
4195
4196                # parse "git diff" header line
4197                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
4198                        # $1 is from_name, which we do not use
4199                        $to_name = unquote($2);
4200                        $to_name =~ s!^b/!!;
4201                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
4202                        # $1 is 'cc' or 'combined', which we do not use
4203                        $to_name = unquote($2);
4204                } else {
4205                        $to_name = undef;
4206                }
4207
4208                # check if current patch belong to current raw line
4209                # and parse raw git-diff line if needed
4210                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
4211                        # this is continuation of a split patch
4212                        print "<div class=\"patch cont\">\n";
4213                } else {
4214                        # advance raw git-diff output if needed
4215                        $patch_idx++ if defined $diffinfo;
4216
4217                        # read and prepare patch information
4218                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
4219
4220                        # compact combined diff output can have some patches skipped
4221                        # find which patch (using pathname of result) we are at now;
4222                        if ($is_combined) {
4223                                while ($to_name ne $diffinfo->{'to_file'}) {
4224                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
4225                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
4226                                              "</div>\n";  # class="patch"
4227
4228                                        $patch_idx++;
4229                                        $patch_number++;
4230
4231                                        last if $patch_idx > $#$difftree;
4232                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
4233                                }
4234                        }
4235
4236                        # modifies %from, %to hashes
4237                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);
4238
4239                        # this is first patch for raw difftree line with $patch_idx index
4240                        # we index @$difftree array from 0, but number patches from 1
4241                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
4242                }
4243
4244                # git diff header
4245                #assert($patch_line =~ m/^diff /) if DEBUG;
4246                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
4247                $patch_number++;
4248                # print "git diff" header
4249                print format_git_diff_header_line($patch_line, $diffinfo,
4250                                                  \%from, \%to);
4251
4252                # print extended diff header
4253                print "<div class=\"diff extended_header\">\n";
4254        EXTENDED_HEADER:
4255                while ($patch_line = <$fd>) {
4256                        chomp $patch_line;
4257
4258                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);
4259
4260                        print format_extended_diff_header_line($patch_line, $diffinfo,
4261                                                               \%from, \%to);
4262                }
4263                print "</div>\n"; # class="diff extended_header"
4264
4265                # from-file/to-file diff header
4266                if (! $patch_line) {
4267                        print "</div>\n"; # class="patch"
4268                        last PATCH;
4269                }
4270                next PATCH if ($patch_line =~ m/^diff /);
4271                #assert($patch_line =~ m/^---/) if DEBUG;
4272
4273                my $last_patch_line = $patch_line;
4274                $patch_line = <$fd>;
4275                chomp $patch_line;
4276                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;
4277
4278                print format_diff_from_to_header($last_patch_line, $patch_line,
4279                                                 $diffinfo, \%from, \%to,
4280                                                 @hash_parents);
4281
4282                # the patch itself
4283        LINE:
4284                while ($patch_line = <$fd>) {
4285                        chomp $patch_line;
4286
4287                        next PATCH if ($patch_line =~ m/^diff /);
4288
4289                        print format_diff_line($patch_line, \%from, \%to);
4290                }
4291
4292        } continue {
4293                print "</div>\n"; # class="patch"
4294        }
4295
4296        # for compact combined (--cc) format, with chunk and patch simpliciaction
4297        # patchset might be empty, but there might be unprocessed raw lines
4298        for (++$patch_idx if $patch_number > 0;
4299             $patch_idx < @$difftree;
4300             ++$patch_idx) {
4301                # read and prepare patch information
4302                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
4303
4304                # generate anchor for "patch" links in difftree / whatchanged part
4305                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
4306                      format_diff_cc_simplified($diffinfo, @hash_parents) .
4307                      "</div>\n";  # class="patch"
4308
4309                $patch_number++;
4310        }
4311
4312        if ($patch_number == 0) {
4313                if (@hash_parents > 1) {
4314                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
4315                } else {
4316                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
4317                }
4318        }
4319
4320        print "</div>\n"; # class="patchset"
4321}
4322
4323# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4324
4325# fills project list info (age, description, owner, forks) for each
4326# project in the list, removing invalid projects from returned list
4327# NOTE: modifies $projlist, but does not remove entries from it
4328sub fill_project_list_info {
4329        my ($projlist, $check_forks) = @_;
4330        my @projects;
4331
4332        my $show_ctags = gitweb_check_feature('ctags');
4333 PROJECT:
4334        foreach my $pr (@$projlist) {
4335                my (@activity) = git_get_last_activity($pr->{'path'});
4336                unless (@activity) {
4337                        next PROJECT;
4338                }
4339                ($pr->{'age'}, $pr->{'age_string'}) = @activity;
4340                if (!defined $pr->{'descr'}) {
4341                        my $descr = git_get_project_description($pr->{'path'}) || "";
4342                        $descr = to_utf8($descr);
4343                        $pr->{'descr_long'} = $descr;
4344                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
4345                }
4346                if (!defined $pr->{'owner'}) {
4347                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
4348                }
4349                if ($check_forks) {
4350                        my $pname = $pr->{'path'};
4351                        if (($pname =~ s/\.git$//) &&
4352                            ($pname !~ /\/$/) &&
4353                            (-d "$projectroot/$pname")) {
4354                                $pr->{'forks'} = "-d $projectroot/$pname";
4355                        } else {
4356                                $pr->{'forks'} = 0;
4357                        }
4358                }
4359                $show_ctags and $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
4360                push @projects, $pr;
4361        }
4362
4363        return @projects;
4364}
4365
4366# print 'sort by' <th> element, generating 'sort by $name' replay link
4367# if that order is not selected
4368sub print_sort_th {
4369        print format_sort_th(@_);
4370}
4371
4372sub format_sort_th {
4373        my ($name, $order, $header) = @_;
4374        my $sort_th = "";
4375        $header ||= ucfirst($name);
4376
4377        if ($order eq $name) {
4378                $sort_th .= "<th>$header</th>\n";
4379        } else {
4380                $sort_th .= "<th>" .
4381                            $cgi->a({-href => href(-replay=>1, order=>$name),
4382                                     -class => "header"}, $header) .
4383                            "</th>\n";
4384        }
4385
4386        return $sort_th;
4387}
4388
4389sub git_project_list_body {
4390        # actually uses global variable $project
4391        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
4392
4393        my $check_forks = gitweb_check_feature('forks');
4394        my @projects = fill_project_list_info($projlist, $check_forks);
4395
4396        $order ||= $default_projects_order;
4397        $from = 0 unless defined $from;
4398        $to = $#projects if (!defined $to || $#projects < $to);
4399
4400        my %order_info = (
4401                project => { key => 'path', type => 'str' },
4402                descr => { key => 'descr_long', type => 'str' },
4403                owner => { key => 'owner', type => 'str' },
4404                age => { key => 'age', type => 'num' }
4405        );
4406        my $oi = $order_info{$order};
4407        if ($oi->{'type'} eq 'str') {
4408                @projects = sort {$a->{$oi->{'key'}} cmp $b->{$oi->{'key'}}} @projects;
4409        } else {
4410                @projects = sort {$a->{$oi->{'key'}} <=> $b->{$oi->{'key'}}} @projects;
4411        }
4412
4413        my $show_ctags = gitweb_check_feature('ctags');
4414        if ($show_ctags) {
4415                my %ctags;
4416                foreach my $p (@projects) {
4417                        foreach my $ct (keys %{$p->{'ctags'}}) {
4418                                $ctags{$ct} += $p->{'ctags'}->{$ct};
4419                        }
4420                }
4421                my $cloud = git_populate_project_tagcloud(\%ctags);
4422                print git_show_project_tagcloud($cloud, 64);
4423        }
4424
4425        print "<table class=\"project_list\">\n";
4426        unless ($no_header) {
4427                print "<tr>\n";
4428                if ($check_forks) {
4429                        print "<th></th>\n";
4430                }
4431                print_sort_th('project', $order, 'Project');
4432                print_sort_th('descr', $order, 'Description');
4433                print_sort_th('owner', $order, 'Owner');
4434                print_sort_th('age', $order, 'Last Change');
4435                print "<th></th>\n" . # for links
4436                      "</tr>\n";
4437        }
4438        my $alternate = 1;
4439        my $tagfilter = $cgi->param('by_tag');
4440        for (my $i = $from; $i <= $to; $i++) {
4441                my $pr = $projects[$i];
4442
4443                next if $tagfilter and $show_ctags and not grep { lc $_ eq lc $tagfilter } keys %{$pr->{'ctags'}};
4444                next if $searchtext and not $pr->{'path'} =~ /$searchtext/
4445                        and not $pr->{'descr_long'} =~ /$searchtext/;
4446                # Weed out forks or non-matching entries of search
4447                if ($check_forks) {
4448                        my $forkbase = $project; $forkbase ||= ''; $forkbase =~ s#\.git$#/#;
4449                        $forkbase="^$forkbase" if $forkbase;
4450                        next if not $searchtext and not $tagfilter and $show_ctags
4451                                and $pr->{'path'} =~ m#$forkbase.*/.*#; # regexp-safe
4452                }
4453
4454                if ($alternate) {
4455                        print "<tr class=\"dark\">\n";
4456                } else {
4457                        print "<tr class=\"light\">\n";
4458                }
4459                $alternate ^= 1;
4460                if ($check_forks) {
4461                        print "<td>";
4462                        if ($pr->{'forks'}) {
4463                                print "<!-- $pr->{'forks'} -->\n";
4464                                print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "+");
4465                        }
4466                        print "</td>\n";
4467                }
4468                print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
4469                                        -class => "list"}, esc_html($pr->{'path'})) . "</td>\n" .
4470                      "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
4471                                        -class => "list", -title => $pr->{'descr_long'}},
4472                                        esc_html($pr->{'descr'})) . "</td>\n" .
4473                      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
4474                print "<td class=\"". age_class($pr->{'age'}) . "\">" .
4475                      (defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits") . "</td>\n" .
4476                      "<td class=\"link\">" .
4477                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary")}, "summary")   . " | " .
4478                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"shortlog")}, "shortlog") . " | " .
4479                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"log")}, "log") . " | " .
4480                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"tree")}, "tree") .
4481                      ($pr->{'forks'} ? " | " . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks") : '') .
4482                      "</td>\n" .
4483                      "</tr>\n";
4484        }
4485        if (defined $extra) {
4486                print "<tr>\n";
4487                if ($check_forks) {
4488                        print "<td></td>\n";
4489                }
4490                print "<td colspan=\"5\">$extra</td>\n" .
4491                      "</tr>\n";
4492        }
4493        print "</table>\n";
4494}
4495
4496sub git_log_body {
4497        # uses global variable $project
4498        my ($commitlist, $from, $to, $refs, $extra) = @_;
4499
4500        $from = 0 unless defined $from;
4501        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);
4502
4503        for (my $i = 0; $i <= $to; $i++) {
4504                my %co = %{$commitlist->[$i]};
4505                next if !%co;
4506                my $commit = $co{'id'};
4507                my $ref = format_ref_marker($refs, $commit);
4508                my %ad = parse_date($co{'author_epoch'});
4509                git_print_header_div('commit',
4510                               "<span class=\"age\">$co{'age_string'}</span>" .
4511                               esc_html($co{'title'}) . $ref,
4512                               $commit);
4513                print "<div class=\"title_text\">\n" .
4514                      "<div class=\"log_link\">\n" .
4515                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
4516                      " | " .
4517                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
4518                      " | " .
4519                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
4520                      "<br/>\n" .
4521                      "</div>\n";
4522                      git_print_authorship(\%co, -tag => 'span');
4523                      print "<br/>\n</div>\n";
4524
4525                print "<div class=\"log_body\">\n";
4526                git_print_log($co{'comment'}, -final_empty_line=> 1);
4527                print "</div>\n";
4528        }
4529        if ($extra) {
4530                print "<div class=\"page_nav\">\n";
4531                print "$extra\n";
4532                print "</div>\n";
4533        }
4534}
4535
4536sub git_shortlog_body {
4537        # uses global variable $project
4538        my ($commitlist, $from, $to, $refs, $extra) = @_;
4539
4540        $from = 0 unless defined $from;
4541        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);
4542
4543        print "<table class=\"shortlog\">\n";
4544        my $alternate = 1;
4545        for (my $i = $from; $i <= $to; $i++) {
4546                my %co = %{$commitlist->[$i]};
4547                my $commit = $co{'id'};
4548                my $ref = format_ref_marker($refs, $commit);
4549                if ($alternate) {
4550                        print "<tr class=\"dark\">\n";
4551                } else {
4552                        print "<tr class=\"light\">\n";
4553                }
4554                $alternate ^= 1;
4555                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
4556                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
4557                      format_author_html('td', \%co, 10) . "<td>";
4558                print format_subject_html($co{'title'}, $co{'title_short'},
4559                                          href(action=>"commit", hash=>$commit), $ref);
4560                print "</td>\n" .
4561                      "<td class=\"link\">" .
4562                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") . " | " .
4563                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") . " | " .
4564                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
4565                my $snapshot_links = format_snapshot_links($commit);
4566                if (defined $snapshot_links) {
4567                        print " | " . $snapshot_links;
4568                }
4569                print "</td>\n" .
4570                      "</tr>\n";
4571        }
4572        if (defined $extra) {
4573                print "<tr>\n" .
4574                      "<td colspan=\"4\">$extra</td>\n" .
4575                      "</tr>\n";
4576        }
4577        print "</table>\n";
4578}
4579
4580sub git_history_body {
4581        # Warning: assumes constant type (blob or tree) during history
4582        my ($commitlist, $from, $to, $refs, $extra,
4583            $file_name, $file_hash, $ftype) = @_;
4584
4585        $from = 0 unless defined $from;
4586        $to = $#{$commitlist} unless (defined $to && $to <= $#{$commitlist});
4587
4588        print "<table class=\"history\">\n";
4589        my $alternate = 1;
4590        for (my $i = $from; $i <= $to; $i++) {
4591                my %co = %{$commitlist->[$i]};
4592                if (!%co) {
4593                        next;
4594                }
4595                my $commit = $co{'id'};
4596
4597                my $ref = format_ref_marker($refs, $commit);
4598
4599                if ($alternate) {
4600                        print "<tr class=\"dark\">\n";
4601                } else {
4602                        print "<tr class=\"light\">\n";
4603                }
4604                $alternate ^= 1;
4605                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
4606        # shortlog:   format_author_html('td', \%co, 10)
4607                      format_author_html('td', \%co, 15, 3) . "<td>";
4608                # originally git_history used chop_str($co{'title'}, 50)
4609                print format_subject_html($co{'title'}, $co{'title_short'},
4610                                          href(action=>"commit", hash=>$commit), $ref);
4611                print "</td>\n" .
4612                      "<td class=\"link\">" .
4613                      $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype) . " | " .
4614                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
4615
4616                if ($ftype eq 'blob') {
4617                        my $blob_current = $file_hash;
4618                        my $blob_parent  = git_get_hash_by_path($commit, $file_name);
4619                        if (defined $blob_current && defined $blob_parent &&
4620                                        $blob_current ne $blob_parent) {
4621                                print " | " .
4622                                        $cgi->a({-href => href(action=>"blobdiff",
4623                                                               hash=>$blob_current, hash_parent=>$blob_parent,
4624                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
4625                                                               file_name=>$file_name)},
4626                                                "diff to current");
4627                        }
4628                }
4629                print "</td>\n" .
4630                      "</tr>\n";
4631        }
4632        if (defined $extra) {
4633                print "<tr>\n" .
4634                      "<td colspan=\"4\">$extra</td>\n" .
4635                      "</tr>\n";
4636        }
4637        print "</table>\n";
4638}
4639
4640sub git_tags_body {
4641        # uses global variable $project
4642        my ($taglist, $from, $to, $extra) = @_;
4643        $from = 0 unless defined $from;
4644        $to = $#{$taglist} if (!defined $to || $#{$taglist} < $to);
4645
4646        print "<table class=\"tags\">\n";
4647        my $alternate = 1;
4648        for (my $i = $from; $i <= $to; $i++) {
4649                my $entry = $taglist->[$i];
4650                my %tag = %$entry;
4651                my $comment = $tag{'subject'};
4652                my $comment_short;
4653                if (defined $comment) {
4654                        $comment_short = chop_str($comment, 30, 5);
4655                }
4656                if ($alternate) {
4657                        print "<tr class=\"dark\">\n";
4658                } else {
4659                        print "<tr class=\"light\">\n";
4660                }
4661                $alternate ^= 1;
4662                if (defined $tag{'age'}) {
4663                        print "<td><i>$tag{'age'}</i></td>\n";
4664                } else {
4665                        print "<td></td>\n";
4666                }
4667                print "<td>" .
4668                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
4669                               -class => "list name"}, esc_html($tag{'name'})) .
4670                      "</td>\n" .
4671                      "<td>";
4672                if (defined $comment) {
4673                        print format_subject_html($comment, $comment_short,
4674                                                  href(action=>"tag", hash=>$tag{'id'}));
4675                }
4676                print "</td>\n" .
4677                      "<td class=\"selflink\">";
4678                if ($tag{'type'} eq "tag") {
4679                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
4680                } else {
4681                        print "&nbsp;";
4682                }
4683                print "</td>\n" .
4684                      "<td class=\"link\">" . " | " .
4685                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
4686                if ($tag{'reftype'} eq "commit") {
4687                        print " | " . $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog") .
4688                              " | " . $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
4689                } elsif ($tag{'reftype'} eq "blob") {
4690                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
4691                }
4692                print "</td>\n" .
4693                      "</tr>";
4694        }
4695        if (defined $extra) {
4696                print "<tr>\n" .
4697                      "<td colspan=\"5\">$extra</td>\n" .
4698                      "</tr>\n";
4699        }
4700        print "</table>\n";
4701}
4702
4703sub git_heads_body {
4704        # uses global variable $project
4705        my ($headlist, $head, $from, $to, $extra) = @_;
4706        $from = 0 unless defined $from;
4707        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);
4708
4709        print "<table class=\"heads\">\n";
4710        my $alternate = 1;
4711        for (my $i = $from; $i <= $to; $i++) {
4712                my $entry = $headlist->[$i];
4713                my %ref = %$entry;
4714                my $curr = $ref{'id'} eq $head;
4715                if ($alternate) {
4716                        print "<tr class=\"dark\">\n";
4717                } else {
4718                        print "<tr class=\"light\">\n";
4719                }
4720                $alternate ^= 1;
4721                print "<td><i>$ref{'age'}</i></td>\n" .
4722                      ($curr ? "<td class=\"current_head\">" : "<td>") .
4723                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
4724                               -class => "list name"},esc_html($ref{'name'})) .
4725                      "</td>\n" .
4726                      "<td class=\"link\">" .
4727                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
4728                      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
4729                      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'name'})}, "tree") .
4730                      "</td>\n" .
4731                      "</tr>";
4732        }
4733        if (defined $extra) {
4734                print "<tr>\n" .
4735                      "<td colspan=\"3\">$extra</td>\n" .
4736                      "</tr>\n";
4737        }
4738        print "</table>\n";
4739}
4740
4741sub git_search_grep_body {
4742        my ($commitlist, $from, $to, $extra) = @_;
4743        $from = 0 unless defined $from;
4744        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);
4745
4746        print "<table class=\"commit_search\">\n";
4747        my $alternate = 1;
4748        for (my $i = $from; $i <= $to; $i++) {
4749                my %co = %{$commitlist->[$i]};
4750                if (!%co) {
4751                        next;
4752                }
4753                my $commit = $co{'id'};
4754                if ($alternate) {
4755                        print "<tr class=\"dark\">\n";
4756                } else {
4757                        print "<tr class=\"light\">\n";
4758                }
4759                $alternate ^= 1;
4760                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
4761                      format_author_html('td', \%co, 15, 5) .
4762                      "<td>" .
4763                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
4764                               -class => "list subject"},
4765                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
4766                my $comment = $co{'comment'};
4767                foreach my $line (@$comment) {
4768                        if ($line =~ m/^(.*?)($search_regexp)(.*)$/i) {
4769                                my ($lead, $match, $trail) = ($1, $2, $3);
4770                                $match = chop_str($match, 70, 5, 'center');
4771                                my $contextlen = int((80 - length($match))/2);
4772                                $contextlen = 30 if ($contextlen > 30);
4773                                $lead  = chop_str($lead,  $contextlen, 10, 'left');
4774                                $trail = chop_str($trail, $contextlen, 10, 'right');
4775
4776                                $lead  = esc_html($lead);
4777                                $match = esc_html($match);
4778                                $trail = esc_html($trail);
4779
4780                                print "$lead<span class=\"match\">$match</span>$trail<br />";
4781                        }
4782                }
4783                print "</td>\n" .
4784                      "<td class=\"link\">" .
4785                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
4786                      " | " .
4787                      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
4788                      " | " .
4789                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
4790                print "</td>\n" .
4791                      "</tr>\n";
4792        }
4793        if (defined $extra) {
4794                print "<tr>\n" .
4795                      "<td colspan=\"3\">$extra</td>\n" .
4796                      "</tr>\n";
4797        }
4798        print "</table>\n";
4799}
4800
4801## ======================================================================
4802## ======================================================================
4803## actions
4804
4805sub git_project_list {
4806        my $order = $input_params{'order'};
4807        if (defined $order && $order !~ m/none|project|descr|owner|age/) {
4808                die_error(400, "Unknown order parameter");
4809        }
4810
4811        my @list = git_get_projects_list();
4812        if (!@list) {
4813                die_error(404, "No projects found");
4814        }
4815
4816        git_header_html();
4817        if (defined $home_text && -f $home_text) {
4818                print "<div class=\"index_include\">\n";
4819                insert_file($home_text);
4820                print "</div>\n";
4821        }
4822        print $cgi->startform(-method => "get") .
4823              "<p class=\"projsearch\">Search:\n" .
4824              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
4825              "</p>" .
4826              $cgi->end_form() . "\n";
4827        git_project_list_body(\@list, $order);
4828        git_footer_html();
4829}
4830
4831sub git_forks {
4832        my $order = $input_params{'order'};
4833        if (defined $order && $order !~ m/none|project|descr|owner|age/) {
4834                die_error(400, "Unknown order parameter");
4835        }
4836
4837        my @list = git_get_projects_list($project);
4838        if (!@list) {
4839                die_error(404, "No forks found");
4840        }
4841
4842        git_header_html();
4843        git_print_page_nav('','');
4844        git_print_header_div('summary', "$project forks");
4845        git_project_list_body(\@list, $order);
4846        git_footer_html();
4847}
4848
4849sub git_project_index {
4850        my @projects = git_get_projects_list($project);
4851
4852        print $cgi->header(
4853                -type => 'text/plain',
4854                -charset => 'utf-8',
4855                -content_disposition => 'inline; filename="index.aux"');
4856
4857        foreach my $pr (@projects) {
4858                if (!exists $pr->{'owner'}) {
4859                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}");
4860                }
4861
4862                my ($path, $owner) = ($pr->{'path'}, $pr->{'owner'});
4863                # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
4864                $path  =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
4865                $owner =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
4866                $path  =~ s/ /\+/g;
4867                $owner =~ s/ /\+/g;
4868
4869                print "$path $owner\n";
4870        }
4871}
4872
4873sub git_summary {
4874        my $descr = git_get_project_description($project) || "none";
4875        my %co = parse_commit("HEAD");
4876        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
4877        my $head = $co{'id'};
4878
4879        my $owner = git_get_project_owner($project);
4880
4881        my $refs = git_get_references();
4882        # These get_*_list functions return one more to allow us to see if
4883        # there are more ...
4884        my @taglist  = git_get_tags_list(16);
4885        my @headlist = git_get_heads_list(16);
4886        my @forklist;
4887        my $check_forks = gitweb_check_feature('forks');
4888
4889        if ($check_forks) {
4890                @forklist = git_get_projects_list($project);
4891        }
4892
4893        git_header_html();
4894        git_print_page_nav('summary','', $head);
4895
4896        print "<div class=\"title\">&nbsp;</div>\n";
4897        print "<table class=\"projects_list\">\n" .
4898              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
4899              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
4900        if (defined $cd{'rfc2822'}) {
4901                print "<tr id=\"metadata_lchange\"><td>last change</td><td>$cd{'rfc2822'}</td></tr>\n";
4902        }
4903
4904        # use per project git URL list in $projectroot/$project/cloneurl
4905        # or make project git URL from git base URL and project name
4906        my $url_tag = "URL";
4907        my @url_list = git_get_project_url_list($project);
4908        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
4909        foreach my $git_url (@url_list) {
4910                next unless $git_url;
4911                print "<tr class=\"metadata_url\"><td>$url_tag</td><td>$git_url</td></tr>\n";
4912                $url_tag = "";
4913        }
4914
4915        # Tag cloud
4916        my $show_ctags = gitweb_check_feature('ctags');
4917        if ($show_ctags) {
4918                my $ctags = git_get_project_ctags($project);
4919                my $cloud = git_populate_project_tagcloud($ctags);
4920                print "<tr id=\"metadata_ctags\"><td>Content tags:<br />";
4921                print "</td>\n<td>" unless %$ctags;
4922                print "<form action=\"$show_ctags\" method=\"post\"><input type=\"hidden\" name=\"p\" value=\"$project\" />Add: <input type=\"text\" name=\"t\" size=\"8\" /></form>";
4923                print "</td>\n<td>" if %$ctags;
4924                print git_show_project_tagcloud($cloud, 48);
4925                print "</td></tr>";
4926        }
4927
4928        print "</table>\n";
4929
4930        # If XSS prevention is on, we don't include README.html.
4931        # TODO: Allow a readme in some safe format.
4932        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
4933                print "<div class=\"title\">readme</div>\n" .
4934                      "<div class=\"readme\">\n";
4935                insert_file("$projectroot/$project/README.html");
4936                print "\n</div>\n"; # class="readme"
4937        }
4938
4939        # we need to request one more than 16 (0..15) to check if
4940        # those 16 are all
4941        my @commitlist = $head ? parse_commits($head, 17) : ();
4942        if (@commitlist) {
4943                git_print_header_div('shortlog');
4944                git_shortlog_body(\@commitlist, 0, 15, $refs,
4945                                  $#commitlist <=  15 ? undef :
4946                                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
4947        }
4948
4949        if (@taglist) {
4950                git_print_header_div('tags');
4951                git_tags_body(\@taglist, 0, 15,
4952                              $#taglist <=  15 ? undef :
4953                              $cgi->a({-href => href(action=>"tags")}, "..."));
4954        }
4955
4956        if (@headlist) {
4957                git_print_header_div('heads');
4958                git_heads_body(\@headlist, $head, 0, 15,
4959                               $#headlist <= 15 ? undef :
4960                               $cgi->a({-href => href(action=>"heads")}, "..."));
4961        }
4962
4963        if (@forklist) {
4964                git_print_header_div('forks');
4965                git_project_list_body(\@forklist, 'age', 0, 15,
4966                                      $#forklist <= 15 ? undef :
4967                                      $cgi->a({-href => href(action=>"forks")}, "..."),
4968                                      'no_header');
4969        }
4970
4971        git_footer_html();
4972}
4973
4974sub git_tag {
4975        my $head = git_get_head_hash($project);
4976        git_header_html();
4977        git_print_page_nav('','', $head,undef,$head);
4978        my %tag = parse_tag($hash);
4979
4980        if (! %tag) {
4981                die_error(404, "Unknown tag object");
4982        }
4983
4984        git_print_header_div('commit', esc_html($tag{'name'}), $hash);
4985        print "<div class=\"title_text\">\n" .
4986              "<table class=\"object_header\">\n" .
4987              "<tr>\n" .
4988              "<td>object</td>\n" .
4989              "<td>" . $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
4990                               $tag{'object'}) . "</td>\n" .
4991              "<td class=\"link\">" . $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
4992                                              $tag{'type'}) . "</td>\n" .
4993              "</tr>\n";
4994        if (defined($tag{'author'})) {
4995                git_print_authorship_rows(\%tag, 'author');
4996        }
4997        print "</table>\n\n" .
4998              "</div>\n";
4999        print "<div class=\"page_body\">";
5000        my $comment = $tag{'comment'};
5001        foreach my $line (@$comment) {
5002                chomp $line;
5003                print esc_html($line, -nbsp=>1) . "<br/>\n";
5004        }
5005        print "</div>\n";
5006        git_footer_html();
5007}
5008
5009sub git_blame_common {
5010        my $format = shift || 'porcelain';
5011        if ($format eq 'porcelain' && $cgi->param('js')) {
5012                $format = 'incremental';
5013                $action = 'blame_incremental'; # for page title etc
5014        }
5015
5016        # permissions
5017        gitweb_check_feature('blame')
5018                or die_error(403, "Blame view not allowed");
5019
5020        # error checking
5021        die_error(400, "No file name given") unless $file_name;
5022        $hash_base ||= git_get_head_hash($project);
5023        die_error(404, "Couldn't find base commit") unless $hash_base;
5024        my %co = parse_commit($hash_base)
5025                or die_error(404, "Commit not found");
5026        my $ftype = "blob";
5027        if (!defined $hash) {
5028                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
5029                        or die_error(404, "Error looking up file");
5030        } else {
5031                $ftype = git_get_type($hash);
5032                if ($ftype !~ "blob") {
5033                        die_error(400, "Object is not a blob");
5034                }
5035        }
5036
5037        my $fd;
5038        if ($format eq 'incremental') {
5039                # get file contents (as base)
5040                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
5041                        or die_error(500, "Open git-cat-file failed");
5042        } elsif ($format eq 'data') {
5043                # run git-blame --incremental
5044                open $fd, "-|", git_cmd(), "blame", "--incremental",
5045                        $hash_base, "--", $file_name
5046                        or die_error(500, "Open git-blame --incremental failed");
5047        } else {
5048                # run git-blame --porcelain
5049                open $fd, "-|", git_cmd(), "blame", '-p',
5050                        $hash_base, '--', $file_name
5051                        or die_error(500, "Open git-blame --porcelain failed");
5052        }
5053
5054        # incremental blame data returns early
5055        if ($format eq 'data') {
5056                print $cgi->header(
5057                        -type=>"text/plain", -charset => "utf-8",
5058                        -status=> "200 OK");
5059                local $| = 1; # output autoflush
5060                print while <$fd>;
5061                close $fd
5062                        or print "ERROR $!\n";
5063
5064                print 'END';
5065                if (defined $t0 && gitweb_check_feature('timed')) {
5066                        print ' '.
5067                              Time::HiRes::tv_interval($t0, [Time::HiRes::gettimeofday()]).
5068                              ' '.$number_of_git_cmds;
5069                }
5070                print "\n";
5071
5072                return;
5073        }
5074
5075        # page header
5076        git_header_html();
5077        my $formats_nav =
5078                $cgi->a({-href => href(action=>"blob", -replay=>1)},
5079                        "blob") .
5080                " | ";
5081        if ($format eq 'incremental') {
5082                $formats_nav .=
5083                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
5084                                "blame") . " (non-incremental)";
5085        } else {
5086                $formats_nav .=
5087                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
5088                                "blame") . " (incremental)";
5089        }
5090        $formats_nav .=
5091                " | " .
5092                $cgi->a({-href => href(action=>"history", -replay=>1)},
5093                        "history") .
5094                " | " .
5095                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
5096                        "HEAD");
5097        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
5098        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
5099        git_print_page_path($file_name, $ftype, $hash_base);
5100
5101        # page body
5102        if ($format eq 'incremental') {
5103                print "<noscript>\n<div class=\"error\"><center><b>\n".
5104                      "This page requires JavaScript to run.\n Use ".
5105                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
5106                              'this page').
5107                      " instead.\n".
5108                      "</b></center></div>\n</noscript>\n";
5109
5110                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
5111        }
5112
5113        print qq!<div class="page_body">\n!;
5114        print qq!<div id="progress_info">... / ...</div>\n!
5115                if ($format eq 'incremental');
5116        print qq!<table id="blame_table" class="blame" width="100%">\n!.
5117              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
5118              qq!<thead>\n!.
5119              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
5120              qq!</thead>\n!.
5121              qq!<tbody>\n!;
5122
5123        my @rev_color = qw(light dark);
5124        my $num_colors = scalar(@rev_color);
5125        my $current_color = 0;
5126
5127        if ($format eq 'incremental') {
5128                my $color_class = $rev_color[$current_color];
5129
5130                #contents of a file
5131                my $linenr = 0;
5132        LINE:
5133                while (my $line = <$fd>) {
5134                        chomp $line;
5135                        $linenr++;
5136
5137                        print qq!<tr id="l$linenr" class="$color_class">!.
5138                              qq!<td class="sha1"><a href=""> </a></td>!.
5139                              qq!<td class="linenr">!.
5140                              qq!<a class="linenr" href="">$linenr</a></td>!;
5141                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
5142                        print qq!</tr>\n!;
5143                }
5144
5145        } else { # porcelain, i.e. ordinary blame
5146                my %metainfo = (); # saves information about commits
5147
5148                # blame data
5149        LINE:
5150                while (my $line = <$fd>) {
5151                        chomp $line;
5152                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
5153                        # no <lines in group> for subsequent lines in group of lines
5154                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
5155                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
5156                        if (!exists $metainfo{$full_rev}) {
5157                                $metainfo{$full_rev} = { 'nprevious' => 0 };
5158                        }
5159                        my $meta = $metainfo{$full_rev};
5160                        my $data;
5161                        while ($data = <$fd>) {
5162                                chomp $data;
5163                                last if ($data =~ s/^\t//); # contents of line
5164                                if ($data =~ /^(\S+)(?: (.*))?$/) {
5165                                        $meta->{$1} = $2 unless exists $meta->{$1};
5166                                }
5167                                if ($data =~ /^previous /) {
5168                                        $meta->{'nprevious'}++;
5169                                }
5170                        }
5171                        my $short_rev = substr($full_rev, 0, 8);
5172                        my $author = $meta->{'author'};
5173                        my %date =
5174                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
5175                        my $date = $date{'iso-tz'};
5176                        if ($group_size) {
5177                                $current_color = ($current_color + 1) % $num_colors;
5178                        }
5179                        my $tr_class = $rev_color[$current_color];
5180                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
5181                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
5182                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
5183                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
5184                        if ($group_size) {
5185                                print "<td class=\"sha1\"";
5186                                print " title=\"". esc_html($author) . ", $date\"";
5187                                print " rowspan=\"$group_size\"" if ($group_size > 1);
5188                                print ">";
5189                                print $cgi->a({-href => href(action=>"commit",
5190                                                             hash=>$full_rev,
5191                                                             file_name=>$file_name)},
5192                                              esc_html($short_rev));
5193                                if ($group_size >= 2) {
5194                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
5195                                        if (@author_initials) {
5196                                                print "<br />" .
5197                                                      esc_html(join('', @author_initials));
5198                                                #           or join('.', ...)
5199                                        }
5200                                }
5201                                print "</td>\n";
5202                        }
5203                        # 'previous' <sha1 of parent commit> <filename at commit>
5204                        if (exists $meta->{'previous'} &&
5205                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
5206                                $meta->{'parent'} = $1;
5207                                $meta->{'file_parent'} = unquote($2);
5208                        }
5209                        my $linenr_commit =
5210                                exists($meta->{'parent'}) ?
5211                                $meta->{'parent'} : $full_rev;
5212                        my $linenr_filename =
5213                                exists($meta->{'file_parent'}) ?
5214                                $meta->{'file_parent'} : unquote($meta->{'filename'});
5215                        my $blamed = href(action => 'blame',
5216                                          file_name => $linenr_filename,
5217                                          hash_base => $linenr_commit);
5218                        print "<td class=\"linenr\">";
5219                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
5220                                        -class => "linenr" },
5221                                      esc_html($lineno));
5222                        print "</td>";
5223                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
5224                        print "</tr>\n";
5225                } # end while
5226
5227        }
5228
5229        # footer
5230        print "</tbody>\n".
5231              "</table>\n"; # class="blame"
5232        print "</div>\n";   # class="blame_body"
5233        close $fd
5234                or print "Reading blob failed\n";
5235
5236        git_footer_html();
5237}
5238
5239sub git_blame {
5240        git_blame_common();
5241}
5242
5243sub git_blame_incremental {
5244        git_blame_common('incremental');
5245}
5246
5247sub git_blame_data {
5248        git_blame_common('data');
5249}
5250
5251sub git_tags {
5252        my $head = git_get_head_hash($project);
5253        git_header_html();
5254        git_print_page_nav('','', $head,undef,$head);
5255        git_print_header_div('summary', $project);
5256
5257        my @tagslist = git_get_tags_list();
5258        if (@tagslist) {
5259                git_tags_body(\@tagslist);
5260        }
5261        git_footer_html();
5262}
5263
5264sub git_heads {
5265        my $head = git_get_head_hash($project);
5266        git_header_html();
5267        git_print_page_nav('','', $head,undef,$head);
5268        git_print_header_div('summary', $project);
5269
5270        my @headslist = git_get_heads_list();
5271        if (@headslist) {
5272                git_heads_body(\@headslist, $head);
5273        }
5274        git_footer_html();
5275}
5276
5277sub git_blob_plain {
5278        my $type = shift;
5279        my $expires;
5280
5281        if (!defined $hash) {
5282                if (defined $file_name) {
5283                        my $base = $hash_base || git_get_head_hash($project);
5284                        $hash = git_get_hash_by_path($base, $file_name, "blob")
5285                                or die_error(404, "Cannot find file");
5286                } else {
5287                        die_error(400, "No file name defined");
5288                }
5289        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
5290                # blobs defined by non-textual hash id's can be cached
5291                $expires = "+1d";
5292        }
5293
5294        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
5295                or die_error(500, "Open git-cat-file blob '$hash' failed");
5296
5297        # content-type (can include charset)
5298        $type = blob_contenttype($fd, $file_name, $type);
5299
5300        # "save as" filename, even when no $file_name is given
5301        my $save_as = "$hash";
5302        if (defined $file_name) {
5303                $save_as = $file_name;
5304        } elsif ($type =~ m/^text\//) {
5305                $save_as .= '.txt';
5306        }
5307
5308        # With XSS prevention on, blobs of all types except a few known safe
5309        # ones are served with "Content-Disposition: attachment" to make sure
5310        # they don't run in our security domain.  For certain image types,
5311        # blob view writes an <img> tag referring to blob_plain view, and we
5312        # want to be sure not to break that by serving the image as an
5313        # attachment (though Firefox 3 doesn't seem to care).
5314        my $sandbox = $prevent_xss &&
5315                $type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))$!;
5316
5317        print $cgi->header(
5318                -type => $type,
5319                -expires => $expires,
5320                -content_disposition =>
5321                        ($sandbox ? 'attachment' : 'inline')
5322                        . '; filename="' . $save_as . '"');
5323        local $/ = undef;
5324        binmode STDOUT, ':raw';
5325        print <$fd>;
5326        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
5327        close $fd;
5328}
5329
5330sub git_blob {
5331        my $expires;
5332
5333        if (!defined $hash) {
5334                if (defined $file_name) {
5335                        my $base = $hash_base || git_get_head_hash($project);
5336                        $hash = git_get_hash_by_path($base, $file_name, "blob")
5337                                or die_error(404, "Cannot find file");
5338                } else {
5339                        die_error(400, "No file name defined");
5340                }
5341        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
5342                # blobs defined by non-textual hash id's can be cached
5343                $expires = "+1d";
5344        }
5345
5346        my $have_blame = gitweb_check_feature('blame');
5347        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
5348                or die_error(500, "Couldn't cat $file_name, $hash");
5349        my $mimetype = blob_mimetype($fd, $file_name);
5350        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
5351                close $fd;
5352                return git_blob_plain($mimetype);
5353        }
5354        # we can have blame only for text/* mimetype
5355        $have_blame &&= ($mimetype =~ m!^text/!);
5356
5357        git_header_html(undef, $expires);
5358        my $formats_nav = '';
5359        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
5360                if (defined $file_name) {
5361                        if ($have_blame) {
5362                                $formats_nav .=
5363                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
5364                                                "blame") .
5365                                        " | ";
5366                        }
5367                        $formats_nav .=
5368                                $cgi->a({-href => href(action=>"history", -replay=>1)},
5369                                        "history") .
5370                                " | " .
5371                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
5372                                        "raw") .
5373                                " | " .
5374                                $cgi->a({-href => href(action=>"blob",
5375                                                       hash_base=>"HEAD", file_name=>$file_name)},
5376                                        "HEAD");
5377                } else {
5378                        $formats_nav .=
5379                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
5380                                        "raw");
5381                }
5382                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
5383                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
5384        } else {
5385                print "<div class=\"page_nav\">\n" .
5386                      "<br/><br/></div>\n" .
5387                      "<div class=\"title\">$hash</div>\n";
5388        }
5389        git_print_page_path($file_name, "blob", $hash_base);
5390        print "<div class=\"page_body\">\n";
5391        if ($mimetype =~ m!^image/!) {
5392                print qq!<img type="$mimetype"!;
5393                if ($file_name) {
5394                        print qq! alt="$file_name" title="$file_name"!;
5395                }
5396                print qq! src="! .
5397                      href(action=>"blob_plain", hash=>$hash,
5398                           hash_base=>$hash_base, file_name=>$file_name) .
5399                      qq!" />\n!;
5400        } else {
5401                my $nr;
5402                while (my $line = <$fd>) {
5403                        chomp $line;
5404                        $nr++;
5405                        $line = untabify($line);
5406                        printf "<div class=\"pre\"><a id=\"l%i\" href=\"" . href(-replay => 1)
5407                                . "#l%i\" class=\"linenr\">%4i</a> %s</div>\n",
5408                               $nr, $nr, $nr, esc_html($line, -nbsp=>1);
5409                }
5410        }
5411        close $fd
5412                or print "Reading blob failed.\n";
5413        print "</div>";
5414        git_footer_html();
5415}
5416
5417sub git_tree {
5418        if (!defined $hash_base) {
5419                $hash_base = "HEAD";
5420        }
5421        if (!defined $hash) {
5422                if (defined $file_name) {
5423                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
5424                } else {
5425                        $hash = $hash_base;
5426                }
5427        }
5428        die_error(404, "No such tree") unless defined($hash);
5429
5430        my $show_sizes = gitweb_check_feature('show-sizes');
5431        my $have_blame = gitweb_check_feature('blame');
5432
5433        my @entries = ();
5434        {
5435                local $/ = "\0";
5436                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
5437                        ($show_sizes ? '-l' : ()), @extra_options, $hash
5438                        or die_error(500, "Open git-ls-tree failed");
5439                @entries = map { chomp; $_ } <$fd>;
5440                close $fd
5441                        or die_error(404, "Reading tree failed");
5442        }
5443
5444        my $refs = git_get_references();
5445        my $ref = format_ref_marker($refs, $hash_base);
5446        git_header_html();
5447        my $basedir = '';
5448        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
5449                my @views_nav = ();
5450                if (defined $file_name) {
5451                        push @views_nav,
5452                                $cgi->a({-href => href(action=>"history", -replay=>1)},
5453                                        "history"),
5454                                $cgi->a({-href => href(action=>"tree",
5455                                                       hash_base=>"HEAD", file_name=>$file_name)},
5456                                        "HEAD"),
5457                }
5458                my $snapshot_links = format_snapshot_links($hash);
5459                if (defined $snapshot_links) {
5460                        # FIXME: Should be available when we have no hash base as well.
5461                        push @views_nav, $snapshot_links;
5462                }
5463                git_print_page_nav('tree','', $hash_base, undef, undef,
5464                                   join(' | ', @views_nav));
5465                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
5466        } else {
5467                undef $hash_base;
5468                print "<div class=\"page_nav\">\n";
5469                print "<br/><br/></div>\n";
5470                print "<div class=\"title\">$hash</div>\n";
5471        }
5472        if (defined $file_name) {
5473                $basedir = $file_name;
5474                if ($basedir ne '' && substr($basedir, -1) ne '/') {
5475                        $basedir .= '/';
5476                }
5477                git_print_page_path($file_name, 'tree', $hash_base);
5478        }
5479        print "<div class=\"page_body\">\n";
5480        print "<table class=\"tree\">\n";
5481        my $alternate = 1;
5482        # '..' (top directory) link if possible
5483        if (defined $hash_base &&
5484            defined $file_name && $file_name =~ m![^/]+$!) {
5485                if ($alternate) {
5486                        print "<tr class=\"dark\">\n";
5487                } else {
5488                        print "<tr class=\"light\">\n";
5489                }
5490                $alternate ^= 1;
5491
5492                my $up = $file_name;
5493                $up =~ s!/?[^/]+$!!;
5494                undef $up unless $up;
5495                # based on git_print_tree_entry
5496                print '<td class="mode">' . mode_str('040000') . "</td>\n";
5497                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
5498                print '<td class="list">';
5499                print $cgi->a({-href => href(action=>"tree",
5500                                             hash_base=>$hash_base,
5501                                             file_name=>$up)},
5502                              "..");
5503                print "</td>\n";
5504                print "<td class=\"link\"></td>\n";
5505
5506                print "</tr>\n";
5507        }
5508        foreach my $line (@entries) {
5509                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);
5510
5511                if ($alternate) {
5512                        print "<tr class=\"dark\">\n";
5513                } else {
5514                        print "<tr class=\"light\">\n";
5515                }
5516                $alternate ^= 1;
5517
5518                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);
5519
5520                print "</tr>\n";
5521        }
5522        print "</table>\n" .
5523              "</div>";
5524        git_footer_html();
5525}
5526
5527sub snapshot_name {
5528        my ($project, $hash) = @_;
5529
5530        # path/to/project.git  -> project
5531        # path/to/project/.git -> project
5532        my $name = to_utf8($project);
5533        $name =~ s,([^/])/*\.git$,$1,;
5534        $name = basename($name);
5535        # sanitize name
5536        $name =~ s/[[:cntrl:]]/?/g;
5537
5538        my $ver = $hash;
5539        if ($hash =~ /^[0-9a-fA-F]+$/) {
5540                # shorten SHA-1 hash
5541                my $full_hash = git_get_full_hash($project, $hash);
5542                if ($full_hash =~ /^$hash/ && length($hash) > 7) {
5543                        $ver = git_get_short_hash($project, $hash);
5544                }
5545        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
5546                # tags don't need shortened SHA-1 hash
5547                $ver = $1;
5548        } else {
5549                # branches and other need shortened SHA-1 hash
5550                if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!) {
5551                        $ver = $1;
5552                }
5553                $ver .= '-' . git_get_short_hash($project, $hash);
5554        }
5555        # in case of hierarchical branch names
5556        $ver =~ s!/!.!g;
5557
5558        # name = project-version_string
5559        $name = "$name-$ver";
5560
5561        return wantarray ? ($name, $name) : $name;
5562}
5563
5564sub git_snapshot {
5565        my $format = $input_params{'snapshot_format'};
5566        if (!@snapshot_fmts) {
5567                die_error(403, "Snapshots not allowed");
5568        }
5569        # default to first supported snapshot format
5570        $format ||= $snapshot_fmts[0];
5571        if ($format !~ m/^[a-z0-9]+$/) {
5572                die_error(400, "Invalid snapshot format parameter");
5573        } elsif (!exists($known_snapshot_formats{$format})) {
5574                die_error(400, "Unknown snapshot format");
5575        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
5576                die_error(403, "Snapshot format not allowed");
5577        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
5578                die_error(403, "Unsupported snapshot format");
5579        }
5580
5581        my $type = git_get_type("$hash^{}");
5582        if (!$type) {
5583                die_error(404, 'Object does not exist');
5584        }  elsif ($type eq 'blob') {
5585                die_error(400, 'Object is not a tree-ish');
5586        }
5587
5588        my ($name, $prefix) = snapshot_name($project, $hash);
5589        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
5590        my $cmd = quote_command(
5591                git_cmd(), 'archive',
5592                "--format=$known_snapshot_formats{$format}{'format'}",
5593                "--prefix=$prefix/", $hash);
5594        if (exists $known_snapshot_formats{$format}{'compressor'}) {
5595                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
5596        }
5597
5598        $filename =~ s/(["\\])/\\$1/g;
5599        print $cgi->header(
5600                -type => $known_snapshot_formats{$format}{'type'},
5601                -content_disposition => 'inline; filename="' . $filename . '"',
5602                -status => '200 OK');
5603
5604        open my $fd, "-|", $cmd
5605                or die_error(500, "Execute git-archive failed");
5606        binmode STDOUT, ':raw';
5607        print <$fd>;
5608        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
5609        close $fd;
5610}
5611
5612sub git_log_generic {
5613        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;
5614
5615        my $head = git_get_head_hash($project);
5616        if (!defined $base) {
5617                $base = $head;
5618        }
5619        if (!defined $page) {
5620                $page = 0;
5621        }
5622        my $refs = git_get_references();
5623
5624        my $commit_hash = $base;
5625        if (defined $parent) {
5626                $commit_hash = "$parent..$base";
5627        }
5628        my @commitlist =
5629                parse_commits($commit_hash, 101, (100 * $page),
5630                              defined $file_name ? ($file_name, "--full-history") : ());
5631
5632        my $ftype;
5633        if (!defined $file_hash && defined $file_name) {
5634                # some commits could have deleted file in question,
5635                # and not have it in tree, but one of them has to have it
5636                for (my $i = 0; $i < @commitlist; $i++) {
5637                        $file_hash = git_get_hash_by_path($commitlist[$i]{'id'}, $file_name);
5638                        last if defined $file_hash;
5639                }
5640        }
5641        if (defined $file_hash) {
5642                $ftype = git_get_type($file_hash);
5643        }
5644        if (defined $file_name && !defined $ftype) {
5645                die_error(500, "Unknown type of object");
5646        }
5647        my %co;
5648        if (defined $file_name) {
5649                %co = parse_commit($base)
5650                        or die_error(404, "Unknown commit object");
5651        }
5652
5653
5654        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
5655        my $next_link = '';
5656        if ($#commitlist >= 100) {
5657                $next_link =
5658                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
5659                                 -accesskey => "n", -title => "Alt-n"}, "next");
5660        }
5661        my $patch_max = gitweb_get_feature('patches');
5662        if ($patch_max && !defined $file_name) {
5663                if ($patch_max < 0 || @commitlist <= $patch_max) {
5664                        $paging_nav .= " &sdot; " .
5665                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
5666                                        "patches");
5667                }
5668        }
5669
5670        git_header_html();
5671        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
5672        if (defined $file_name) {
5673                git_print_header_div('commit', esc_html($co{'title'}), $base);
5674        } else {
5675                git_print_header_div('summary', $project)
5676        }
5677        git_print_page_path($file_name, $ftype, $hash_base)
5678                if (defined $file_name);
5679
5680        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
5681                     $file_name, $file_hash, $ftype);
5682
5683        git_footer_html();
5684}
5685
5686sub git_log {
5687        git_log_generic('log', \&git_log_body,
5688                        $hash, $hash_parent);
5689}
5690
5691sub git_commit {
5692        $hash ||= $hash_base || "HEAD";
5693        my %co = parse_commit($hash)
5694            or die_error(404, "Unknown commit object");
5695
5696        my $parent  = $co{'parent'};
5697        my $parents = $co{'parents'}; # listref
5698
5699        # we need to prepare $formats_nav before any parameter munging
5700        my $formats_nav;
5701        if (!defined $parent) {
5702                # --root commitdiff
5703                $formats_nav .= '(initial)';
5704        } elsif (@$parents == 1) {
5705                # single parent commit
5706                $formats_nav .=
5707                        '(parent: ' .
5708                        $cgi->a({-href => href(action=>"commit",
5709                                               hash=>$parent)},
5710                                esc_html(substr($parent, 0, 7))) .
5711                        ')';
5712        } else {
5713                # merge commit
5714                $formats_nav .=
5715                        '(merge: ' .
5716                        join(' ', map {
5717                                $cgi->a({-href => href(action=>"commit",
5718                                                       hash=>$_)},
5719                                        esc_html(substr($_, 0, 7)));
5720                        } @$parents ) .
5721                        ')';
5722        }
5723        if (gitweb_check_feature('patches') && @$parents <= 1) {
5724                $formats_nav .= " | " .
5725                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
5726                                "patch");
5727        }
5728
5729        if (!defined $parent) {
5730                $parent = "--root";
5731        }
5732        my @difftree;
5733        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
5734                @diff_opts,
5735                (@$parents <= 1 ? $parent : '-c'),
5736                $hash, "--"
5737                or die_error(500, "Open git-diff-tree failed");
5738        @difftree = map { chomp; $_ } <$fd>;
5739        close $fd or die_error(404, "Reading git-diff-tree failed");
5740
5741        # non-textual hash id's can be cached
5742        my $expires;
5743        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
5744                $expires = "+1d";
5745        }
5746        my $refs = git_get_references();
5747        my $ref = format_ref_marker($refs, $co{'id'});
5748
5749        git_header_html(undef, $expires);
5750        git_print_page_nav('commit', '',
5751                           $hash, $co{'tree'}, $hash,
5752                           $formats_nav);
5753
5754        if (defined $co{'parent'}) {
5755                git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
5756        } else {
5757                git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
5758        }
5759        print "<div class=\"title_text\">\n" .
5760              "<table class=\"object_header\">\n";
5761        git_print_authorship_rows(\%co);
5762        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";
5763        print "<tr>" .
5764              "<td>tree</td>" .
5765              "<td class=\"sha1\">" .
5766              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
5767                       class => "list"}, $co{'tree'}) .
5768              "</td>" .
5769              "<td class=\"link\">" .
5770              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
5771                      "tree");
5772        my $snapshot_links = format_snapshot_links($hash);
5773        if (defined $snapshot_links) {
5774                print " | " . $snapshot_links;
5775        }
5776        print "</td>" .
5777              "</tr>\n";
5778
5779        foreach my $par (@$parents) {
5780                print "<tr>" .
5781                      "<td>parent</td>" .
5782                      "<td class=\"sha1\">" .
5783                      $cgi->a({-href => href(action=>"commit", hash=>$par),
5784                               class => "list"}, $par) .
5785                      "</td>" .
5786                      "<td class=\"link\">" .
5787                      $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit") .
5788                      " | " .
5789                      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
5790                      "</td>" .
5791                      "</tr>\n";
5792        }
5793        print "</table>".
5794              "</div>\n";
5795
5796        print "<div class=\"page_body\">\n";
5797        git_print_log($co{'comment'});
5798        print "</div>\n";
5799
5800        git_difftree_body(\@difftree, $hash, @$parents);
5801
5802        git_footer_html();
5803}
5804
5805sub git_object {
5806        # object is defined by:
5807        # - hash or hash_base alone
5808        # - hash_base and file_name
5809        my $type;
5810
5811        # - hash or hash_base alone
5812        if ($hash || ($hash_base && !defined $file_name)) {
5813                my $object_id = $hash || $hash_base;
5814
5815                open my $fd, "-|", quote_command(
5816                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
5817                        or die_error(404, "Object does not exist");
5818                $type = <$fd>;
5819                chomp $type;
5820                close $fd
5821                        or die_error(404, "Object does not exist");
5822
5823        # - hash_base and file_name
5824        } elsif ($hash_base && defined $file_name) {
5825                $file_name =~ s,/+$,,;
5826
5827                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
5828                        or die_error(404, "Base object does not exist");
5829
5830                # here errors should not hapen
5831                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
5832                        or die_error(500, "Open git-ls-tree failed");
5833                my $line = <$fd>;
5834                close $fd;
5835
5836                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
5837                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
5838                        die_error(404, "File or directory for given base does not exist");
5839                }
5840                $type = $2;
5841                $hash = $3;
5842        } else {
5843                die_error(400, "Not enough information to find object");
5844        }
5845
5846        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
5847                                          hash=>$hash, hash_base=>$hash_base,
5848                                          file_name=>$file_name),
5849                             -status => '302 Found');
5850}
5851
5852sub git_blobdiff {
5853        my $format = shift || 'html';
5854
5855        my $fd;
5856        my @difftree;
5857        my %diffinfo;
5858        my $expires;
5859
5860        # preparing $fd and %diffinfo for git_patchset_body
5861        # new style URI
5862        if (defined $hash_base && defined $hash_parent_base) {
5863                if (defined $file_name) {
5864                        # read raw output
5865                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
5866                                $hash_parent_base, $hash_base,
5867                                "--", (defined $file_parent ? $file_parent : ()), $file_name
5868                                or die_error(500, "Open git-diff-tree failed");
5869                        @difftree = map { chomp; $_ } <$fd>;
5870                        close $fd
5871                                or die_error(404, "Reading git-diff-tree failed");
5872                        @difftree
5873                                or die_error(404, "Blob diff not found");
5874
5875                } elsif (defined $hash &&
5876                         $hash =~ /[0-9a-fA-F]{40}/) {
5877                        # try to find filename from $hash
5878
5879                        # read filtered raw output
5880                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
5881                                $hash_parent_base, $hash_base, "--"
5882                                or die_error(500, "Open git-diff-tree failed");
5883                        @difftree =
5884                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
5885                                # $hash == to_id
5886                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
5887                                map { chomp; $_ } <$fd>;
5888                        close $fd
5889                                or die_error(404, "Reading git-diff-tree failed");
5890                        @difftree
5891                                or die_error(404, "Blob diff not found");
5892
5893                } else {
5894                        die_error(400, "Missing one of the blob diff parameters");
5895                }
5896
5897                if (@difftree > 1) {
5898                        die_error(400, "Ambiguous blob diff specification");
5899                }
5900
5901                %diffinfo = parse_difftree_raw_line($difftree[0]);
5902                $file_parent ||= $diffinfo{'from_file'} || $file_name;
5903                $file_name   ||= $diffinfo{'to_file'};
5904
5905                $hash_parent ||= $diffinfo{'from_id'};
5906                $hash        ||= $diffinfo{'to_id'};
5907
5908                # non-textual hash id's can be cached
5909                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
5910                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
5911                        $expires = '+1d';
5912                }
5913
5914                # open patch output
5915                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
5916                        '-p', ($format eq 'html' ? "--full-index" : ()),
5917                        $hash_parent_base, $hash_base,
5918                        "--", (defined $file_parent ? $file_parent : ()), $file_name
5919                        or die_error(500, "Open git-diff-tree failed");
5920        }
5921
5922        # old/legacy style URI -- not generated anymore since 1.4.3.
5923        if (!%diffinfo) {
5924                die_error('404 Not Found', "Missing one of the blob diff parameters")
5925        }
5926
5927        # header
5928        if ($format eq 'html') {
5929                my $formats_nav =
5930                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
5931                                "raw");
5932                git_header_html(undef, $expires);
5933                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
5934                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
5935                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
5936                } else {
5937                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
5938                        print "<div class=\"title\">$hash vs $hash_parent</div>\n";
5939                }
5940                if (defined $file_name) {
5941                        git_print_page_path($file_name, "blob", $hash_base);
5942                } else {
5943                        print "<div class=\"page_path\"></div>\n";
5944                }
5945
5946        } elsif ($format eq 'plain') {
5947                print $cgi->header(
5948                        -type => 'text/plain',
5949                        -charset => 'utf-8',
5950                        -expires => $expires,
5951                        -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');
5952
5953                print "X-Git-Url: " . $cgi->self_url() . "\n\n";
5954
5955        } else {
5956                die_error(400, "Unknown blobdiff format");
5957        }
5958
5959        # patch
5960        if ($format eq 'html') {
5961                print "<div class=\"page_body\">\n";
5962
5963                git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
5964                close $fd;
5965
5966                print "</div>\n"; # class="page_body"
5967                git_footer_html();
5968
5969        } else {
5970                while (my $line = <$fd>) {
5971                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
5972                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;
5973
5974                        print $line;
5975
5976                        last if $line =~ m!^\+\+\+!;
5977                }
5978                local $/ = undef;
5979                print <$fd>;
5980                close $fd;
5981        }
5982}
5983
5984sub git_blobdiff_plain {
5985        git_blobdiff('plain');
5986}
5987
5988sub git_commitdiff {
5989        my %params = @_;
5990        my $format = $params{-format} || 'html';
5991
5992        my ($patch_max) = gitweb_get_feature('patches');
5993        if ($format eq 'patch') {
5994                die_error(403, "Patch view not allowed") unless $patch_max;
5995        }
5996
5997        $hash ||= $hash_base || "HEAD";
5998        my %co = parse_commit($hash)
5999            or die_error(404, "Unknown commit object");
6000
6001        # choose format for commitdiff for merge
6002        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
6003                $hash_parent = '--cc';
6004        }
6005        # we need to prepare $formats_nav before almost any parameter munging
6006        my $formats_nav;
6007        if ($format eq 'html') {
6008                $formats_nav =
6009                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
6010                                "raw");
6011                if ($patch_max && @{$co{'parents'}} <= 1) {
6012                        $formats_nav .= " | " .
6013                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
6014                                        "patch");
6015                }
6016
6017                if (defined $hash_parent &&
6018                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
6019                        # commitdiff with two commits given
6020                        my $hash_parent_short = $hash_parent;
6021                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
6022                                $hash_parent_short = substr($hash_parent, 0, 7);
6023                        }
6024                        $formats_nav .=
6025                                ' (from';
6026                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
6027                                if ($co{'parents'}[$i] eq $hash_parent) {
6028                                        $formats_nav .= ' parent ' . ($i+1);
6029                                        last;
6030                                }
6031                        }
6032                        $formats_nav .= ': ' .
6033                                $cgi->a({-href => href(action=>"commitdiff",
6034                                                       hash=>$hash_parent)},
6035                                        esc_html($hash_parent_short)) .
6036                                ')';
6037                } elsif (!$co{'parent'}) {
6038                        # --root commitdiff
6039                        $formats_nav .= ' (initial)';
6040                } elsif (scalar @{$co{'parents'}} == 1) {
6041                        # single parent commit
6042                        $formats_nav .=
6043                                ' (parent: ' .
6044                                $cgi->a({-href => href(action=>"commitdiff",
6045                                                       hash=>$co{'parent'})},
6046                                        esc_html(substr($co{'parent'}, 0, 7))) .
6047                                ')';
6048                } else {
6049                        # merge commit
6050                        if ($hash_parent eq '--cc') {
6051                                $formats_nav .= ' | ' .
6052                                        $cgi->a({-href => href(action=>"commitdiff",
6053                                                               hash=>$hash, hash_parent=>'-c')},
6054                                                'combined');
6055                        } else { # $hash_parent eq '-c'
6056                                $formats_nav .= ' | ' .
6057                                        $cgi->a({-href => href(action=>"commitdiff",
6058                                                               hash=>$hash, hash_parent=>'--cc')},
6059                                                'compact');
6060                        }
6061                        $formats_nav .=
6062                                ' (merge: ' .
6063                                join(' ', map {
6064                                        $cgi->a({-href => href(action=>"commitdiff",
6065                                                               hash=>$_)},
6066                                                esc_html(substr($_, 0, 7)));
6067                                } @{$co{'parents'}} ) .
6068                                ')';
6069                }
6070        }
6071
6072        my $hash_parent_param = $hash_parent;
6073        if (!defined $hash_parent_param) {
6074                # --cc for multiple parents, --root for parentless
6075                $hash_parent_param =
6076                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
6077        }
6078
6079        # read commitdiff
6080        my $fd;
6081        my @difftree;
6082        if ($format eq 'html') {
6083                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
6084                        "--no-commit-id", "--patch-with-raw", "--full-index",
6085                        $hash_parent_param, $hash, "--"
6086                        or die_error(500, "Open git-diff-tree failed");
6087
6088                while (my $line = <$fd>) {
6089                        chomp $line;
6090                        # empty line ends raw part of diff-tree output
6091                        last unless $line;
6092                        push @difftree, scalar parse_difftree_raw_line($line);
6093                }
6094
6095        } elsif ($format eq 'plain') {
6096                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
6097                        '-p', $hash_parent_param, $hash, "--"
6098                        or die_error(500, "Open git-diff-tree failed");
6099        } elsif ($format eq 'patch') {
6100                # For commit ranges, we limit the output to the number of
6101                # patches specified in the 'patches' feature.
6102                # For single commits, we limit the output to a single patch,
6103                # diverging from the git-format-patch default.
6104                my @commit_spec = ();
6105                if ($hash_parent) {
6106                        if ($patch_max > 0) {
6107                                push @commit_spec, "-$patch_max";
6108                        }
6109                        push @commit_spec, '-n', "$hash_parent..$hash";
6110                } else {
6111                        if ($params{-single}) {
6112                                push @commit_spec, '-1';
6113                        } else {
6114                                if ($patch_max > 0) {
6115                                        push @commit_spec, "-$patch_max";
6116                                }
6117                                push @commit_spec, "-n";
6118                        }
6119                        push @commit_spec, '--root', $hash;
6120                }
6121                open $fd, "-|", git_cmd(), "format-patch", '--encoding=utf8',
6122                        '--stdout', @commit_spec
6123                        or die_error(500, "Open git-format-patch failed");
6124        } else {
6125                die_error(400, "Unknown commitdiff format");
6126        }
6127
6128        # non-textual hash id's can be cached
6129        my $expires;
6130        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
6131                $expires = "+1d";
6132        }
6133
6134        # write commit message
6135        if ($format eq 'html') {
6136                my $refs = git_get_references();
6137                my $ref = format_ref_marker($refs, $co{'id'});
6138
6139                git_header_html(undef, $expires);
6140                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
6141                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
6142                print "<div class=\"title_text\">\n" .
6143                      "<table class=\"object_header\">\n";
6144                git_print_authorship_rows(\%co);
6145                print "</table>".
6146                      "</div>\n";
6147                print "<div class=\"page_body\">\n";
6148                if (@{$co{'comment'}} > 1) {
6149                        print "<div class=\"log\">\n";
6150                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
6151                        print "</div>\n"; # class="log"
6152                }
6153
6154        } elsif ($format eq 'plain') {
6155                my $refs = git_get_references("tags");
6156                my $tagname = git_get_rev_name_tags($hash);
6157                my $filename = basename($project) . "-$hash.patch";
6158
6159                print $cgi->header(
6160                        -type => 'text/plain',
6161                        -charset => 'utf-8',
6162                        -expires => $expires,
6163                        -content_disposition => 'inline; filename="' . "$filename" . '"');
6164                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
6165                print "From: " . to_utf8($co{'author'}) . "\n";
6166                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
6167                print "Subject: " . to_utf8($co{'title'}) . "\n";
6168
6169                print "X-Git-Tag: $tagname\n" if $tagname;
6170                print "X-Git-Url: " . $cgi->self_url() . "\n\n";
6171
6172                foreach my $line (@{$co{'comment'}}) {
6173                        print to_utf8($line) . "\n";
6174                }
6175                print "---\n\n";
6176        } elsif ($format eq 'patch') {
6177                my $filename = basename($project) . "-$hash.patch";
6178
6179                print $cgi->header(
6180                        -type => 'text/plain',
6181                        -charset => 'utf-8',
6182                        -expires => $expires,
6183                        -content_disposition => 'inline; filename="' . "$filename" . '"');
6184        }
6185
6186        # write patch
6187        if ($format eq 'html') {
6188                my $use_parents = !defined $hash_parent ||
6189                        $hash_parent eq '-c' || $hash_parent eq '--cc';
6190                git_difftree_body(\@difftree, $hash,
6191                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
6192                print "<br/>\n";
6193
6194                git_patchset_body($fd, \@difftree, $hash,
6195                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
6196                close $fd;
6197                print "</div>\n"; # class="page_body"
6198                git_footer_html();
6199
6200        } elsif ($format eq 'plain') {
6201                local $/ = undef;
6202                print <$fd>;
6203                close $fd
6204                        or print "Reading git-diff-tree failed\n";
6205        } elsif ($format eq 'patch') {
6206                local $/ = undef;
6207                print <$fd>;
6208                close $fd
6209                        or print "Reading git-format-patch failed\n";
6210        }
6211}
6212
6213sub git_commitdiff_plain {
6214        git_commitdiff(-format => 'plain');
6215}
6216
6217# format-patch-style patches
6218sub git_patch {
6219        git_commitdiff(-format => 'patch', -single => 1);
6220}
6221
6222sub git_patches {
6223        git_commitdiff(-format => 'patch');
6224}
6225
6226sub git_history {
6227        git_log_generic('history', \&git_history_body,
6228                        $hash_base, $hash_parent_base,
6229                        $file_name, $hash);
6230}
6231
6232sub git_search {
6233        gitweb_check_feature('search') or die_error(403, "Search is disabled");
6234        if (!defined $searchtext) {
6235                die_error(400, "Text field is empty");
6236        }
6237        if (!defined $hash) {
6238                $hash = git_get_head_hash($project);
6239        }
6240        my %co = parse_commit($hash);
6241        if (!%co) {
6242                die_error(404, "Unknown commit object");
6243        }
6244        if (!defined $page) {
6245                $page = 0;
6246        }
6247
6248        $searchtype ||= 'commit';
6249        if ($searchtype eq 'pickaxe') {
6250                # pickaxe may take all resources of your box and run for several minutes
6251                # with every query - so decide by yourself how public you make this feature
6252                gitweb_check_feature('pickaxe')
6253                    or die_error(403, "Pickaxe is disabled");
6254        }
6255        if ($searchtype eq 'grep') {
6256                gitweb_check_feature('grep')
6257                    or die_error(403, "Grep is disabled");
6258        }
6259
6260        git_header_html();
6261
6262        if ($searchtype eq 'commit' or $searchtype eq 'author' or $searchtype eq 'committer') {
6263                my $greptype;
6264                if ($searchtype eq 'commit') {
6265                        $greptype = "--grep=";
6266                } elsif ($searchtype eq 'author') {
6267                        $greptype = "--author=";
6268                } elsif ($searchtype eq 'committer') {
6269                        $greptype = "--committer=";
6270                }
6271                $greptype .= $searchtext;
6272                my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
6273                                               $greptype, '--regexp-ignore-case',
6274                                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');
6275
6276                my $paging_nav = '';
6277                if ($page > 0) {
6278                        $paging_nav .=
6279                                $cgi->a({-href => href(action=>"search", hash=>$hash,
6280                                                       searchtext=>$searchtext,
6281                                                       searchtype=>$searchtype)},
6282                                        "first");
6283                        $paging_nav .= " &sdot; " .
6284                                $cgi->a({-href => href(-replay=>1, page=>$page-1),
6285                                         -accesskey => "p", -title => "Alt-p"}, "prev");
6286                } else {
6287                        $paging_nav .= "first";
6288                        $paging_nav .= " &sdot; prev";
6289                }
6290                my $next_link = '';
6291                if ($#commitlist >= 100) {
6292                        $next_link =
6293                                $cgi->a({-href => href(-replay=>1, page=>$page+1),
6294                                         -accesskey => "n", -title => "Alt-n"}, "next");
6295                        $paging_nav .= " &sdot; $next_link";
6296                } else {
6297                        $paging_nav .= " &sdot; next";
6298                }
6299
6300                if ($#commitlist >= 100) {
6301                }
6302
6303                git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
6304                git_print_header_div('commit', esc_html($co{'title'}), $hash);
6305                git_search_grep_body(\@commitlist, 0, 99, $next_link);
6306        }
6307
6308        if ($searchtype eq 'pickaxe') {
6309                git_print_page_nav('','', $hash,$co{'tree'},$hash);
6310                git_print_header_div('commit', esc_html($co{'title'}), $hash);
6311
6312                print "<table class=\"pickaxe search\">\n";
6313                my $alternate = 1;
6314                local $/ = "\n";
6315                open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
6316                        '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
6317                        ($search_use_regexp ? '--pickaxe-regex' : ());
6318                undef %co;
6319                my @files;
6320                while (my $line = <$fd>) {
6321                        chomp $line;
6322                        next unless $line;
6323
6324                        my %set = parse_difftree_raw_line($line);
6325                        if (defined $set{'commit'}) {
6326                                # finish previous commit
6327                                if (%co) {
6328                                        print "</td>\n" .
6329                                              "<td class=\"link\">" .
6330                                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
6331                                              " | " .
6332                                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
6333                                        print "</td>\n" .
6334                                              "</tr>\n";
6335                                }
6336
6337                                if ($alternate) {
6338                                        print "<tr class=\"dark\">\n";
6339                                } else {
6340                                        print "<tr class=\"light\">\n";
6341                                }
6342                                $alternate ^= 1;
6343                                %co = parse_commit($set{'commit'});
6344                                my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
6345                                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
6346                                      "<td><i>$author</i></td>\n" .
6347                                      "<td>" .
6348                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
6349                                              -class => "list subject"},
6350                                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
6351                        } elsif (defined $set{'to_id'}) {
6352                                next if ($set{'to_id'} =~ m/^0{40}$/);
6353
6354                                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
6355                                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
6356                                              -class => "list"},
6357                                              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
6358                                      "<br/>\n";
6359                        }
6360                }
6361                close $fd;
6362
6363                # finish last commit (warning: repetition!)
6364                if (%co) {
6365                        print "</td>\n" .
6366                              "<td class=\"link\">" .
6367                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
6368                              " | " .
6369                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
6370                        print "</td>\n" .
6371                              "</tr>\n";
6372                }
6373
6374                print "</table>\n";
6375        }
6376
6377        if ($searchtype eq 'grep') {
6378                git_print_page_nav('','', $hash,$co{'tree'},$hash);
6379                git_print_header_div('commit', esc_html($co{'title'}), $hash);
6380
6381                print "<table class=\"grep_search\">\n";
6382                my $alternate = 1;
6383                my $matches = 0;
6384                local $/ = "\n";
6385                open my $fd, "-|", git_cmd(), 'grep', '-n',
6386                        $search_use_regexp ? ('-E', '-i') : '-F',
6387                        $searchtext, $co{'tree'};
6388                my $lastfile = '';
6389                while (my $line = <$fd>) {
6390                        chomp $line;
6391                        my ($file, $lno, $ltext, $binary);
6392                        last if ($matches++ > 1000);
6393                        if ($line =~ /^Binary file (.+) matches$/) {
6394                                $file = $1;
6395                                $binary = 1;
6396                        } else {
6397                                (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
6398                        }
6399                        if ($file ne $lastfile) {
6400                                $lastfile and print "</td></tr>\n";
6401                                if ($alternate++) {
6402                                        print "<tr class=\"dark\">\n";
6403                                } else {
6404                                        print "<tr class=\"light\">\n";
6405                                }
6406                                print "<td class=\"list\">".
6407                                        $cgi->a({-href => href(action=>"blob", hash=>$co{'hash'},
6408                                                               file_name=>"$file"),
6409                                                -class => "list"}, esc_path($file));
6410                                print "</td><td>\n";
6411                                $lastfile = $file;
6412                        }
6413                        if ($binary) {
6414                                print "<div class=\"binary\">Binary file</div>\n";
6415                        } else {
6416                                $ltext = untabify($ltext);
6417                                if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
6418                                        $ltext = esc_html($1, -nbsp=>1);
6419                                        $ltext .= '<span class="match">';
6420                                        $ltext .= esc_html($2, -nbsp=>1);
6421                                        $ltext .= '</span>';
6422                                        $ltext .= esc_html($3, -nbsp=>1);
6423                                } else {
6424                                        $ltext = esc_html($ltext, -nbsp=>1);
6425                                }
6426                                print "<div class=\"pre\">" .
6427                                        $cgi->a({-href => href(action=>"blob", hash=>$co{'hash'},
6428                                                               file_name=>"$file").'#l'.$lno,
6429                                                -class => "linenr"}, sprintf('%4i', $lno))
6430                                        . ' ' .  $ltext . "</div>\n";
6431                        }
6432                }
6433                if ($lastfile) {
6434                        print "</td></tr>\n";
6435                        if ($matches > 1000) {
6436                                print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
6437                        }
6438                } else {
6439                        print "<div class=\"diff nodifferences\">No matches found</div>\n";
6440                }
6441                close $fd;
6442
6443                print "</table>\n";
6444        }
6445        git_footer_html();
6446}
6447
6448sub git_search_help {
6449        git_header_html();
6450        git_print_page_nav('','', $hash,$hash,$hash);
6451        print <<EOT;
6452<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
6453regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
6454the pattern entered is recognized as the POSIX extended
6455<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
6456insensitive).</p>
6457<dl>
6458<dt><b>commit</b></dt>
6459<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
6460EOT
6461        my $have_grep = gitweb_check_feature('grep');
6462        if ($have_grep) {
6463                print <<EOT;
6464<dt><b>grep</b></dt>
6465<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
6466    a different one) are searched for the given pattern. On large trees, this search can take
6467a while and put some strain on the server, so please use it with some consideration. Note that
6468due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
6469case-sensitive.</dd>
6470EOT
6471        }
6472        print <<EOT;
6473<dt><b>author</b></dt>
6474<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
6475<dt><b>committer</b></dt>
6476<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
6477EOT
6478        my $have_pickaxe = gitweb_check_feature('pickaxe');
6479        if ($have_pickaxe) {
6480                print <<EOT;
6481<dt><b>pickaxe</b></dt>
6482<dd>All commits that caused the string to appear or disappear from any file (changes that
6483added, removed or "modified" the string) will be listed. This search can take a while and
6484takes a lot of strain on the server, so please use it wisely. Note that since you may be
6485interested even in changes just changing the case as well, this search is case sensitive.</dd>
6486EOT
6487        }
6488        print "</dl>\n";
6489        git_footer_html();
6490}
6491
6492sub git_shortlog {
6493        git_log_generic('shortlog', \&git_shortlog_body,
6494                        $hash, $hash_parent);
6495}
6496
6497## ......................................................................
6498## feeds (RSS, Atom; OPML)
6499
6500sub git_feed {
6501        my $format = shift || 'atom';
6502        my $have_blame = gitweb_check_feature('blame');
6503
6504        # Atom: http://www.atomenabled.org/developers/syndication/
6505        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
6506        if ($format ne 'rss' && $format ne 'atom') {
6507                die_error(400, "Unknown web feed format");
6508        }
6509
6510        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
6511        my $head = $hash || 'HEAD';
6512        my @commitlist = parse_commits($head, 150, 0, $file_name);
6513
6514        my %latest_commit;
6515        my %latest_date;
6516        my $content_type = "application/$format+xml";
6517        if (defined $cgi->http('HTTP_ACCEPT') &&
6518                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
6519                # browser (feed reader) prefers text/xml
6520                $content_type = 'text/xml';
6521        }
6522        if (defined($commitlist[0])) {
6523                %latest_commit = %{$commitlist[0]};
6524                my $latest_epoch = $latest_commit{'committer_epoch'};
6525                %latest_date   = parse_date($latest_epoch);
6526                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
6527                if (defined $if_modified) {
6528                        my $since;
6529                        if (eval { require HTTP::Date; 1; }) {
6530                                $since = HTTP::Date::str2time($if_modified);
6531                        } elsif (eval { require Time::ParseDate; 1; }) {
6532                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
6533                        }
6534                        if (defined $since && $latest_epoch <= $since) {
6535                                print $cgi->header(
6536                                        -type => $content_type,
6537                                        -charset => 'utf-8',
6538                                        -last_modified => $latest_date{'rfc2822'},
6539                                        -status => '304 Not Modified');
6540                                return;
6541                        }
6542                }
6543                print $cgi->header(
6544                        -type => $content_type,
6545                        -charset => 'utf-8',
6546                        -last_modified => $latest_date{'rfc2822'});
6547        } else {
6548                print $cgi->header(
6549                        -type => $content_type,
6550                        -charset => 'utf-8');
6551        }
6552
6553        # Optimization: skip generating the body if client asks only
6554        # for Last-Modified date.
6555        return if ($cgi->request_method() eq 'HEAD');
6556
6557        # header variables
6558        my $title = "$site_name - $project/$action";
6559        my $feed_type = 'log';
6560        if (defined $hash) {
6561                $title .= " - '$hash'";
6562                $feed_type = 'branch log';
6563                if (defined $file_name) {
6564                        $title .= " :: $file_name";
6565                        $feed_type = 'history';
6566                }
6567        } elsif (defined $file_name) {
6568                $title .= " - $file_name";
6569                $feed_type = 'history';
6570        }
6571        $title .= " $feed_type";
6572        my $descr = git_get_project_description($project);
6573        if (defined $descr) {
6574                $descr = esc_html($descr);
6575        } else {
6576                $descr = "$project " .
6577                         ($format eq 'rss' ? 'RSS' : 'Atom') .
6578                         " feed";
6579        }
6580        my $owner = git_get_project_owner($project);
6581        $owner = esc_html($owner);
6582
6583        #header
6584        my $alt_url;
6585        if (defined $file_name) {
6586                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
6587        } elsif (defined $hash) {
6588                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
6589        } else {
6590                $alt_url = href(-full=>1, action=>"summary");
6591        }
6592        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
6593        if ($format eq 'rss') {
6594                print <<XML;
6595<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
6596<channel>
6597XML
6598                print "<title>$title</title>\n" .
6599                      "<link>$alt_url</link>\n" .
6600                      "<description>$descr</description>\n" .
6601                      "<language>en</language>\n" .
6602                      # project owner is responsible for 'editorial' content
6603                      "<managingEditor>$owner</managingEditor>\n";
6604                if (defined $logo || defined $favicon) {
6605                        # prefer the logo to the favicon, since RSS
6606                        # doesn't allow both
6607                        my $img = esc_url($logo || $favicon);
6608                        print "<image>\n" .
6609                              "<url>$img</url>\n" .
6610                              "<title>$title</title>\n" .
6611                              "<link>$alt_url</link>\n" .
6612                              "</image>\n";
6613                }
6614                if (%latest_date) {
6615                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
6616                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
6617                }
6618                print "<generator>gitweb v.$version/$git_version</generator>\n";
6619        } elsif ($format eq 'atom') {
6620                print <<XML;
6621<feed xmlns="http://www.w3.org/2005/Atom">
6622XML
6623                print "<title>$title</title>\n" .
6624                      "<subtitle>$descr</subtitle>\n" .
6625                      '<link rel="alternate" type="text/html" href="' .
6626                      $alt_url . '" />' . "\n" .
6627                      '<link rel="self" type="' . $content_type . '" href="' .
6628                      $cgi->self_url() . '" />' . "\n" .
6629                      "<id>" . href(-full=>1) . "</id>\n" .
6630                      # use project owner for feed author
6631                      "<author><name>$owner</name></author>\n";
6632                if (defined $favicon) {
6633                        print "<icon>" . esc_url($favicon) . "</icon>\n";
6634                }
6635                if (defined $logo_url) {
6636                        # not twice as wide as tall: 72 x 27 pixels
6637                        print "<logo>" . esc_url($logo) . "</logo>\n";
6638                }
6639                if (! %latest_date) {
6640                        # dummy date to keep the feed valid until commits trickle in:
6641                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
6642                } else {
6643                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
6644                }
6645                print "<generator version='$version/$git_version'>gitweb</generator>\n";
6646        }
6647
6648        # contents
6649        for (my $i = 0; $i <= $#commitlist; $i++) {
6650                my %co = %{$commitlist[$i]};
6651                my $commit = $co{'id'};
6652                # we read 150, we always show 30 and the ones more recent than 48 hours
6653                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
6654                        last;
6655                }
6656                my %cd = parse_date($co{'author_epoch'});
6657
6658                # get list of changed files
6659                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
6660                        $co{'parent'} || "--root",
6661                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
6662                        or next;
6663                my @difftree = map { chomp; $_ } <$fd>;
6664                close $fd
6665                        or next;
6666
6667                # print element (entry, item)
6668                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
6669                if ($format eq 'rss') {
6670                        print "<item>\n" .
6671                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
6672                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
6673                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
6674                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
6675                              "<link>$co_url</link>\n" .
6676                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
6677                              "<content:encoded>" .
6678                              "<![CDATA[\n";
6679                } elsif ($format eq 'atom') {
6680                        print "<entry>\n" .
6681                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
6682                              "<updated>$cd{'iso-8601'}</updated>\n" .
6683                              "<author>\n" .
6684                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
6685                        if ($co{'author_email'}) {
6686                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
6687                        }
6688                        print "</author>\n" .
6689                              # use committer for contributor
6690                              "<contributor>\n" .
6691                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
6692                        if ($co{'committer_email'}) {
6693                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
6694                        }
6695                        print "</contributor>\n" .
6696                              "<published>$cd{'iso-8601'}</published>\n" .
6697                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
6698                              "<id>$co_url</id>\n" .
6699                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
6700                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
6701                }
6702                my $comment = $co{'comment'};
6703                print "<pre>\n";
6704                foreach my $line (@$comment) {
6705                        $line = esc_html($line);
6706                        print "$line\n";
6707                }
6708                print "</pre><ul>\n";
6709                foreach my $difftree_line (@difftree) {
6710                        my %difftree = parse_difftree_raw_line($difftree_line);
6711                        next if !$difftree{'from_id'};
6712
6713                        my $file = $difftree{'file'} || $difftree{'to_file'};
6714
6715                        print "<li>" .
6716                              "[" .
6717                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
6718                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
6719                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
6720                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
6721                                      -title => "diff"}, 'D');
6722                        if ($have_blame) {
6723                                print $cgi->a({-href => href(-full=>1, action=>"blame",
6724                                                             file_name=>$file, hash_base=>$commit),
6725                                              -title => "blame"}, 'B');
6726                        }
6727                        # if this is not a feed of a file history
6728                        if (!defined $file_name || $file_name ne $file) {
6729                                print $cgi->a({-href => href(-full=>1, action=>"history",
6730                                                             file_name=>$file, hash=>$commit),
6731                                              -title => "history"}, 'H');
6732                        }
6733                        $file = esc_path($file);
6734                        print "] ".
6735                              "$file</li>\n";
6736                }
6737                if ($format eq 'rss') {
6738                        print "</ul>]]>\n" .
6739                              "</content:encoded>\n" .
6740                              "</item>\n";
6741                } elsif ($format eq 'atom') {
6742                        print "</ul>\n</div>\n" .
6743                              "</content>\n" .
6744                              "</entry>\n";
6745                }
6746        }
6747
6748        # end of feed
6749        if ($format eq 'rss') {
6750                print "</channel>\n</rss>\n";
6751        } elsif ($format eq 'atom') {
6752                print "</feed>\n";
6753        }
6754}
6755
6756sub git_rss {
6757        git_feed('rss');
6758}
6759
6760sub git_atom {
6761        git_feed('atom');
6762}
6763
6764sub git_opml {
6765        my @list = git_get_projects_list();
6766
6767        print $cgi->header(
6768                -type => 'text/xml',
6769                -charset => 'utf-8',
6770                -content_disposition => 'inline; filename="opml.xml"');
6771
6772        print <<XML;
6773<?xml version="1.0" encoding="utf-8"?>
6774<opml version="1.0">
6775<head>
6776  <title>$site_name OPML Export</title>
6777</head>
6778<body>
6779<outline text="git RSS feeds">
6780XML
6781
6782        foreach my $pr (@list) {
6783                my %proj = %$pr;
6784                my $head = git_get_head_hash($proj{'path'});
6785                if (!defined $head) {
6786                        next;
6787                }
6788                $git_dir = "$projectroot/$proj{'path'}";
6789                my %co = parse_commit($head);
6790                if (!%co) {
6791                        next;
6792                }
6793
6794                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
6795                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
6796                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
6797                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
6798        }
6799        print <<XML;
6800</outline>
6801</body>
6802</opml>
6803XML
6804}