gitweb / gitweb.perlon commit glossary: clarify description of HEAD (67393c5)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8'; # write STDOUT through the ':utf8' output layer
  22
    # Start-of-run timestamp and a running count of git commands; the counter
    # is incremented by evaluate_git_version() further down in this file.
    # NOTE(review): presumably both are reported by the 'timed' feature -- confirm.
  23our $t0 = [ gettimeofday() ];
  24our $number_of_git_cmds = 0;
  25
    # When the MOD_PERL environment variable is set, call CGI->compile() from a
    # BEGIN block, i.e. at compile time, before any of the code below runs.
  26BEGIN {
  27        CGI->compile() if $ENV{'MOD_PERL'};
  28}
  29
    # gitweb version string.
    # NOTE(review): "++GIT_VERSION++" looks like a placeholder that is filled in
    # when gitweb is built -- confirm against the build script.
  30our $version = "++GIT_VERSION++";
  31
  our ($my_url, $my_uri, $base_url, $path_info, $home_link);

  # Work out the URLs gitweb uses to refer to itself for the current request.
  #
  # Takes no arguments.  Reads the global $cgi object and the PATH_INFO and
  # SCRIPT_NAME environment variables, and sets these package globals:
  #   $my_url    - full URL of the script, with PATH_INFO stripped
  #   $my_uri    - absolute path part of that URL, with PATH_INFO stripped
  #   $base_url  - base for relative URLs ($logo, $favicon, ...)
  #   $path_info - copy of $ENV{PATH_INFO}
  #   $home_link - target of the home link on top of all pages
  sub evaluate_uri {
          our $cgi;

          our $my_url = $cgi->url();
          our $my_uri = $cgi->url(-absolute => 1);

          # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
          # needed and used only for URLs with nonempty PATH_INFO
          our $base_url = $my_url;

          # When the script is used as DirectoryIndex, the URL does not contain the name
          # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
          # have to do it ourselves. We make $path_info global because it's also used
          # later on.
          #
          # Another issue with the script being the DirectoryIndex is that the resulting
          # $my_url data is not the full script URL: this is good, because we want
          # generated links to keep implying the script name if it wasn't explicitly
          # indicated in the URL we're handling, but it means that $my_url cannot be used
          # as base URL.
          # Therefore, if we needed to strip PATH_INFO, then we know that we have
          # to build the base URL ourselves:
          our $path_info = $ENV{"PATH_INFO"};
          if ($path_info) {
                  # $path_info has already been URL-decoded by the web server, but
                  # $my_url and $my_uri have not.  URL-decode them first, otherwise
                  # a path containing characters that are escaped in the URL (e.g.
                  # a space sent as "%20") never matches and is not stripped.
                  $my_url = unescape($my_url);
                  $my_uri = unescape($my_uri);
                  if ($my_url =~ s,\Q$path_info\E$,, &&
                      $my_uri =~ s,\Q$path_info\E$,, &&
                      defined $ENV{'SCRIPT_NAME'}) {
                          $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                  }
          }

          # target of the home link on top of all pages
          our $home_link = $my_uri || "/";
  }
  67
  68# core git executable to use
  69# this can just be "git" if your webserver has a sensible PATH
    # NOTE(review): the "++NAME++" tokens used throughout this section look like
    # placeholders that are substituted when gitweb is built -- confirm against
    # the build script before editing them by hand.
  70our $GIT = "++GIT_BINDIR++/git";
  71
  72# absolute fs-path which will be prepended to the project path
  73#our $projectroot = "/pub/scm";
  74our $projectroot = "++GITWEB_PROJECTROOT++";
  75
  76# fs traversing limit for getting project list
  77# the number is relative to the projectroot
  78our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  79
  80# string of the home link on top of all pages
  81our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  82
  83# name of your site or organization to appear in page titles
  84# replace this with something more descriptive for clearer bookmarks
    # (when the configured name is an empty string this falls back to
    # "<SERVER_NAME> Git", or to "Untitled Git" if $ENV{'SERVER_NAME'} is
    # unset or empty)
  85our $site_name = "++GITWEB_SITENAME++"
  86                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  87
  88# filename of html text to include at top of each page
  89our $site_header = "++GITWEB_SITE_HEADER++";
  90# html text to include at home page
  91our $home_text = "++GITWEB_HOMETEXT++";
  92# filename of html text to include at bottom of each page
  93our $site_footer = "++GITWEB_SITE_FOOTER++";
  94
  95# URI of stylesheets
  96our @stylesheets = ("++GITWEB_CSS++");
  97# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
    # Left undefined here; only a config file gives it a value.
    # NOTE(review): how it interacts with @stylesheets is decided where the
    # page header is printed (not in this part of the file) -- confirm there.
  98our $stylesheet = undef;
  99# URI of GIT logo (72x27 size)
 100our $logo = "++GITWEB_LOGO++";
 101# URI of GIT favicon, assumed to be image/png type
 102our $favicon = "++GITWEB_FAVICON++";
 103# URI of gitweb.js (JavaScript code for gitweb)
 104our $javascript = "++GITWEB_JS++";
 105
 106# URI and label (title) of GIT logo link
    # (the two commented-out lines are an alternative target kept for reference)
 107#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 108#our $logo_label = "git documentation";
 109our $logo_url = "http://git-scm.com/";
 110our $logo_label = "git homepage";
 111
 112# source of projects list
 113our $projects_list = "++GITWEB_LIST++";
 114
 115# the width (in characters) of the projects list "Description" column
 116our $projects_list_description_width = 25;
 117
 118# default order of projects list
 119# valid values are none, project, descr, owner, and age
 120our $default_projects_order = "project";
 121
 122# show repository only if this file exists
 123# (only effective if this variable evaluates to true)
    # check_export_ok() below tests for the file "$dir/$export_ok" inside the
    # repository directory it is given.
 124our $export_ok = "++GITWEB_EXPORT_OK++";
 125
 126# show repository only if this subroutine returns true
 127# when given the path to the project, for example:
 128#    sub { return -e "$_[0]/git-daemon-export-ok"; }
    # check_export_ok() below skips this check while the variable is false
    # (the default, undef).
 129our $export_auth_hook = undef;
 130
 131# only allow viewing of repositories also shown on the overview page
 132our $strict_export = "++GITWEB_STRICT_EXPORT++";
 133
 134# list of git base URLs used for URL to where fetch project from,
 135# i.e. full URL is "$git_base_url/$project"
    # (the grep drops an empty entry, so an empty configured value yields an
    # empty list rather than a list holding one empty string)
 136our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 137
 138# default blob_plain mimetype and default charset for text/plain blob
 139our $default_blob_plain_mimetype = 'text/plain';
 140our $default_text_plain_charset  = undef;
 141
 142# file to use for guessing MIME types before trying /etc/mime.types
 143# (relative to the current git repository)
 144our $mimetypes_file = undef;
 145
 146# assume this charset if line contains non-UTF-8 characters;
 147# it should be valid encoding (see Encode::Supported(3pm) for list),
 148# for which encoding all byte sequences are valid, for example
 149# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 150# could be even 'utf-8' for the old behavior)
 151our $fallback_encoding = 'latin1';
 152
 153# rename detection options for git-diff and git-diff-tree
 154# - default is '-M', with the cost proportional to
 155#   (number of removed files) * (number of new files).
 156# - more costly is '-C' (which implies '-M'), with the cost proportional to
 157#   (number of changed files + number of removed files) * (number of new files)
 158# - even more costly is '-C', '--find-copies-harder' with cost
 159#   (number of files in the original tree) * (number of new files)
 160# - one might want to include '-B' option, e.g. '-B', '-M'
    # Each option is a separate list element, e.g. ('-C', '--find-copies-harder').
 161our @diff_opts = ('-M'); # taken from git_commit
 162
 163# Disables features that would allow repository owners to inject script into
 164# the gitweb domain.
    # Off (0) by default.
 165our $prevent_xss = 0;
 166
 167# Path to the highlight executable to use (must be the one from
 168# http://www.andre-simon.de due to assumptions about parameters and output).
 169# Useful if highlight is not installed on your webserver's PATH.
 170# [Default: highlight]
 171our $highlight_bin = "++HIGHLIGHT_BIN++";
 172
 173# information about snapshot formats that gitweb is capable of serving
    # Keys are the canonical format names; filter_snapshot_fmts() below keeps
    # only names that exist here and are not marked 'disabled'.
 174our %known_snapshot_formats = (
 175        # name => {
 176        #       'display' => display name,
 177        #       'type' => mime type,
 178        #       'suffix' => filename suffix,
 179        #       'format' => --format for git-archive,
 180        #       'compressor' => [compressor command and arguments]
 181        #                       (array reference, optional)
 182        #       'disabled' => boolean (optional)}
 183        #
 184        'tgz' => {
 185                'display' => 'tar.gz',
 186                'type' => 'application/x-gzip',
 187                'suffix' => '.tar.gz',
 188                'format' => 'tar',
 189                'compressor' => ['gzip', '-n']},
 190
 191        'tbz2' => {
 192                'display' => 'tar.bz2',
 193                'type' => 'application/x-bzip2',
 194                'suffix' => '.tar.bz2',
 195                'format' => 'tar',
 196                'compressor' => ['bzip2']},
 197
            # the only format that ships disabled
 198        'txz' => {
 199                'display' => 'tar.xz',
 200                'type' => 'application/x-xz',
 201                'suffix' => '.tar.xz',
 202                'format' => 'tar',
 203                'compressor' => ['xz'],
 204                'disabled' => 1},
 205
            # no 'compressor' entry: the only format here that is not 'tar'
 206        'zip' => {
 207                'display' => 'zip',
 208                'type' => 'application/x-zip',
 209                'suffix' => '.zip',
 210                'format' => 'zip'},
 211);
 212
 213# Aliases so we understand old gitweb.snapshot values in repository
 214# configuration.
    # filter_snapshot_fmts() below replaces each alias by its value before
    # checking it against %known_snapshot_formats.
 215our %known_snapshot_format_aliases = (
 216        'gzip'  => 'tgz',
 217        'bzip2' => 'tbz2',
 218        'xz'    => 'txz',
 219
 220        # backward compatibility: legacy gitweb config support
            # (these map to undef, which is not a key of %known_snapshot_formats,
            # so filter_snapshot_fmts() discards them)
 221        'x-gzip' => undef, 'gz' => undef,
 222        'x-bzip2' => undef, 'bz2' => undef,
 223        'x-zip' => undef, '' => undef,
 224);
 225
 226# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 227# are changed, it may be appropriate to change these values too via
 228# $GITWEB_CONFIG.
    # Two named sizes are defined; 'double' is twice 'default'.
 229our %avatar_size = (
 230        'default' => 16,
 231        'double'  => 32
 232);
 233
 234# Used to set the maximum load that we will still respond to gitweb queries.
 235# If server load exceeds this value then return "503 server busy" error.
 236# If gitweb cannot determine server load, it is taken to be 0.
 237# Leave it undefined (or set to 'undef') to turn off load checking.
    # The comparison itself is done in check_loadavg() against get_loadavg().
 238our $maxload = 300;
 239
 240# configuration for 'highlight' (http://www.andre-simon.de/)
 241# match by basename
    # Maps a file's basename to a syntax name; the values reuse syntax names
    # that also appear in %highlight_ext ('py', 'make').
 242our %highlight_basename = (
 243        #'Program' => 'py',
 244        #'Library' => 'py',
 245        'SConstruct' => 'py', # SCons equivalent of Makefile
 246        'Makefile' => 'make',
 247);
 # match by extension
 #
 # Maps a file extension to the name of the 'highlight' syntax to use.
 #
 # NOTE: every map() is wrapped in its own parentheses on purpose.  map is a
 # list operator, so without them each map would also consume all the list
 # elements that follow it, and every extension would end up mapped to itself
 # (e.g. 'h' => 'h' instead of 'h' => 'c').
 our %highlight_ext = (
         # main extensions, defining name of syntax;
         # see files in /usr/share/highlight/langDefs/ directory
         (map { $_ => $_ }
                 qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make)),
         # alternate extensions, see /etc/highlight/filetypes.conf
         'h' => 'c',
         (map { $_ => 'sh'  } qw(bash zsh ksh)),
         (map { $_ => 'cpp' } qw(cxx c++ cc)),
         (map { $_ => 'php' } qw(php3 php4 php5 phps)),
         (map { $_ => 'pl'  } qw(perl pm)), # perhaps also 'cgi'
         (map { $_ => 'make'} qw(mak mk)),
         (map { $_ => 'xml' } qw(xhtml html htm)),
 );
 263
 264# You define site-wide feature defaults here; override them with
 265# $GITWEB_CONFIG as necessary.
    # The table is read through gitweb_get_feature() / gitweb_check_feature(),
    # defined right after it.
 266our %feature = (
 267        # feature => {
 268        #       'sub' => feature-sub (subroutine),
 269        #       'override' => allow-override (boolean),
 270        #       'default' => [ default options...] (array reference)}
 271        #
 272        # if feature is overridable (it means that allow-override has true value),
 273        # then feature-sub will be called with default options as parameters;
 274        # return value of feature-sub indicates if to enable specified feature
 275        #
 276        # if there is no 'sub' key (no feature-sub), then feature cannot be
 277        # overridden
 278        #
 279        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 280        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 281        # is enabled
 282
 283        # Enable the 'blame' blob view, showing the last commit that modified
 284        # each line in the file. This can be very CPU-intensive.
 285
 286        # To enable system wide have in $GITWEB_CONFIG
 287        # $feature{'blame'}{'default'} = [1];
 288        # To have project specific config enable override in $GITWEB_CONFIG
 289        # $feature{'blame'}{'override'} = 1;
 290        # and in project config gitweb.blame = 0|1;
 291        'blame' => {
 292                'sub' => sub { feature_bool('blame', @_) },
 293                'override' => 0,
 294                'default' => [0]},
 295
 296        # Enable the 'snapshot' link, providing a compressed archive of any
 297        # tree. This can potentially generate high traffic if you have a large
 298        # project.
 299
 300        # Value is a list of formats defined in %known_snapshot_formats that
 301        # you wish to offer.
 302        # To disable system wide have in $GITWEB_CONFIG
 303        # $feature{'snapshot'}{'default'} = [];
 304        # To have project specific config enable override in $GITWEB_CONFIG
 305        # $feature{'snapshot'}{'override'} = 1;
 306        # and in project config, a comma-separated list of formats or "none"
 307        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 308        'snapshot' => {
 309                'sub' => \&feature_snapshot,
 310                'override' => 0,
 311                'default' => ['tgz']},
 312
 313        # Enable text search, which will list the commits which match author,
 314        # committer or commit text to a given string.  Enabled by default.
 315        # Project specific override is not supported.
 316        'search' => {
 317                'override' => 0,
 318                'default' => [1]},
 319
 320        # Enable grep search, which will list the files in currently selected
 321        # tree containing the given string. Enabled by default. This can be
 322        # potentially CPU-intensive, of course.
 323        # Note that you need to have 'search' feature enabled too.
 324
 325        # To enable system wide have in $GITWEB_CONFIG
 326        # $feature{'grep'}{'default'} = [1];
 327        # To have project specific config enable override in $GITWEB_CONFIG
 328        # $feature{'grep'}{'override'} = 1;
 329        # and in project config gitweb.grep = 0|1;
 330        'grep' => {
 331                'sub' => sub { feature_bool('grep', @_) },
 332                'override' => 0,
 333                'default' => [1]},
 334
 335        # Enable the pickaxe search, which will list the commits that modified
 336        # a given string in a file. This can be a practical and considerably
 337        # faster alternative to 'blame', but still potentially CPU-intensive.
 338        # Note that you need to have 'search' feature enabled too.
 339
 340        # To enable system wide have in $GITWEB_CONFIG
 341        # $feature{'pickaxe'}{'default'} = [1];
 342        # To have project specific config enable override in $GITWEB_CONFIG
 343        # $feature{'pickaxe'}{'override'} = 1;
 344        # and in project config gitweb.pickaxe = 0|1;
 345        'pickaxe' => {
 346                'sub' => sub { feature_bool('pickaxe', @_) },
 347                'override' => 0,
 348                'default' => [1]},
 349
 350        # Enable showing size of blobs in a 'tree' view, in a separate
 351        # column, similar to what 'ls -l' does.  This costs a bit of IO.
 352
 353        # To disable system wide have in $GITWEB_CONFIG
 354        # $feature{'show-sizes'}{'default'} = [0];
 355        # To have project specific config enable override in $GITWEB_CONFIG
 356        # $feature{'show-sizes'}{'override'} = 1;
 357        # and in project config gitweb.showsizes = 0|1;
            # (note: the feature is named 'show-sizes', but the project config
            # key passed to feature_bool() is 'showsizes', without the dash)
 358        'show-sizes' => {
 359                'sub' => sub { feature_bool('showsizes', @_) },
 360                'override' => 0,
 361                'default' => [1]},
 362
 363        # Make gitweb use an alternative format of the URLs which can be
 364        # more readable and natural-looking: project name is embedded
 365        # directly in the path and the query string contains other
 366        # auxiliary information. All gitweb installations recognize
 367        # URL in either format; this configures in which formats gitweb
 368        # generates links.
 369
 370        # To enable system wide have in $GITWEB_CONFIG
 371        # $feature{'pathinfo'}{'default'} = [1];
 372        # Project specific override is not supported.
 373
 374        # Note that you will need to change the default location of CSS,
 375        # favicon, logo and possibly other files to an absolute URL. Also,
 376        # if gitweb.cgi serves as your indexfile, you will need to force
 377        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 378        'pathinfo' => {
 379                'override' => 0,
 380                'default' => [0]},
 381
 382        # Make gitweb consider projects in project root subdirectories
 383        # to be forks of existing projects. Given project $projname.git,
 384        # projects matching $projname/*.git will not be shown in the main
 385        # projects list, instead a '+' mark will be added to $projname
 386        # there and a 'forks' view will be enabled for the project, listing
 387        # all the forks. If project list is taken from a file, forks have
 388        # to be listed after the main project.
 389
 390        # To enable system wide have in $GITWEB_CONFIG
 391        # $feature{'forks'}{'default'} = [1];
 392        # Project specific override is not supported.
 393        'forks' => {
 394                'override' => 0,
 395                'default' => [0]},
 396
 397        # Insert custom links to the action bar of all project pages.
 398        # This enables you mainly to link to third-party scripts integrating
 399        # into gitweb; e.g. git-browser for graphical history representation
 400        # or custom web-based repository administration interface.
 401
 402        # The 'default' value consists of a list of triplets in the form
 403        # (label, link, position) where position is the label after which
 404        # to insert the link and link is a format string where %n expands
 405        # to the project name, %f to the project path within the filesystem,
 406        # %h to the current hash (h gitweb parameter) and %b to the current
 407        # hash base (hb gitweb parameter); %% expands to %.
 408
 409        # To enable system wide have in $GITWEB_CONFIG e.g.
 410        # $feature{'actions'}{'default'} = [('graphiclog',
 411        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 412        # Project specific override is not supported.
 413        'actions' => {
 414                'override' => 0,
 415                'default' => []},
 416
 417        # Allow gitweb to scan project content tags described in ctags/
 418        # of project repository, and display the popular Web 2.0-ish
 419        # "tag cloud" near the project list. Note that this is something
 420        # COMPLETELY different from the normal Git tags.
 421
 422        # gitweb by itself can show existing tags, but it does not handle
 423        # tagging itself; you need an external application for that.
 424        # For an example script, check Girocco's cgi/tagproj.cgi.
 425        # You may want to install the HTML::TagCloud Perl module to get
 426        # a pretty tag cloud instead of just a list of tags.
 427
 428        # To enable system wide have in $GITWEB_CONFIG
 429        # $feature{'ctags'}{'default'} = ['path_to_tag_script'];
 430        # Project specific override is not supported.
 431        'ctags' => {
 432                'override' => 0,
 433                'default' => [0]},
 434
 435        # The maximum number of patches in a patchset generated in patch
 436        # view. Set this to 0 or undef to disable patch view, or to a
 437        # negative number to remove any limit.
 438
 439        # To disable system wide have in $GITWEB_CONFIG
 440        # $feature{'patches'}{'default'} = [0];
 441        # To have project specific config enable override in $GITWEB_CONFIG
 442        # $feature{'patches'}{'override'} = 1;
 443        # and in project config gitweb.patches = 0|n;
 444        # where n is the maximum number of patches allowed in a patchset.
 445        'patches' => {
 446                'sub' => \&feature_patches,
 447                'override' => 0,
 448                'default' => [16]},
 449
 450        # Avatar support. When this feature is enabled, views such as
 451        # shortlog or commit will display an avatar associated with
 452        # the email of the committer(s) and/or author(s).
 453
 454        # Currently available providers are gravatar and picon.
 455        # If an unknown provider is specified, the feature is disabled.
 456
 457        # Gravatar depends on Digest::MD5.
 458        # Picon currently relies on the indiana.edu database.
 459
 460        # To enable system wide have in $GITWEB_CONFIG
 461        # $feature{'avatar'}{'default'} = ['<provider>'];
 462        # where <provider> is either gravatar or picon.
 463        # To have project specific config enable override in $GITWEB_CONFIG
 464        # $feature{'avatar'}{'override'} = 1;
 465        # and in project config gitweb.avatar = <provider>;
 466        'avatar' => {
 467                'sub' => \&feature_avatar,
 468                'override' => 0,
 469                'default' => ['']},
 470
 471        # Enable displaying how much time and how many git commands
 472        # it took to generate and display page.  Disabled by default.
 473        # Project specific override is not supported.
 474        'timed' => {
 475                'override' => 0,
 476                'default' => [0]},
 477
 478        # Enable turning some links into links to actions which require
 479        # JavaScript to run (like 'blame_incremental').  Not enabled by
 480        # default.  Project specific override is currently not supported.
 481        'javascript-actions' => {
 482                'override' => 0,
 483                'default' => [0]},
 484
 485        # Syntax highlighting support. This is based on Daniel Svensson's
 486        # and Sham Chukoury's work in gitweb-xmms2.git.
 487        # It requires the 'highlight' program present in $PATH,
 488        # and therefore is disabled by default.
 489
 490        # To enable system wide have in $GITWEB_CONFIG
 491        # $feature{'highlight'}{'default'} = [1];
            # The feature-sub below reads the boolean project config key
            # 'highlight' (presumably gitweb.highlight, by analogy with the
            # other features), but gitweb_get_feature() only calls it when
            # $feature{'highlight'}{'override'} = 1; is set in $GITWEB_CONFIG.
 492
 493        'highlight' => {
 494                'sub' => sub { feature_bool('highlight', @_) },
 495                'override' => 0,
 496                'default' => [0]},
 497
 498        # Enable displaying of remote heads in the heads list
 499
 500        # To enable system wide have in $GITWEB_CONFIG
 501        # $feature{'remote_heads'}{'default'} = [1];
 502        # To have project specific config enable override in $GITWEB_CONFIG
 503        # $feature{'remote_heads'}{'override'} = 1;
 504        # and in project config gitweb.remote_heads = 0|1;
 505        'remote_heads' => {
 506                'sub' => sub { feature_bool('remote_heads', @_) },
 507                'override' => 0,
 508                'default' => [0]},
 509);
 510
 # Return the value (a list) of feature $name from %feature.
 #
 # Returns nothing for an unknown feature.  The site-wide defaults are
 # returned unless the feature allows overriding and a project ($git_dir) is
 # selected; in that case the feature-sub is called with the defaults and its
 # result is returned.  An overridable feature without a feature-sub triggers
 # a warning and yields the defaults.
 sub gitweb_get_feature {
         my ($name) = @_;
         return unless exists $feature{$name};

         my $spec     = $feature{$name};
         my @defaults = @{$spec->{'default'}};

         # project specific override is possible only if we have project
         our $git_dir; # global variable, declared later
         return @defaults
                 unless $spec->{'override'} && defined $git_dir;

         my $feature_sub = $spec->{'sub'};
         unless (defined $feature_sub) {
                 warn "feature $name is not overridable";
                 return @defaults;
         }

         return $feature_sub->(@defaults);
 }
 529
 # Convenience wrapper returning only the first element of a feature's value,
 # which is handy for features that are a single on/off flag.  It lets you write
 #
 #   my $bool_feat = gitweb_check_feature('bool_feat');
 #   gitweb_check_feature('bool_feat') or somecode;
 #
 # rather than
 #
 #   my ($bool_feat) = gitweb_get_feature('bool_feat');
 #   (gitweb_get_feature('bool_feat'))[0] or somecode;
 #
 sub gitweb_check_feature {
         my @values = gitweb_get_feature(@_);
         # an empty feature value gives an empty list (undef in scalar context)
         return @values ? $values[0] : ();
 }
 544
 545
 # Feature-sub for on/off features: look up project config key $key as a
 # boolean.  The remaining arguments are the feature's defaults; the first
 # one is returned when the project does not set the key.  A configured
 # 'true' gives (1), a configured 'false' gives (0).
 sub feature_bool {
         my ($key, @defaults) = @_;
         my ($configured) = git_get_project_config($key, '--bool');

         return ($defaults[0]) unless defined $configured;
         return (1) if $configured eq 'true';
         # any other value falls off the end without an explicit return
         return (0) if $configured eq 'false';
 }
 558
 # Feature-sub for 'snapshot': the arguments are the default formats.  A true
 # project config value 'snapshot' replaces them: 'none' means no formats at
 # all, anything else is split on commas and/or whitespace.
 sub feature_snapshot {
         my @formats = @_;

         my ($configured) = git_get_project_config('snapshot');
         return @formats unless $configured;

         @formats = ();
         @formats = split /\s*[,\s]\s*/, $configured
                 if $configured ne 'none';

         return @formats;
 }
 570
 # Feature-sub for 'patches': whatever the project config lookup of 'patches'
 # (as an integer) returns wins; if it returns nothing, the first default
 # passed in is used.
 sub feature_patches {
         my ($default) = @_;

         my @configured = git_get_project_config('patches', '--int');
         return @configured if @configured;

         return ($default);
 }
 580
 # Feature-sub for 'avatar': the project config value of 'avatar' if the
 # lookup returns anything, otherwise the defaults passed in.
 sub feature_avatar {
         my @configured = git_get_project_config('avatar');

         return @configured if @configured;
         return @_;
 }
 586
 # Tell whether directory $dir has a usable HEAD.
 #
 # Testing the HEAD file with -e alone is fragile: in a repository that was
 # initialized long ago HEAD may be a symlink, and after pack-refs and pruning
 # its target may no longer exist.  Such a HEAD is still accepted when the
 # symlink points below refs/heads/.
 sub check_head_link {
         my ($dir) = @_;
         my $head_path = "$dir/HEAD";

         return 1 if -e $head_path;
         return (-l $head_path && readlink($head_path) =~ /^refs\/heads\//);
 }
 596
 # Decide whether the repository in $dir may be shown.  All of these must hold:
 #  - it has a usable HEAD (check_head_link),
 #  - if $export_ok is set, the file "$dir/$export_ok" exists,
 #  - if $export_auth_hook is set, the hook returns true for $dir.
 # Returns the first false check result, or the result of the last check.
 sub check_export_ok {
         my ($dir) = @_;

         my $has_head = check_head_link($dir);
         return $has_head unless $has_head;

         my $marker_ok = (!$export_ok || -e "$dir/$export_ok");
         return $marker_ok unless $marker_ok;

         return (!$export_auth_hook || $export_auth_hook->($dir));
 }
 603
 # process alternate names for backward compatibility
 # filter out unsupported (unknown) snapshot formats
 #
 # Takes a list of snapshot format names (canonical names or aliases from
 # %known_snapshot_format_aliases) and returns the canonical names that are
 # present in %known_snapshot_formats and not marked 'disabled', in the
 # order given.
 sub filter_snapshot_fmts {
         # undefined names cannot match anything; dropping them up front keeps
         # the hash lookups below free of "uninitialized value" warnings
         my @fmts = grep { defined $_ } @_;

         # translate aliases to canonical names
         @fmts = map {
                 exists $known_snapshot_format_aliases{$_} ?
                        $known_snapshot_format_aliases{$_} : $_} @fmts;

         # legacy aliases translate to undef: discard those before using the
         # name as a hash key, then keep only known, enabled formats
         @fmts = grep {
                 defined $_ &&
                 exists $known_snapshot_formats{$_} &&
                 !$known_snapshot_formats{$_}{'disabled'}} @fmts;

         return @fmts;
 }
 616
 617# If this is set to a code reference, that code is run once per request,
 618# which allows updating configuration that changes with each request
 619# while the rest of the config file is run only once.
 620#
 621# Otherwise, if it is false then gitweb would process config file only once;
 622# if it is true then gitweb config would be run for each request.
    # NOTE(review): the code acting on this variable is not in this part of the
    # file -- confirm the exact behaviour where it is used.
 623our $per_request_config = 1;
 624
 our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);

 # Locate and run the gitweb configuration file.
 #
 # The per-instance file ($ENV{'GITWEB_CONFIG'} or the built-in path) is
 # preferred; the system-wide file ($ENV{'GITWEB_CONFIG_SYSTEM'} or the
 # built-in path) is used only when the per-instance file does not exist.
 # At most one of them is run.  Dies with the config file's error if running
 # it left an error in $@.
 sub evaluate_gitweb_config {
         our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
         our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";

         foreach my $config_file ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                 next unless -e $config_file;

                 do $config_file;
                 # die if there are errors parsing config file
                 die $@ if $@;

                 # only the first existing file is processed
                 last;
         }
 }
 638
 # Return the current load average of the system, for comparison against
 # $maxload.  Only '/proc/loadavg' is consulted at present; when that file is
 # missing or cannot be opened the result is 0, which means no load checking.
 sub get_loadavg {
         my $loadavg_file = '/proc/loadavg';

         # additional checks for load average should go here for things that
         # don't export /proc/loadavg
         return 0 unless -e $loadavg_file;

         open my $fd, '<', $loadavg_file
                 or return 0;
         my $line = <$fd>;
         close $fd;

         # The first three columns are the load averages over the last one,
         # five, and 15 minutes.  The fourth column shows the number of
         # currently running processes and the total number of processes in
         # the m/n format.  The last column displays the last process ID used.
         # Only the one-minute average (first column) is used.
         my @fields = split(/\s+/, $line);
         return $fields[0] || 0;
 }
 660
 # version of the core git binary
 our $git_version;

 # Run "$GIT --version" and store the reported version in $git_version
 # ("unknown" when the output does not contain "git version ...").
 # Counts as one git command in $number_of_git_cmds.
 sub evaluate_git_version {
         my $version_output = qx("$GIT" --version);

         our $git_version = "unknown";
         if ($version_output =~ m/git version (.*)$/) {
                 $git_version = $1;
         }

         $number_of_git_cmds++;
 }
 667
 # Refuse to serve the request (error 503) when load checking is enabled,
 # i.e. $maxload is defined, and the current load average exceeds $maxload.
 sub check_loadavg {
         return unless defined $maxload;

         die_error(503, "The load average on the server is too high")
                 if get_loadavg() > $maxload;
 }
 673
 674# ======================================================================
 675# input validation and dispatch
 676
 677# input parameters can be collected from a variety of sources (presently, CGI
 678# and PATH_INFO), so we define an %input_params hash that collects them all
 679# together during validation: this allows subsequent uses (e.g. href()) to be
 680# agnostic of the parameter origin
 681
    # Starts out empty; it is filled by evaluate_query_params() and
    # evaluate_path_info() below.
 682our %input_params = ();
 683
 684# input parameters are stored with the long parameter name as key. This will
 685# also be used in the href subroutine to convert parameters to their CGI
 686# equivalent, and since the href() usage is the most frequent one, we store
 687# the name -> CGI key mapping here, instead of the reverse.
 688#
 689# XXX: Warning: If you touch this, check the search form for updating,
 690# too.
 691
    # Kept as a flat (name => key) list so that the order of the entries is
    # preserved; the hash built from it below is for lookups by name.
 692our @cgi_param_mapping = (
 693        project => "p",
 694        action => "a",
 695        file_name => "f",
 696        file_parent => "fp",
 697        hash => "h",
 698        hash_parent => "hp",
 699        hash_base => "hb",
 700        hash_parent_base => "hpb",
 701        page => "pg",
 702        order => "o",
 703        searchtext => "s",
 704        searchtype => "st",
 705        snapshot_format => "sf",
            # the only multi-valued parameter, see evaluate_query_params()
 706        extra_options => "opt",
 707        search_use_regexp => "sr",
 708        # this must be last entry (for manipulation from JavaScript)
 709        javascript => "js"
 710);
    # same pairs as a hash: long parameter name => CGI key
 711our %cgi_param_mapping = @cgi_param_mapping;
 712
 713# we will also need to know the possible actions, for validation
    # Maps an action name to a reference to the subroutine handling it.
    # evaluate_path_info() below checks candidate action names against the keys
    # of this hash; the handlers themselves are defined elsewhere in the file.
 714our %actions = (
 715        "blame" => \&git_blame,
 716        "blame_incremental" => \&git_blame_incremental,
 717        "blame_data" => \&git_blame_data,
 718        "blobdiff" => \&git_blobdiff,
 719        "blobdiff_plain" => \&git_blobdiff_plain,
 720        "blob" => \&git_blob,
 721        "blob_plain" => \&git_blob_plain,
 722        "commitdiff" => \&git_commitdiff,
 723        "commitdiff_plain" => \&git_commitdiff_plain,
 724        "commit" => \&git_commit,
 725        "forks" => \&git_forks,
 726        "heads" => \&git_heads,
 727        "history" => \&git_history,
 728        "log" => \&git_log,
 729        "patch" => \&git_patch,
 730        "patches" => \&git_patches,
 731        "remotes" => \&git_remotes,
 732        "rss" => \&git_rss,
 733        "atom" => \&git_atom,
 734        "search" => \&git_search,
 735        "search_help" => \&git_search_help,
 736        "shortlog" => \&git_shortlog,
 737        "summary" => \&git_summary,
 738        "tag" => \&git_tag,
 739        "tags" => \&git_tags,
 740        "tree" => \&git_tree,
 741        "snapshot" => \&git_snapshot,
 742        "object" => \&git_object,
 743        # those below don't need $project
 744        "opml" => \&git_opml,
 745        "project_list" => \&git_project_list,
 746        "project_index" => \&git_project_index,
 747);
 748
 749# finally, we have the hash of allowed extra_options for the commands that
 750# allow them
    # option => [ names of the actions (keys of %actions) that accept it ]
 751our %allowed_options = (
 752        "--no-merges" => [ qw(rss atom log shortlog history) ],
 753);
 754
 755# fill %input_params with the CGI parameters. All values except for 'opt'
 756# should be single values, but opt can be an array. We should probably
 757# build an array of parameters that can be multi-valued, but since for the time
 758# being it's only this one, we just single it out
 759sub evaluate_query_params {
 760        our $cgi;
 761
 762        while (my ($name, $symbol) = each %cgi_param_mapping) {
 763                if ($symbol eq 'opt') {
 764                        $input_params{$name} = [ $cgi->param($symbol) ];
 765                } else {
 766                        $input_params{$name} = $cgi->param($symbol);
 767                }
 768        }
 769}
 770
 771# now read PATH_INFO and update the parameter list for missing parameters
 772sub evaluate_path_info {
 773        return if defined $input_params{'project'};
 774        return if !$path_info;
 775        $path_info =~ s,^/+,,;
 776        return if !$path_info;
 777
 778        # find which part of PATH_INFO is project
 779        my $project = $path_info;
 780        $project =~ s,/+$,,;
 781        while ($project && !check_head_link("$projectroot/$project")) {
 782                $project =~ s,/*[^/]*$,,;
 783        }
 784        return unless $project;
 785        $input_params{'project'} = $project;
 786
 787        # do not change any parameters if an action is given using the query string
 788        return if $input_params{'action'};
 789        $path_info =~ s,^\Q$project\E/*,,;
 790
 791        # next, check if we have an action
 792        my $action = $path_info;
 793        $action =~ s,/.*$,,;
 794        if (exists $actions{$action}) {
 795                $path_info =~ s,^$action/*,,;
 796                $input_params{'action'} = $action;
 797        }
 798
 799        # list of actions that want hash_base instead of hash, but can have no
 800        # pathname (f) parameter
 801        my @wants_base = (
 802                'tree',
 803                'history',
 804        );
 805
 806        # we want to catch, among others
 807        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 808        my ($parentrefname, $parentpathname, $refname, $pathname) =
 809                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 810
 811        # first, analyze the 'current' part
 812        if (defined $pathname) {
 813                # we got "branch:filename" or "branch:dir/"
 814                # we could use git_get_type(branch:pathname), but:
 815                # - it needs $git_dir
 816                # - it does a git() call
 817                # - the convention of terminating directories with a slash
 818                #   makes it superfluous
 819                # - embedding the action in the PATH_INFO would make it even
 820                #   more superfluous
 821                $pathname =~ s,^/+,,;
 822                if (!$pathname || substr($pathname, -1) eq "/") {
 823                        $input_params{'action'} ||= "tree";
 824                        $pathname =~ s,/$,,;
 825                } else {
 826                        # the default action depends on whether we had parent info
 827                        # or not
 828                        if ($parentrefname) {
 829                                $input_params{'action'} ||= "blobdiff_plain";
 830                        } else {
 831                                $input_params{'action'} ||= "blob_plain";
 832                        }
 833                }
 834                $input_params{'hash_base'} ||= $refname;
 835                $input_params{'file_name'} ||= $pathname;
 836        } elsif (defined $refname) {
 837                # we got "branch". In this case we have to choose if we have to
 838                # set hash or hash_base.
 839                #
 840                # Most of the actions without a pathname only want hash to be
 841                # set, except for the ones specified in @wants_base that want
 842                # hash_base instead. It should also be noted that hand-crafted
 843                # links having 'history' as an action and no pathname or hash
 844                # set will fail, but that happens regardless of PATH_INFO.
 845                if (defined $parentrefname) {
 846                        # if there is parent let the default be 'shortlog' action
 847                        # (for http://git.example.com/repo.git/A..B links); if there
 848                        # is no parent, dispatch will detect type of object and set
 849                        # action appropriately if required (if action is not set)
 850                        $input_params{'action'} ||= "shortlog";
 851                }
 852                if ($input_params{'action'} &&
 853                    grep { $_ eq $input_params{'action'} } @wants_base) {
 854                        $input_params{'hash_base'} ||= $refname;
 855                } else {
 856                        $input_params{'hash'} ||= $refname;
 857                }
 858        }
 859
 860        # next, handle the 'parent' part, if present
 861        if (defined $parentrefname) {
 862                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 863                # someproject/blobdiff/oldrev..newrev:/filename
 864                if ($parentpathname) {
 865                        $parentpathname =~ s,^/+,,;
 866                        $parentpathname =~ s,/$,,;
 867                        $input_params{'file_parent'} ||= $parentpathname;
 868                } else {
 869                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 870                }
 871                # we assume that hash_parent_base is wanted if a path was specified,
 872                # or if the action wants hash_base instead of hash
 873                if (defined $input_params{'file_parent'} ||
 874                        grep { $_ eq $input_params{'action'} } @wants_base) {
 875                        $input_params{'hash_parent_base'} ||= $parentrefname;
 876                } else {
 877                        $input_params{'hash_parent'} ||= $parentrefname;
 878                }
 879        }
 880
 881        # for the snapshot action, we allow URLs in the form
 882        # $project/snapshot/$hash.ext
 883        # where .ext determines the snapshot and gets removed from the
 884        # passed $refname to provide the $hash.
 885        #
 886        # To be able to tell that $refname includes the format extension, we
 887        # require the following two conditions to be satisfied:
 888        # - the hash input parameter MUST have been set from the $refname part
 889        #   of the URL (i.e. they must be equal)
 890        # - the snapshot format MUST NOT have been defined already (e.g. from
 891        #   CGI parameter sf)
 892        # It's also useless to try any matching unless $refname has a dot,
 893        # so we check for that too
 894        if (defined $input_params{'action'} &&
 895                $input_params{'action'} eq 'snapshot' &&
 896                defined $refname && index($refname, '.') != -1 &&
 897                $refname eq $input_params{'hash'} &&
 898                !defined $input_params{'snapshot_format'}) {
 899                # We loop over the known snapshot formats, checking for
 900                # extensions. Allowed extensions are both the defined suffix
 901                # (which includes the initial dot already) and the snapshot
 902                # format key itself, with a prepended dot
 903                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 904                        my $hash = $refname;
 905                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 906                                next;
 907                        }
 908                        my $sfx = $1;
 909                        # a valid suffix was found, so set the snapshot format
 910                        # and reset the hash parameter
 911                        $input_params{'snapshot_format'} = $fmt;
 912                        $input_params{'hash'} = $hash;
 913                        # we also set the format suffix to the one requested
 914                        # in the URL: this way a request for e.g. .tgz returns
 915                        # a .tgz instead of a .tar.gz
 916                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 917                        last;
 918                }
 919        }
 920}
 921
 922our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 923     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 924     $searchtext, $search_regexp);
 925sub evaluate_and_validate_params {
 926        our $action = $input_params{'action'};
 927        if (defined $action) {
 928                if (!validate_action($action)) {
 929                        die_error(400, "Invalid action parameter");
 930                }
 931        }
 932
 933        # parameters which are pathnames
 934        our $project = $input_params{'project'};
 935        if (defined $project) {
 936                if (!validate_project($project)) {
 937                        undef $project;
 938                        die_error(404, "No such project");
 939                }
 940        }
 941
 942        our $file_name = $input_params{'file_name'};
 943        if (defined $file_name) {
 944                if (!validate_pathname($file_name)) {
 945                        die_error(400, "Invalid file parameter");
 946                }
 947        }
 948
 949        our $file_parent = $input_params{'file_parent'};
 950        if (defined $file_parent) {
 951                if (!validate_pathname($file_parent)) {
 952                        die_error(400, "Invalid file parent parameter");
 953                }
 954        }
 955
 956        # parameters which are refnames
 957        our $hash = $input_params{'hash'};
 958        if (defined $hash) {
 959                if (!validate_refname($hash)) {
 960                        die_error(400, "Invalid hash parameter");
 961                }
 962        }
 963
 964        our $hash_parent = $input_params{'hash_parent'};
 965        if (defined $hash_parent) {
 966                if (!validate_refname($hash_parent)) {
 967                        die_error(400, "Invalid hash parent parameter");
 968                }
 969        }
 970
 971        our $hash_base = $input_params{'hash_base'};
 972        if (defined $hash_base) {
 973                if (!validate_refname($hash_base)) {
 974                        die_error(400, "Invalid hash base parameter");
 975                }
 976        }
 977
 978        our @extra_options = @{$input_params{'extra_options'}};
 979        # @extra_options is always defined, since it can only be (currently) set from
 980        # CGI, and $cgi->param() returns the empty array in array context if the param
 981        # is not set
 982        foreach my $opt (@extra_options) {
 983                if (not exists $allowed_options{$opt}) {
 984                        die_error(400, "Invalid option parameter");
 985                }
 986                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
 987                        die_error(400, "Invalid option parameter for this action");
 988                }
 989        }
 990
 991        our $hash_parent_base = $input_params{'hash_parent_base'};
 992        if (defined $hash_parent_base) {
 993                if (!validate_refname($hash_parent_base)) {
 994                        die_error(400, "Invalid hash parent base parameter");
 995                }
 996        }
 997
 998        # other parameters
 999        our $page = $input_params{'page'};
1000        if (defined $page) {
1001                if ($page =~ m/[^0-9]/) {
1002                        die_error(400, "Invalid page parameter");
1003                }
1004        }
1005
1006        our $searchtype = $input_params{'searchtype'};
1007        if (defined $searchtype) {
1008                if ($searchtype =~ m/[^a-z]/) {
1009                        die_error(400, "Invalid searchtype parameter");
1010                }
1011        }
1012
1013        our $search_use_regexp = $input_params{'search_use_regexp'};
1014
1015        our $searchtext = $input_params{'searchtext'};
1016        our $search_regexp;
1017        if (defined $searchtext) {
1018                if (length($searchtext) < 2) {
1019                        die_error(403, "At least two characters are required for search parameter");
1020                }
1021                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
1022        }
1023}
1024
# path to the current git repository
our $git_dir;

# Set $git_dir to "$projectroot/$project" for the current request, or to
# undef when the request has no project. It is assigned unconditionally so
# that, when one process serves several requests, a request without a
# project does not inherit the repository path of an earlier one.
sub evaluate_git_dir {
        our $git_dir = $project ? "$projectroot/$project" : undef;
}
1030
our (@snapshot_fmts, $git_avatar);

# Read the 'snapshot' and 'avatar' features with gitweb_get_feature() and
# store the results in @snapshot_fmts and $git_avatar.
sub configure_gitweb_features {
        # list of supported snapshot formats, passed through
        # filter_snapshot_fmts()
        our @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # can be loaded; in any other case $git_avatar becomes the empty
        # string.
        our ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'picon') {
                # known provider, no dependencies
        } elsif ($git_avatar eq 'gravatar') {
                # gravatar needs Digest::MD5
                eval { require Digest::MD5; 1; }
                        or $git_avatar = '';
        } else {
                # unknown provider name
                $git_avatar = '';
        }
}
1050
# Error handler registered with CGI::Carp: a plain 'die <message>' is shown
# as an Internal Server Error page produced by die_error().
sub handle_errors_html {
        my ($msg) = @_; # it is already HTML escaped

        # If die_error itself fails we would end up here again and loop
        # forever; to prevent that, replace this handler with a plain
        # message before calling die_error.
        set_message("Error occured when inside die_error:\n$msg");

        # The subroutine set via CGI::Carp::set_message is called _after_
        # the HTTP headers are already written, so die_error must not write
        # them, and it must not jump out either, as it runs as error handler.
        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1065
# dispatch: choose a default action if none was requested, check that the
# action is known and has the project it needs, then run its handler
sub dispatch {
        unless (defined $action) {
                # no explicit action: derive it from the object type when an
                # object was named, otherwise show the project summary or,
                # without a project, the list of projects
                $action =
                        defined $hash
                                ? git_get_type($hash) :
                        (defined $hash_base && defined $file_name)
                                ? git_get_type("$hash_base:$file_name") :
                        defined $project
                                ? 'summary'
                                : 'project_list';
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # only these three actions can work without a project
        my $needs_project = ($action !~ m/^(?:opml|project_list|project_index)$/);
        die_error(400, "Project needed")
                if ($needs_project && !$project);

        $actions{$action}->();
}
1088
# Restart the per-request bookkeeping: take a new start time (only if $t0
# is defined) and zero the counter of git commands.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1094
our $first_request = 1;

# Serve one request: evaluate the URI and configuration, collect and
# validate the parameters, then dispatch to the requested action.
sub run_request {
        reset_timer();

        evaluate_uri();

        # configuration and git version are evaluated once, on the first
        # request
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }

        # per-request configuration: either a callback to run, or a true
        # value asking to re-read the configuration on later requests
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }
        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list = $projectroot
                unless $projects_list;

        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1125
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: load CGI::Fast, use it as the class that
# request objects are created from, and install an $is_last_request
# callback that counts its calls.
sub configure_as_fcgi {
        our ($CGI, $is_last_request);

        require CGI::Fast;
        $CGI = 'CGI::Fast';

        # the callback starts returning true once it has been called more
        # than 100 times, which ends the request loop of this process
        my $calls = 0;
        $is_last_request = sub { ++$calls > 100 };
}
# Work out how gitweb was started: a script name ending in .fcgi, or the
# --fastcgi option, selects FastCGI operation; --nproc=N additionally sets
# up FCGI::ProcManager hooks when that module can be loaded.
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        # nothing else to do without command line arguments
        return unless (@ARGV);

        # handler of the 'nproc' option: receives option name and value
        my $use_proc_manager = sub {
                my (undef, $n_processes) = @_;

                # silently ignore the option if the module is missing
                eval { require FCGI::ProcManager; 1; }
                        or return;

                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $n_processes,
                });
                our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1160
# Main loop: create request objects from the class named in $CGI and serve
# them one by one, calling the optional hooks around each request, until no
# request object is returned or $is_last_request says to stop.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                if ($is_last_request->()) {
                        last REQUEST;
                }
        }

        # NOTE(review): this label is not referenced in the sub itself;
        # presumably it is a jump target used elsewhere in the file - confirm
        # before removing it
 DONE_GITWEB:
        1;
}
1185
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI) there is a caller to
# return to; a pure CGI script, serving a single request, simply exits.
return if defined caller;
exit;
1196
1197## ======================================================================
1198## action links
1199
# Build a gitweb URL from named parameters; the names are the long ones
# used as keys of %cgi_param_mapping (project, action, hash, ...). When
# path_info URLs are in use as many parameters as possible are put into
# the path, the remaining ones go into the query string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# Returns the URL as a string.
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over every parameter of the current request that was
                # not given explicitly
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot;
                # the action may be missing, so test for that first
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing '..' cannot go into the
                                                # path; it stays a query parameter
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly; walking the array (not the
        # hash) keeps them in the order of @cgi_param_mapping
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1329
1330
1331## ======================================================================
1332## validation, quoting/unquoting and escaping
1333
# Return the action name if it is a key of %actions, undef otherwise.
# False names (undef, '' and '0') are rejected without a lookup.
sub validate_action {
        my ($input) = @_;

        return undef unless $input && exists $actions{$input};
        return $input;
}
1339
# Return the project name if it is acceptable, undef otherwise. A project
# is acceptable when its name is a valid pathname, it is a directory below
# $projectroot, check_export_ok() accepts it and, with $strict_export set,
# project_in_list() finds it. The checks run in this order and stop at the
# first failure.
sub validate_project {
        my ($input) = @_;

        return undef unless $input;
        return undef unless validate_pathname($input);
        return undef unless -d "$projectroot/$input";
        return undef unless check_export_ok("$projectroot/$input");
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1351
# Return the pathname if it is acceptable, undef otherwise.
# NOTE: any false value is rejected up front, which includes the name '0'.
sub validate_pathname {
        my ($input) = @_;

        return undef unless $input;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # this also catches empty elements, i.e. doubled slashes and
        # slashes at the very beginning or end
        my $has_bad_element = ($input =~ m!(^|/)(|\.|\.\.)(/|$)!);

        # no null characters
        my $has_nul = ($input =~ m!\0!);

        return ($has_bad_element || $has_nul) ? undef : $input;
}
1367
# Return the ref name if it is acceptable, undef otherwise. Accepted are
# 40-digit hexadecimal object names, and valid pathnames that do not break
# the ref name restrictions checked below.
# NOTE: any false value is rejected up front, which includes the name '0'.
sub validate_refname {
        my ($input) = @_;

        return undef unless $input;

        # textual hashes are O.K.
        return $input
                if $input =~ m/^[0-9a-fA-F]{40}$/;

        # it must be correct pathname
        return undef
                unless validate_pathname($input);

        # restrictions on ref name according to git-check-ref-format
        return undef
                if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

        return $input;
}
1384
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Returns undef for undef. A string that already is a character string
# (utf8 flag set) is returned unchanged, so that it is never decoded twice.
# Octets that form valid UTF-8 are decoded as such; anything else is
# decoded using $fallback_encoding.
sub to_utf8 {
        my $str = shift;
        return undef unless defined $str;

        # utf8::decode() works in place and returns false, leaving the
        # string alone, when the octets are not valid UTF-8; this is the
        # test needed here (utf8::valid() checks something else, namely
        # the consistency of perl's internal representation)
        if (utf8::is_utf8($str) || utf8::decode($str)) {
                return $str;
        } else {
                return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
        }
}
1398
# Escape a value for use in the query string: unsafe characters are
# URI-escaped and spaces become '+'. The slash is kept even though that is
# not correct, because quoted slashes look too horrible in bookmarks.
# Returns undef for undef.
sub esc_param {
        my ($str) = @_;

        if (defined $str) {
                $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
                $str =~ s/ /\+/g;
        }
        return $str;
}
1408
# Escape a value for use in the path_info part of a URL. The rules differ
# slightly from those for the query string: '+' is not treated as a space
# (specially) there, so spaces and '+' are left alone, but '?' must be
# escaped. Returns undef for undef.
sub esc_path_info {
        my ($str) = @_;

        if (defined $str) {
                $str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
        }
        return $str;
}
1419
# Escape unsafe characters in a whole URL; characters that have a meaning
# in the URL structure (such as '?', '&', '=' and ';') cannot be quoted.
# Spaces become '+'. Returns undef for undef.
sub esc_url {
        my ($str) = @_;

        if (defined $str) {
                $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
                $str =~ s/ /\+/g;
        }
        return $str;
}
1428
# Quote unsafe characters in HTML attributes. For XHTML conformance
# escaping '"' to '&quot;' is not enough, so all the work is handed to
# esc_html(), with the arguments passed on unchanged.
sub esc_attr {
        my @args = @_;

        return esc_html(@args);
}
1435
# Escape a string for HTML output: convert it with to_utf8(), escape HTML
# special characters and make control characters (except the tab) visible
# with quot_cec(). With the option -nbsp => 1 every space is turned into
# '&nbsp;'. Returns undef for undef.
sub esc_html {
        my ($str, %opts) = @_;

        return undef unless defined $str;

        $str = $cgi->escapeHTML(to_utf8($str));
        $str =~ s/ /&nbsp;/g
                if $opts{'-nbsp'};
        # tabs are left alone here, unlike in esc_path()
        $str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;

        return $str;
}
1451
# Escape a filename for HTML output: convert it with to_utf8(), escape HTML
# special characters and make every control character, the tab included,
# visible with quot_cec(). With the option -nbsp => 1 every space is
# turned into '&nbsp;'. Returns undef for undef.
sub esc_path {
        my ($str, %opts) = @_;

        return undef unless defined $str;

        $str = $cgi->escapeHTML(to_utf8($str));
        $str =~ s/ /&nbsp;/g
                if $opts{'-nbsp'};
        $str =~ s|([[:cntrl:]])|quot_cec($1)|eg;

        return $str;
}
1467
# Make control characters "printable", using character escape codes (CEC)
#
# Takes a single control character, followed by options. Characters with a
# well-known escape sequence are shown as that sequence (e.g. '\n'); any
# other one is shown as a backslash followed by its code as two hexadecimal
# digits. Unless the option -nohtml => 1 is given, the result is wrapped in
# <span class="cntrl">...</span>.
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # zero-pad the code: a plain '%2x' pads with a space and would turn
        # e.g. the character 0x01 into a backslash, a space and '1'
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1492
# Alternative to quot_cec(): show a control character as a decimal HTML
# character reference to the codepoint 0x2400 + its code (Unicode control
# pictures, the Unicode "printable representation", PR). Unless the option
# -nohtml => 1 is given, the result is wrapped in
# <span class="cntrl">...</span>.
sub quot_upr {
        my ($cntrl, %opts) = @_;

        my $picture = sprintf('&#%04d;', 0x2400+ord($cntrl));

        return $opts{-nohtml}
                ? $picture
                : "<span class=\"cntrl\">$picture</span>";
}
1506
# git may return quoted and escaped filenames; undo that quoting.
#
# A name enclosed in double quotes has the quotes removed and every
# backslash sequence inside it decoded by unq().  Any other string is
# returned unchanged.
sub unquote {
        my $name = shift;

        # not wrapped in double quotes: nothing to do
        return $name unless $name =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}

# Decode one backslash sequence, given the text that followed the backslash:
# one to three octal digits become the character with that code, a known
# escape letter becomes its control character, and anything else stands
# for itself.
sub unq {
        my $seq = shift;

        # octal char sequence
        return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

        my %es = ( # character escape codes, aka escape sequences
                't' => "\t",   # tab            (HT, TAB)
                'n' => "\n",   # newline        (NL)
                'r' => "\r",   # return         (CR)
                'f' => "\f",   # form feed      (FF)
                'b' => "\b",   # backspace      (BS)
                'a' => "\a",   # alarm (bell)   (BEL)
                'e' => "\e",   # escape         (ESC)
                'v' => "\013", # vertical tab   (VT)
        );

        # C escape sequence if known, otherwise a quoted ordinary character
        return exists $es{$seq} ? $es{$seq} : $seq;
}
1542
# escape tabs (convert tabs to spaces)
#
# Each tab is replaced by as many spaces as it takes to reach the next
# multiple of 8 columns, counting from the start of the string.
sub untabify {
        my $line = shift;

        my $tab_at = index($line, "\t");
        while ($tab_at != -1) {
                # a tab always advances by 1..8 columns
                substr($line, $tab_at, 1, ' ' x (8 - ($tab_at % 8)));
                # everything before $tab_at is already tab-free
                $tab_at = index($line, "\t", $tab_at);
        }

        return $line;
}
1556
# Count the entries returned by git_get_projects_list() whose 'path' equals
# $project; the result is 0 (false) when there is no such entry.
sub project_in_list {
        my $project = shift;

        my $matches = grep { $_->{'path'} eq $project } git_get_projects_list();
        return $matches;
}
1562
1563## ----------------------------------------------------------------------
1564## HTML aware string manipulation
1565
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Parameters:
#   $str     - string to shorten (converted with to_utf8() first)
#   $len     - number of characters to keep
#   $add_len - extra word characters allowed so a word is not cut
#              (default 10; a false value also selects the default)
#   $where   - which part to drop: 'left', 'center' or 'right' (default)
#
# Returns the shortened string with " ...", " ... " or "... " standing in
# for the dropped part, or the to_utf8() form of the whole string when
# chopping would not shorten it or the string cannot be split as requested.
sub chop_str {
        my $str = shift;
        my $len = shift;
        my $add_len = shift || 10;
        my $where = shift || 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # allow only $len chars, but don't cut a word if it would fit in $add_len
        # if it doesn't fit, cut it if it's still longer than the dots we would add

        # when chopping in the middle, distribute $len into left and right part
        # return early if chopping wouldn't make string shorter
        if ($where eq 'center') {
                return $str if ($len + 5 >= length($str)); # filler is length 5
                $len = int($len/2);
        } else {
                return $str if ($len + 4 >= length($str)); # filler is length 4
        }

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        # Every match below is checked.  A failed match (the remainder is
        # shorter than $len after a greedy left part, or the string contains
        # a newline that "." cannot cross) would otherwise leave stale
        # capture variables behind and yield a result longer than the input.
        # In that case the string is returned unchopped.
        if ($where eq 'left') {
                my ($lead, $body) = $str =~ m/^(.*?)($begre)$/
                        or return $str;
                if (length($lead) > 4) {
                        $lead = " ...";
                }
                return "$lead$body";

        } elsif ($where eq 'center') {
                my ($left, $rest) = $str =~ m/^($endre)(.*)$/
                        or return $str;
                my ($mid, $right) = $rest =~ m/^(.*?)($begre)$/
                        or return $str;
                if (length($mid) > 5) {
                        $mid = " ... ";
                }
                return "$left$mid$right";

        } else {
                my ($body, $tail) = $str =~ m/^($endre)(.*)$/
                        or return $str;
                if (length($tail) > 4) {
                        $tail = "... ";
                }
                return "$body$tail";
        }
}
1625
# takes the same arguments as chop_str, but also wraps a <span> around the
# result with a title attribute if it does get chopped. Additionally, the
# string is HTML-escaped.
#
# The title attribute carries the full string with every control character
# replaced by "?".
sub chop_and_escape_str {
        my ($str) = @_;

        my $chopped = chop_str(@_);
        # chop_str() returns the to_utf8() form of the string.  Convert the
        # original the same way so the comparison is like-for-like and the
        # title attribute gets the converted text as well.
        $str = to_utf8($str);
        if ($chopped eq $str) {
                return esc_html($chopped);
        } else {
                $str =~ s/[[:cntrl:]]/?/g;
                return $cgi->span({-title=>$str}, esc_html($chopped));
        }
}
1640
1641## ----------------------------------------------------------------------
1642## functions returning short strings
1643
# CSS class for given age value (in seconds):
# "noage" when undefined, "age0" below two hours, "age1" below two days,
# "age2" otherwise.
sub age_class {
        my $age = shift;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1658
# convert age in seconds to "nn units ago" string
#
# The largest unit of which the age spans more than two is used, with the
# count truncated to a whole number.  Ages of two seconds or less give
# " right now" (including its leading space).
sub age_string {
        my $age = shift;

        # unit label, then the divisors that turn seconds into that unit,
        # applied one after another; ordered from largest unit to smallest
        my @units = (
                [ "years",  60, 60, 24, 365    ],
                [ "months", 60, 60, 24, 365/12 ],
                [ "weeks",  60, 60, 24, 7      ],
                [ "days",   60, 60, 24         ],
                [ "hours",  60, 60             ],
                [ "min",    60                 ],
                [ "sec"                        ],
        );

        foreach my $unit (@units) {
                my ($label, @divisors) = @$unit;

                my $seconds_per_unit = 1;
                $seconds_per_unit *= $_ foreach @divisors;
                next unless $age > $seconds_per_unit * 2;

                my $count = $age;
                $count /= $_ foreach @divisors;
                return int($count) . " $label ago";
        }

        return " right now";
}
1690
# Mode constants defined locally, alongside the ones imported from Fcntl.
# S_IFGITLINK holds the file-type bits tested by S_ISGITLINK() below.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference:
# true when the file-type bits of $mode equal S_IFGITLINK
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = $mode & S_IFMT();
        return $type_bits == S_IFGITLINK;
}
1702
# convert file mode in octal to symbolic file mode string
#
# The argument is a string of octal digits.  The result is a fixed
# ten-character string chosen by file type; for regular files only the
# owner-execute bit is looked at.
sub mode_str {
        my ($octal) = @_;
        my $mode = oct $octal;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1724
# convert file mode in octal to file type string
#
# An argument that is not made up solely of octal digits is returned as is.
# Otherwise the result is one of "submodule", "directory", "symlink",
# "file" or "unknown".
sub file_type {
        my $mode = shift;

        # not an octal mode: hand it back untouched
        return $mode unless $mode =~ m/^[0-7]+$/;

        my $bits = oct $mode;
        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "file"      if S_ISREG($bits);
        return "unknown";
}
1747
# convert file mode in octal to file type description string
#
# An argument that is not made up solely of octal digits is returned as is.
# Otherwise the result is one of "submodule", "directory", "symlink",
# "executable" (regular file with the owner-execute bit set), "file" or
# "unknown".
sub file_type_long {
        my $mode = shift;

        # not an octal mode: hand it back untouched
        return $mode unless $mode =~ m/^[0-7]+$/;

        my $bits = oct $mode;
        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "unknown"   unless S_ISREG($bits);

        return ($bits & S_IXUSR) ? "executable" : "file";
}
1774
1775
1776## ----------------------------------------------------------------------
1777## functions returning short HTML fragments, or transforming HTML fragments
1778## which don't belong to other sections
1779
# format line of commit message.
#
# The line is HTML-escaped (spaces become &nbsp;) and every standalone run
# of 8 to 40 hex digits is turned into a link to the "object" action for
# that hash.
sub format_log_line_html {
        my ($line) = @_;

        # build the link for one hash-like word
        my $object_link = sub {
                my $id = shift;
                return $cgi->a({-href => href(action=>"object", hash=>$id),
                                -class => "text"}, $id);
        };

        my $html = esc_html($line, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{$object_link->($1)}eg;

        return $html;
}
1792
# format marker of refs pointing to given object
#
# Parameters:
#   $refs - hash reference mapping an object id to an array reference of
#           ref names (e.g. "tags/v2.6.11", "heads/next"); a trailing
#           "^{}" on a name marks it as indirect
#   $id   - object id to look up
#
# Returns ' <span class="refs">...</span>' holding one linked <span> per
# ref, or the empty string when there are no refs for $id.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $stored_ref (@{$refs->{$id}}) {
                        # Work on a copy: the loop variable aliases the element
                        # of the caller's array, and the s/// below would
                        # otherwise strip the "^{}" marker from the caller's
                        # data, so a later call for the same id would no
                        # longer see the ref as indirect.
                        my $ref = $stored_ref;

                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name);
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        # the ref name becomes element content, which CGI does
                        # not escape for us, so escape it here
                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, esc_html($name));

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1852
# format, perhaps shortened and with markers, title line
#
# Produces a link to $href with class "list subject", followed by $extra
# (empty when not given).  When $short is shorter than $long, the link
# shows $short and carries $long, with control characters replaced by "?",
# as its title; otherwise the link shows $long and has no title.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my $label = $long;
        my @title_attr;
        if (length($short) < length($long)) {
                $long =~ s/[[:cntrl:]]/?/g;
                @title_attr = (-title => to_utf8($long));
                $label = $short;
        }

        return $cgi->a({-href => $href, -class => "list subject", @title_attr},
                       esc_html($label)) . $extra;
}
1868
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is keyed by email and shared by the avatar engines in this file
# (picon and gravatar), each of which decides what it stores per email.
# Since only one avatar engine is used for any given page, there's no risk
# for cache conflicts.
our %avatar_cache;
%avatar_cache = ();
1876
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
#
# The email is lowercased and split at "@" into user and domain; the
# finished URL is kept in %avatar_cache under the lowercased email.
sub picon_url {
        my $email = lc shift;

        $avatar_cache{$email} ||= do {
                my ($user, $domain) = split('@', $email);
                "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                "$domain/$user/" .
                "users+domains+unknown/up/single";
        };

        return $avatar_cache{$email};
}
1890
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
#
# The email is lowercased before hashing; $size is appended after "?s=".
sub gravatar_url {
        my ($address, $size) = @_;
        my $email = lc $address;

        unless ($avatar_cache{$email}) {
                my $digest = Digest::MD5::md5_hex($email);
                $avatar_cache{$email} = "http://www.gravatar.com/avatar/" . $digest . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1903
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
#
# Options:
#   -size       - key into %avatar_size (falls back to 'default')
#   -pad_before - when true, put "&nbsp;" in front of the image
#   -pad_after  - when true, put "&nbsp;" after the image
#
# Returns the <img> markup, or the empty string when $git_avatar names no
# known provider.
sub git_get_avatar {
        my ($email, %opts) = @_;
        my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
        my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

        # Other providers can be added by extending this chain, defining $url
        # as needed. If no variant puts something in $url, we assume avatars
        # are completely disabled/unavailable.
        my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
                : $git_avatar eq 'picon'    ? picon_url($email)
                :                             "";
        return "" unless $url;

        my $img = qq{<img width="$size" class="avatar" src="} .
                  esc_url($url) .
                  qq{" alt="" />};
        return $pre_white . $img . $post_white;
}
1932
# Wrap $displaytext in a link that searches for commits by $author.
#
# $searchtype is passed on as the search type; 'author' and 'committer'
# additionally select the verb used in the link title.  When the 'search'
# feature is off, $displaytext is returned as is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        # without the search feature there is nothing to link to
        return $displaytext unless gitweb_check_feature('search');

        my %verb_for = (
                'author'    => "authored",
                'committer' => "committed",
        );
        my $performed = exists $verb_for{$searchtype} ? $verb_for{$searchtype} : "";

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                        searchtext=>$author,
                        searchtype=>$searchtype), class=>"list",
                        title=>"Search for commits $performed by $author"},
                        $displaytext);
}
1955
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str).
#
# The result is <$tag class="author">...</$tag> around the author's avatar
# and name, passed through format_search_author().
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name   = $co->{'author_name'};
        my $author = chop_and_escape_str($name, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $inner  = format_search_author($name, "author", $avatar . $author);

        return "<$tag class=\"author\">" . $inner . "</$tag>";
}
1969
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# Everything after the "diff <kind> " prefix of $line is replaced by the
# escaped file name(s) taken from $from and $to, each linked with class
# "path" when the corresponding 'href' is set.  A true
# $diffinfo->{'nparents'} selects the combined-diff form, which shows only
# the "to" name; otherwise "a/<from> b/<to>" is shown.
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # link $text to $href when there is one, else leave it bare
        my $path_link = sub {
                my ($href, $text) = @_;
                return $href
                        ? $cgi->a({-href => $href, -class => "path"}, $text)
                        : $text;
        };

        if ($diffinfo->{'nparents'}) {
                # combined diff; no href means the file was deleted
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $path_link->($to->{'href'}, esc_path($to->{'file'}));
        } else {
                # "ordinary" diff; no href on the from side means the file
                # was added, none on the to side means it was deleted
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $path_link->($from->{'href'},
                                      'a/' . esc_path($from->{'file'}));
                $line .= ' ';
                $line .= $path_link->($to->{'href'},
                                      'b/' . esc_path($to->{'file'}));
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2005
# format extended diff header line, before patch itself
#
# Parameters:
#   $line     - one extended header line
#   $diffinfo - hash reference; 'nparents', 'from_id' and 'to_id' are read
#               ('from_id' is indexed per parent for a combined diff)
#   $from/$to - hash references with 'href' and 'file' ('href' of $from is
#               indexed per parent for a combined diff)
#
# Copy/rename lines get their path replaced by a link, a trailing six-digit
# mode gets a file type note appended, and the hashes of an "index" line
# are abbreviated to 7 characters and linked.  Returns the line followed
# by "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                       esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                $line = 'index ';
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        # the dots are escaped so only a literal ".." separator matches,
        # in line with the substitution further down
        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2071
# format from-file/to-file diff header
#
# Returns one <div class="diff from_file"> per from-file line (a single one
# for an ordinary diff, one per parent for a combined diff) followed by one
# <div class="diff to_file">.  File names are escaped and linked where the
# matching 'href' is set; "/dev/null" lines get no extra formatting.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my @divs;

        #assert($from_line =~ m/^---/) if DEBUG;
        if ($diffinfo->{'nparents'}) {
                # combined diff (merge commit)
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $row = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                # "<n>/<path>": <n> links to the diff against
                                # that parent, <path> to the parent's file
                                $row = '--- ' .
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1) .
                                        '/' .
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                        }
                        push @divs, qq!<div class="diff from_file">$row</div>\n!;
                }
        } else {
                # ordinary (single parent) diff
                my $row = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($row =~ m!^--- "?a/!) {
                        my $path = esc_path($from->{'file'});
                        $row = '--- a/' .
                                ($from->{'href'}
                                 ? $cgi->a({-href=>$from->{'href'}, -class=>"path"}, $path)
                                 : $path);
                }
                push @divs, qq!<div class="diff from_file">$row</div>\n!;
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        my $to_row = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($to_row =~ m!^\+\+\+ "?b/!) {
                my $path = esc_path($to->{'file'});
                $to_row = '+++ b/' .
                        ($to->{'href'}
                         ? $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $path)
                         : $path);
        }
        push @divs, qq!<div class="diff to_file">$to_row</div>\n!;

        return join('', @divs);
}
2137
# create note for patch simplified by combined diff
#
# Returns a "diff --cc <file>" header div followed by a "Simple merge"
# div.  The file name links to its blob unless is_deleted($diffinfo) is
# true.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $file = is_deleted($diffinfo)
                ? esc_path($diffinfo->{'to_file'})
                : $cgi->a({-href => href(action=>"blob",
                                         hash_base=>$hash,
                                         hash=>$diffinfo->{'to_id'},
                                         file_name=>$diffinfo->{'to_file'}),
                           -class => "path"},
                          esc_path($diffinfo->{'to_file'}));

        return "<div class=\"diff header\">" .
               "diff --cc " .
               $file .
               "</div>\n" . # class="diff header"
               "<div class=\"diff nodifferences\">" .
               "Simple merge" .
               "</div>\n"; # class="diff nodifferences"
}
2162
# format patch (diff) line (not to be used for diff headers)
#
# Parameters:
#   $line     - one line of patch text; a trailing newline is removed
#   $from/$to - optional hash references with 'href'; an array reference
#               in $from->{'href'} marks a combined diff
#
# Returns the line in <div class="diff ...">, the class reflecting the kind
# of line (add, rem, chunk_header, incomplete, or none).  Tabs are expanded
# with untabify().  In chunk headers the ranges link to the matching line
# of the from/to file where an href is known, and the trailing section text
# is escaped into <span class="section">; other lines are escaped whole.
sub format_diff_line {
        my ($line, $from, $to) = @_;

        chomp $line;

        my $linked = ($from && $to) ? 1 : 0;

        my $diff_class = "";
        if ($linked && ref($from->{'href'}) eq "ARRAY") {
                # combined diff: one status column per parent
                my $columns = substr($line, 0, scalar @{$from->{'href'}});
                $diff_class = $line    =~ m/^\@{3}/ ? " chunk_header"
                            : $line    =~ m/^\\/    ? " incomplete"
                            : $columns =~ tr/+/+/   ? " add"
                            : $columns =~ tr/-/-/   ? " rem"
                            :                         "";
        } else {
                # assume ordinary diff: the first character decides
                my %class_of = (
                        '+'  => " add",
                        '-'  => " rem",
                        '@'  => " chunk_header",
                        "\\" => " incomplete",
                );
                my $marker = substr($line, 0, 1);
                $diff_class = $class_of{$marker} if exists $class_of{$marker};
        }

        $line = untabify($line);

        if ($linked && $line =~ m/^\@{2} /) {
                # ordinary chunk header: "@@ -start[,count] +start[,count] @@section"
                my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
                        $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

                if ($from->{'href'}) {
                        $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
                                             -class=>"list"}, $from_text);
                }
                if ($to->{'href'}) {
                        $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                             -class=>"list"}, $to_text);
                }

                my $html = '<span class="chunk_info">@@ ' . $from_text . ' ' . $to_text . ' @@</span>' .
                           '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
                return "<div class=\"diff$diff_class\">$html</div>\n";
        }

        if ($linked && $line =~ m/^\@{3}/) {
                # combined chunk header: one range per parent, then the result range
                my ($marker, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

                my @range_text  = split(' ', $ranges);
                # start line of each range: the text after the sign up to the
                # first comma
                my @range_start = map {
                        my ($start) = (split(',', substr($_, 1)), 0);
                        $start;
                } @range_text;

                # the last range belongs to the result, the others to the parents
                my $to_text  = pop @range_text;
                my $to_start = pop @range_start;

                my $html = "<span class=\"chunk_info\">$marker ";
                foreach my $i (0 .. $#range_text) {
                        my $cell = $range_text[$i];
                        if ($from->{'href'}[$i]) {
                                $cell = $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
                                                 -class=>"list"}, $range_text[$i]);
                        }
                        $html .= $cell . " ";
                }
                if ($to->{'href'}) {
                        $html .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                          -class=>"list"}, $to_text);
                } else {
                        $html .= $to_text;
                }
                $html .= " $marker</span>" .
                         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
                return "<div class=\"diff$diff_class\">$html</div>\n";
        }

        return "<div class=\"diff$diff_class\">" . esc_html($line, -nbsp=>1) . "</div>\n";
}
2251
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
#
# The formats offered are those listed in @snapshot_fmts; their display
# names come from %known_snapshot_formats.
sub format_snapshot_links {
        my ($hash) = @_;

        # no formats at all: nothing to offer
        return undef unless @snapshot_fmts;

        if (@snapshot_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                # i.e. "_snapshot_"
                my ($fmt) = @snapshot_fmts;
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links;
        foreach my $fmt (@snapshot_fmts) {
                push @links, $cgi->a({
                        -href => href(
                                action=>"snapshot",
                                hash=>$hash,
                                snapshot_format=>$fmt
                        )
                }, $known_snapshot_formats{$fmt}{'display'});
        }
        return "snapshot (" . join(' ', @links) . ")";
}
2286
2287## ......................................................................
2288## functions returning values to be passed, perhaps after some
2289## transformation, to other functions; e.g. returning arguments to href()
2290
# Returns a hash of parameters to be passed to href() to generate the URL
# of a feed for the current view; the '-title' key carries a description
# of the link.  The optional argument is the feed format (default 'Atom'),
# which is lowercased to form the 'action'.
# Returns nothing when no project is selected or when the current action
# is one of the views that have no specific feed.
sub get_feed_info {
        my $format = shift || 'Atom';

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use the 'refs/heads/' prefix (fullname) to tell them
        # apart from tag links; $hash_base is consulted before $hash
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                next unless defined $ref;
                if ($ref =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $title;
        if (defined $file_name) {
                $title  = "history of $file_name";
                $title .= "/" if ($action eq 'tree');
                $title .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $title = "log of $branch";
        } else {
                $title = 'log';
        }

        my %feed = (action => lc($format));
        $feed{-title} = $title;
        $feed{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
        $feed{'file_name'} = $file_name;

        return %feed;
}
2326
2327## ----------------------------------------------------------------------
2328## git utility subroutines, invoking git commands
2329
# Returns, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Every call is counted in
# $number_of_git_cmds.
sub git_cmd {
        ++$number_of_git_cmds;
        my $git_dir_opt = '--git-dir=' . $git_dir;
        return ($GIT, $git_dir_opt);
}
2335
# Quote the given arguments for passing them to the shell: each argument is
# wrapped in single quotes, and every ' or ! inside it is closed out,
# backslash-escaped and reopened.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $word (@_) {
                # work on a copy so the caller's arguments stay untouched
                (my $escaped = $word) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }
        return join(' ', @quoted);
}
2344
# Get the HEAD ref of the given project as a full hash
# (thin wrapper around git_get_full_hash).
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2349
# Resolve a revision of a project to its hash; all arguments are handed
# unchanged to git_get_hash().
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2353
# Like git_get_full_hash(), but appends the '--short=7' option so that
# git_get_hash() asks rev-parse for an abbreviated hash.
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2357
# Run 'git rev-parse --verify -q [options] <hash>' inside the repository
# "$projectroot/$project" and return the first line of its output with the
# line ending removed, or undef if the command could not be started or
# printed nothing.
# The global $git_dir is pointed at the project for the duration of the
# call and put back afterwards, but only if it was defined beforehand.
sub git_get_hash {
        my ($project, $hash, @options) = @_;

        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        # git_cmd() must be called after $git_dir has been switched
        my @rev_parse = (git_cmd(), 'rev-parse',
                         '--verify', '-q', @options, $hash);

        my $resolved = undef;
        if (open my $pipe, '-|', @rev_parse) {
                $resolved = <$pipe>;
                if (defined $resolved) {
                        chomp $resolved;
                }
                close $pipe;
        }

        $git_dir = $saved_git_dir if (defined $saved_git_dir);
        return $resolved;
}
2374
# Get the type of the given object, as printed by 'git cat-file -t'.
# Returns nothing if the command cannot be started or if closing the pipe
# reports failure.
sub git_get_type {
        my ($object_id) = @_;

        my $pipe;
        unless (open $pipe, "-|", git_cmd(), "cat-file", '-t', $object_id) {
                return;
        }
        my $kind = readline($pipe);
        if (!close $pipe) {
                return;
        }
        chomp $kind;
        return $kind;
}
2385
# repository configuration cache, filled by git_get_project_config():
# $config_file is the "$git_dir/config" path the cache was loaded for
# (the cache is reloaded when it differs from the current one), and
# %config holds the parsed key => value(s) pairs.
our $config_file = '';
our %config;
2389
# Store $value under $key in the hash referenced by $hash, keeping
# multiple values for a single key as an anonymous array reference.
# A single value is stored directly in the hash, not as [ <value> ];
# the second value for a key turns the slot into [ <old>, <new> ], and
# further values are appended to that array.
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key} && ref $hash->{$key}) {
                # already a list of values: append
                push @{$hash->{$key}}, $value;
        } elsif (exists $hash->{$key}) {
                # second value for this key: promote to a list
                $hash->{$key} = [ $hash->{$key}, $value ];
        } else {
                # first value for this key
                $hash->{$key} = $value;
        }
}
2403
# Return a hash of the git project configuration, as listed by
# 'git config -z -l', optionally limited to some section, e.g. 'gitweb'.
#
# $section_regexp, when defined, is a regexp fragment; only keys matching
# /^(?:$section_regexp)\./ are kept.  Keys that occur more than once get
# their values collected into an array reference (see hash_set_multi);
# a key listed without a value is stored with an undefined value.
# Returns nothing if the git command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  (The /o modifier would
        # compile it once per process instead, silently reusing the first
        # section ever requested for all later calls.)
        my $section_re = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # with -z each "key\nvalue" entry is terminated by a NUL character
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                my ($key, $value) = split(/\n/, $keyval, 2);

                hash_set_multi(\%config, $key, $value)
                        if (!defined $section_re || $key =~ $section_re);
        }
        close $fh;

        return %config;
}
2426
# Convert a config value to a Perl boolean.
# No value at all (undef), a number > 0, 'true' and 'yes' (in any case)
# are true; all other values are treated as false (never as an error).
# Leading and trailing whitespace is ignored.
sub config_to_bool {
        my ($val) = @_;

        # section.key (present, but without a value)
        return 1 unless defined $val;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        # section.key = 1
        my $nonzero_number = ($val =~ /^\d+$/ && $val);

        # section.key = true
        return ($nonzero_number || ($val =~ /^(?:true|yes)$/i));
}
2442
# Convert a config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (in any case) will cause
# the value to be multiplied by 1024, 1048576, or 1073741824.
# Leading and trailing whitespace is ignored.  A value that does not look
# like "<digits><suffix>" is returned as is (after whitespace stripping);
# an undefined value (key present without a value) is returned as undef.
sub config_to_int {
        my $val = shift;

        # key without a value: nothing to convert (and nothing to strip)
        return $val unless defined $val;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
                my %factor_for = (
                        'k' =>       1024,
                        'm' =>    1048576,
                        'g' => 1073741824,
                );
                # a bare suffix such as "k" has no digits; count it as 0
                return ($num || 0) * $factor_for{lc($unit)};
        }
        return $val;
}
2462
# Convert a config value to an array reference, if needed:
# a reference is returned unchanged, a defined plain value is wrapped
# as [ <value> ], and an undefined value gives an empty array reference.
sub config_to_multi {
        my ($val) = @_;

        return $val     if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2469
# Look up the 'gitweb.<key>' variable in the configuration of the current
# repository ($git_dir).
#
# $key  - variable name, with or without the 'gitweb.' prefix; it must
#         consist of word characters only
# $type - optional 'bool' or 'int' (a leading '--' is accepted); any
#         other type is ignored
#
# The 'gitweb' section is parsed once per repository and cached in %config,
# with $config_file remembering which repository the cache belongs to.
# Returns nothing when $git_dir is not set, the key is invalid, or the
# variable does not exist.  For 'bool' the result is the string 'true' or
# 'false'; for 'int' it is the value run through config_to_int().
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # (re)load the cache if it belongs to another repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        return unless exists $config{$full_key};

        # ensure given type
        if (defined $type && $type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return config_to_bool($config{$full_key}) ? 'true' : 'false';
        }
        if (defined $type && $type eq 'int') {
                return config_to_int($config{$full_key});
        }
        return $config{$full_key};
}
2508
# Get the hash of the entry at the given path in the given tree-ish,
# using 'git ls-tree <base> -- <path>'.
#
# $base - tree-ish (ref) to look in
# $path - path of the entry; trailing slashes are ignored
# $type - optional object type ('blob', 'tree', ...) the entry must have
#
# Returns undef when no path is given, when nothing exists at that path,
# when ls-tree fails or prints a line that cannot be parsed, or when the
# entry is not of the requested type.  Calls die_error() if git cannot be
# started.
sub git_get_hash_by_path {
        my ($base, $path, $type) = @_;

        # test for emptiness rather than truth: "0" is a valid file name
        return undef unless (defined $path && $path ne '');

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        if ($line !~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                # unexpected output; do not rely on captures of an older match
                return undef;
        }
        my ($entry_type, $entry_hash) = ($2, $3);
        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2535
# Get the path of the entry with the given hash in the given tree-ish (ref),
# by scanning the output of 'git ls-tree -r -t -z <base>' for the first
# entry carrying that hash.
# Used to get the 'from' filename for combined diff (merge commit) for renames.
# Returns nothing if $base or $hash is missing, undef if git cannot be
# started or no entry matches.
sub git_get_path_by_hash {
        my ($base, $hash) = @_;
        return unless $base;
        return unless $hash;

        # entries are NUL-terminated because of -z
        local $/ = "\0";

        my $fd;
        open($fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base)
                or return undef;

        my $found;
        while (my $entry = <$fd>) {
                chomp $entry;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                next unless ($entry =~ m/(?:[0-9]+) (?:.+) $hash\t(.+)$/);
                $found = $1;
                last;
        }
        close $fd;
        return $found;
}
2559
2560## ......................................................................
2561## git utility functions, directly accessing git repository
2562
# Return the description of the project at "$projectroot/$path": the first
# line of its 'description' file (without the line ending), or, when that
# file cannot be opened, the 'gitweb.description' config variable.
# Side effect: sets the global $git_dir to the project's repository.
sub git_get_project_description {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        if (!open $fd, '<', "$git_dir/description") {
                return git_get_project_config('description');
        }
        my $descr = readline($fd);
        close $fd;

        chomp $descr if (defined $descr);
        return $descr;
}
2576
# Read the content tags of the project at "$projectroot/$path".
# Every plain file in the repository's 'ctags' directory is one tag: the
# file name is the tag name and the first line of the file is its value.
# Returns a hash reference (tag name => value), empty if the directory
# cannot be opened.  Files that cannot be opened are skipped.
# Side effect: sets the global $git_dir to the project's repository.
sub git_get_project_ctags {
        my ($path) = @_;
        my %value_of;

        $git_dir = "$projectroot/$path";
        my $ctags_dir = "$git_dir/ctags";

        opendir(my $dh, $ctags_dir)
                or return \%value_of;
        foreach my $entry (readdir($dh)) {
                my $tag_file = "$ctags_dir/$entry";
                next unless (-f $tag_file);

                open(my $ct, '<', $tag_file) or next;
                my $val = <$ct>;
                chomp $val;
                close $ct;

                # the tag name is the file's basename
                (my $tag_name = $tag_file) =~ s#.*/##;
                $value_of{$tag_name} = $val;
        }
        closedir $dh;
        return \%value_of;
}
2595
# Turn a hash reference of content tags (tag => count) into a tag cloud.
#
# Tags differing only in case are merged under their lowercased name;
# 'count' is the sum of their counts and 'topname' is the spelling with
# the highest individual count ('topcount').
#
# If the HTML::TagCloud module can be loaded, an HTML::TagCloud object is
# returned, with every tag linking to "$home_link?by_tag=<lowercased tag>".
# Otherwise the merged hash itself is returned by reference.
sub git_populate_project_tagcloud {
        my ($ctags) = @_;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $merged = ($ctags_lc{lc $tag} ||= {});

                $merged->{count} += $weight;
                unless ($merged->{topcount}
                        and $merged->{topcount} >= $weight) {
                        $merged->{topcount} = $weight;
                        $merged->{topname} = $tag;
                }
        }

        # without HTML::TagCloud, hand back the plain data
        unless (eval { require HTML::TagCloud; 1; }) {
                return \%ctags_lc;
        }

        my $cloud = HTML::TagCloud->new;
        foreach my $lc_tag (sort keys %ctags_lc) {
                my $info = $ctags_lc{$lc_tag};
                # Pad the title with spaces so that the cloud looks
                # less crammed.
                my $title = $info->{topname};
                $title =~ s/ /&nbsp;/g;
                $title =~ s/^/&nbsp;/g;
                $title =~ s/$/&nbsp;/g;
                $cloud->add($title, "$home_link?by_tag=$lc_tag", $info->{count});
        }
        return $cloud;
}
2627
# Render a tag cloud produced by git_populate_project_tagcloud() as HTML.
#
# $cloud - either an HTML::TagCloud object or a hash reference of
#          lowercased tag => { count => ..., topname => ... }
# $count - maximum number of tags to show
#
# For an HTML::TagCloud object its html_and_css($count) output is returned.
# For the plain hash a centered paragraph of comma-separated links to
# "$home_link?by_tag=<tag>" is returned, labelled with each tag's 'topname'.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                # NOTE(review): tags are sorted by ascending count, so the
                # $count tags kept are the least used ones -- confirm that
                # this is intended.
                my @tags = sort { $cloud->{$a}->{count} <=> $cloud->{$b}->{count} } keys %$cloud;
                return '<p align="center">' . join (', ', map {
                        $cgi->a({-href=>"$home_link?by_tag=$_"}, $cloud->{$_}->{topname})
                } splice(@tags, 0, $count)) . '</p>';
        }
}
2640
# Return the clone URLs of the project at "$projectroot/$path": the lines
# of its 'cloneurl' file (line endings removed), or, when that file cannot
# be opened, the value(s) of the 'gitweb.url' config variable.
# In list context the URLs are returned as a list, otherwise as an array
# reference.
# Side effect: sets the global $git_dir to the project's repository.
sub git_get_project_url_list {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $urls;
        if (open my $fd, '<', "$git_dir/cloneurl") {
                my @lines = <$fd>;
                close $fd;
                chomp @lines;
                $urls = \@lines;
        } else {
                $urls = config_to_multi(git_get_project_config('url'));
        }

        return wantarray ? @$urls : $urls;
}
2654
# Return the list of projects as a list of hash references.
#
# $filter - optional path prefix (a trailing '.git' is removed); when set,
#           only projects below that prefix are considered (used when
#           looking for forks of a project)
#
# Where the projects come from depends on what $projects_list is:
#  * a directory: it is scanned with File::Find and every directory
#    accepted by check_export_ok() becomes { path => ... };
#  * a plain file: each line holds a URL-encoded project path and owner,
#    and every accepted project becomes { path => ..., owner => ... }.
# If $projects_list is neither, the list is empty.  Returns nothing if
# the project list file cannot be opened.
sub git_get_projects_list {
        my ($filter) = @_;
        my @list;

        $filter ||= '';
        $filter =~ s/\.git$//;

        my $check_forks = gitweb_check_feature('forks');

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list . ($filter ? "/$filter" : '');
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                # length and depth (number of slashes) of the starting
                # directory, used to make the found names relative to it
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                # path relative to the starting directory
                                my $subdir = substr($File::Find::name, $pfxlen + 1);
                                # we check related file in $projectroot
                                my $path = ($filter ? "$filter/" : '') . $subdir;
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        # do not descend into a repository
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                # paths (without '.git') of the projects listed so far,
                # used below to recognize forks of those projects
                my %paths;
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next;
                        }
                        if ($filter ne '') {
                                # looking for forks;
                                # keep only "<filter>/<something>.git"
                                my $pfx = substr($path, 0, length($filter));
                                if ($pfx ne $filter) {
                                        next PROJECT;
                                }
                                my $sfx = substr($path, length($filter));
                                if ($sfx !~ /^\/.*\.git$/) {
                                        next PROJECT;
                                }
                        } elsif ($check_forks) {
                        PATH:
                                # this $filter is a new lexical that hides the
                                # function's $filter inside the loop
                                foreach my $filter (keys %paths) {
                                        # looking for forks;
                                        my $pfx = substr($path, 0, length($filter));
                                        if ($pfx ne $filter) {
                                                next PATH;
                                        }
                                        my $sfx = substr($path, length($filter));
                                        if ($sfx !~ /^\/.*\.git$/) {
                                                next PATH;
                                        }
                                        # is a fork, don't include it in
                                        # the list
                                        next PROJECT;
                                }
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                                # remember the path without '.git' so that
                                # later lines can be matched against it
                                (my $forks_path = $path) =~ s/\.git$//;
                                $paths{$forks_path}++;
                        }
                }
                close $fd;
        }
        return @list;
}
2757
# Cache of project owners read from the $projects_list file, as a hash
# reference (project path => owner); undef until the first call of
# git_get_project_list_from_file().
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list file, if that is a
# plain file.  Does nothing when the cache has already been initialized.
# If the file cannot be opened the cache is left empty; blank lines are
# skipped.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # the file may exist and still be unreadable
                open(my $fd, '<', $projects_list)
                        or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # a blank line carries no project path
                        next unless (defined $pr);
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
        return;
}
2780
# Return the owner of the given project, or undef if no project is given.
# The sources are tried in this order until one yields a defined value:
#   1. the owner listed in the $projects_list file (cached in
#      $gitweb_project_owner),
#   2. the 'gitweb.owner' config variable of the repository,
#   3. get_file_owner() of the repository directory.
# Side effect: sets the global $git_dir to the project's repository.
sub git_get_project_owner {
        my ($project) = @_;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # load the owners cache on first use
        git_get_project_list_from_file()
                unless (defined $gitweb_project_owner);

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if (exists $gitweb_project_owner->{$project});
        $owner = git_get_project_config('owner')
                unless (defined $owner);
        $owner = get_file_owner("$git_dir")
                unless (defined $owner);

        return $owner;
}
2804
# Return (age in seconds, age as human-readable string) of the most
# recently committed branch head of the project at "$projectroot/$path",
# taken from the committer line printed by 'git for-each-ref' for
# refs/heads.
# Returns nothing if the command cannot be started or fails, and
# (undef, undef) if its output holds no timestamp.
# Side effect: sets the global $git_dir to the project's repository.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @for_each_ref = (git_cmd(), 'for-each-ref',
                            '--format=%(committer)',
                            '--sort=-committerdate',
                            '--count=1',
                            'refs/heads');

        my $fd;
        open($fd, "-|", @for_each_ref) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the committer line ends in "<epoch> <timezone>"
        unless (defined $most_recent &&
                $most_recent =~ / (\d+) [-+][01]\d\d\d$/) {
                return (undef, undef);
        }
        my $age = time - $1;
        return ($age, age_string($age));
}
2825
# Return the remotes of the current repository, as listed by
# 'git remote -v': a hash (in list context) or hash reference (otherwise)
# mapping each remote name to { 'heads' => undef, <kind> => <url>, ... },
# where <kind> is the word printed in parentheses after the URL.
# If $wanted is given, only the remote with that name is returned.
# Returns nothing if the command cannot be started or fails.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find if that
# particular remote is defined is to walk the list provided by 'git remote
# -v' and stop if and when we find what we want.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # check open's return value: the handle variable is set even
        # when open fails, so testing $fd cannot detect the failure
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # "<name>\t<url> (<kind>)": strip everything after the name,
                # skipping lines that do not have this shape
                next unless ($remote =~ s!\t(.*?)\s+\((\w+)\)$!!);
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # 'heads' stays undefined here; fill_remote_heads() sets it
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
2850
# Takes a reference to a hash of remotes (remote name => data hash) and
# fills it by setting the 'heads' entry of each remote to an array
# reference of the heads that git_get_heads_list() reports for it.
# The "<remote>/" prefix is removed from the 'name' of every head
# assigned to a remote; the head hashes are modified in place.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # the substitution both selects the heads of this remote
                # and strips the prefix; the remote name is quoted so that
                # characters such as '.' or '+' in it are matched literally
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
2863
# Return a hash reference mapping object hashes to array references of the
# ref names (without the leading 'refs/') that 'git show-ref --dereference'
# lists for them.  The optional $type (e.g. 'heads', 'tags') limits the
# listing to "refs/$type".
# Returns nothing if the command cannot be started or fails.
sub git_get_references {
        my $type = shift || "";
        my %names_for;

        my @show_ref = (git_cmd(), "show-ref", "--dereference");
        # use -- <pattern> if $type
        push @show_ref, "--", "refs/$type" if ($type);

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open(my $fd, "-|", @show_ref)
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless ($line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!);
                my ($id, $name) = ($1, $2);
                push @{$names_for{$id}}, $name;
        }
        close $fd or return;
        return \%names_for;
}
2886
# Return the tag-based name that 'git name-rev --tags' gives to $hash
# (the part after 'tags/'), or undef if no hash is given, the command
# prints nothing, or the revision cannot be described by a tag.
# Returns nothing if the command cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all (e.g. the command failed)
        return undef unless (defined $name_rev);

        # $hash is quoted so that it is matched literally
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
2902
2903## ----------------------------------------------------------------------
2904## parse to hash functions
2905
# Break an epoch timestamp down into a hash of date parts and formatted
# date strings.
#
# $epoch - seconds since the epoch
# $tz    - timezone as "+hhmm" or "-hhmm" (default "-0000")
#
# Keys computed in UTC: 'hour', 'minute', 'mday', 'day', 'month',
# 'rfc2822', 'mday-time', 'iso-8601'.
# Keys computed in the given timezone: 'hour_local', 'minute_local',
# 'iso-tz'; 'tz_local' is the timezone string itself.
sub parse_date {
        my ($epoch, $tz) = @_;
        $tz ||= "-0000";

        my @month_names = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @day_names = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");

        # UTC part
        my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
        my %date = (
                'hour'      => $hour,
                'minute'    => $min,
                'mday'      => $mday,
                'day'       => $day_names[$wday],
                'month'     => $month_names[$mon],
                'rfc2822'   => sprintf("%s, %d %s %4d %02d:%02d:%02d +0000",
                                       $day_names[$wday], $mday, $month_names[$mon],
                                       1900+$year, $hour ,$min, $sec),
                'mday-time' => sprintf("%d %s %02d:%02d",
                                       $mday, $month_names[$mon], $hour ,$min),
                'iso-8601'  => sprintf("%04d-%02d-%02dT%02d:%02d:%02dZ",
                                       1900+$year, 1+$mon, $mday, $hour ,$min, $sec),
        );

        # local part: shift the epoch by the timezone offset, then break
        # the shifted time down as if it were UTC
        my ($tz_sign, $tz_hour, $tz_min) =
                ($tz =~ m/^([-+])(\d\d)(\d\d)$/);
        my $direction = ($tz_sign eq '-' ? -1 : +1);
        my $local = $epoch + $direction*((($tz_hour*60) + $tz_min)*60);
        ($sec, $min, $hour, $mday, $mon, $year) = gmtime($local);

        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
2939
# Parse the tag object $tag_id, read with 'git cat-file tag', into a hash:
#   'id'                         - $tag_id itself
#   'object', 'type', 'name'     - from the 'object', 'type', 'tag' headers
#   'author', 'author_epoch', 'author_tz', 'author_name', 'author_email'
#                                - from the 'tagger' header
#   'comment'                    - array reference of the remaining lines
# Header parsing stops at the first empty line, or at a line containing
# '--BEGIN', which is kept as the first line of the comment.
# Returns nothing if the command cannot be started or fails, or if the
# object has no 'tag' header.
sub parse_tag {
        my ($tag_id) = @_;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

        my %tag = ('id' => $tag_id);
        my @comment;

        HEADER:
        while (my $line = <$fd>) {
                chomp $line;
                # an empty line ends the headers
                last HEADER if ($line eq "");

                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                } elsif ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                } elsif ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                } elsif ($line =~ m/--BEGIN/) {
                        push @comment, $line;
                        last HEADER;
                }
        }

        # everything that is left belongs to the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless (defined $tag{'name'});
        return %tag;
}
2980
# Parse the text of a single commit into a hash.
#
# $commit_text - one record as read by parse_commit() from
#                'git rev-list --parents --header': a first line with the
#                commit id (optionally followed by parent ids), the commit
#                headers, an empty line and the indented commit message
# $withparents - if defined, the parents are taken from the first line
#                only; otherwise 'parent' header lines are added as well
#
# Returns nothing if the text is empty, does not start with a 40-digit
# hexadecimal id, or has no 'tree' header.  Otherwise the hash holds 'id',
# 'tree', 'parents' (array reference), 'parent' (first parent), the
# author_*/committer_* fields, 'title', 'title_short', 'comment' (array
# reference of message lines) and the age_* fields.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        # first line: "<id> [<parent id>...]"
        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # Consume the header lines.  The loop ends at the first line that is
        # false as a string, i.e. the empty line separating headers from the
        # message; that line is removed from @commit_lines as well.
        while (my $line = shift @commit_lines) {
                # NOTE(review): the lines come from split on newline, so this
                # comparison looks like it can never be true -- confirm
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # The title is the first non-empty message line.
        # NOTE(review): $title aliases the elements of @commit_lines, so the
        # substitutions below also change the line stored in 'comment'.
        foreach my $title (@commit_lines) {
                $title =~ s/^    //;
                if ($title ne "") {
                        $co{'title'} = chop_str($title, 80, 5);
                        # remove leading stuff of merges to make the interesting part visible
                        if (length($title) > 50) {
                                $title =~ s/^Automatic //;
                                $title =~ s/^merge (of|with) /Merge ... /i;
                                if (length($title) > 50) {
                                        $title =~ s/(http|rsync):\/\///;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/(master|www|rsync)\.//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/kernel.org:?//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/\/pub\/scm//;
                                }
                        }
                        $co{'title_short'} = chop_str($title, 50, 5);
                        last;
                }
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        # age is measured from the committer date
        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # commits older than two weeks get the calendar date as
        # 'age_string_date' and the relative age as 'age_string_age';
        # for newer commits the two are swapped
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3078
# Parse the single commit named by $commit_id.
# Runs "git rev-list --parents --header --max-count=1" and feeds its
# output to parse_commit_text(); the resulting hash is returned as a list.
# Calls die_error(500, ...) if the pipe to git-rev-list cannot be opened.
sub parse_commit {
        my ($commit_id) = @_;

        # records are read NUL-separated ("\0" as input record separator)
        local $/ = "\0";

        my @rev_list_args = (
                "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--",
        );
        open my $fd, "-|", git_cmd(), @rev_list_args
                or die_error(500, "Open git-rev-list failed");
        # the handle is read in list context; the trailing 1 becomes the
        # argument after the record(s) (presumably the "with parents" flag
        # of parse_commit_text -- its definition is not visible here)
        my %co = parse_commit_text(<$fd>, 1);
        close $fd;

        return %co;
}
3097
# Parse a range of commits reachable from $commit_id.
#   $maxcount - value for --max-count (false => 1)
#   $skip     - value for --skip (false => 0)
#   $filename - optional path limiter, placed after "--"
#   @args     - extra rev-list options, placed right after --header
# The global @extra_options is also passed to git-rev-list.
# Returns one hash reference per record (as produced by
# parse_commit_text): a list in list context, an array reference otherwise.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount = 1 unless $maxcount;
        $skip     = 0 unless $skip;

        # records are read NUL-separated
        local $/ = "\0";

        my @path_limit = $filename ? ($filename) : ();
        open my $fd, "-|", git_cmd(), "rev-list",
                "--header",
                @args,
                "--max-count=$maxcount",
                "--skip=$skip",
                @extra_options,
                $commit_id,
                "--",
                @path_limit
                or die_error(500, "Open git-rev-list failed");

        my @commits;
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @commits, \%co;
        }
        close $fd;

        return \@commits unless wantarray;
        return @commits;
}
3125
# Parse one line of git-diff-tree "raw" output into a hash.
# Three line shapes are recognised; anything else gives an empty hash:
#   * ordinary diff line  -> from_mode, to_mode, from_id, to_id, status,
#                            similarity, from_file, to_file (and 'file'
#                            unless the status is R or C)
#   * combined diff line  -> nparents, from_mode/from_id (array refs, one
#                            entry per parent), to_mode, to_id,
#                            status (array ref of letters), to_file
#   * bare 40-hex line    -> commit
# Returns the hash in list context, a reference to it otherwise.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if (my @field = $line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                my $paths = pop @field;
                @res{qw(from_mode to_mode from_id to_id status similarity)} = @field;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') {
                        # renamed or copied: "<from>\t<to>"
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif (my ($colons, $modes, $ids, $letters, $path) =
               $line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
                $res{'nparents'} = length($colons);
                # the last mode / id on the line belongs to the result
                my @mode_list = split(' ', $modes);
                $res{'to_mode'}   = pop @mode_list;
                $res{'from_mode'} = \@mode_list;
                my @id_list = split(' ', $ids);
                $res{'to_id'}   = pop @id_list;
                $res{'from_id'} = \@id_list;
                $res{'status'}  = [ split('', $letters) ];
                $res{'to_file'} = unquote($path);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif (my ($commit) = $line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $commit;
        }

        return %res if wantarray;
        return \%res;
}
3164
# Wrapper around parse_difftree_raw_line(): accepts either a raw
# git-diff-tree line or already-parsed info and returns the parsed form.
sub parsed_difftree_line {
        my ($input) = @_;

        # a hash reference is pre-parsed (or hand-built) info: pass it through
        return $input if ref($input) eq "HASH";

        return parse_difftree_raw_line($input);
}
3177
# Parse one line of git-ls-tree output.
# Options (passed as key => value pairs after the line):
#   -l  the line carries an object size column ("git ls-tree -l")
#   -z  the name is taken verbatim instead of being run through unquote()
# On success the result has the keys mode, type, hash, name (plus size
# with -l).  A line that does not match the expected layout yields an
# empty hash; previously the unchecked match leaked stale $1..$5 values
# from an earlier successful match into the result.
# Returns the hash in list context, a reference to it otherwise.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        my @field;
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                @field = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                @field = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;
        }

        if (@field) {
                # name is always the last capture; size (if any) precedes it
                my $name = pop @field;
                @res{qw(mode type hash)} = @field[0 .. 2];
                $res{'size'} = $field[3] if $opts{'-l'};
                $res{'name'} = $opts{'-z'} ? $name : unquote($name);
        }

        return wantarray ? %res : \%res;
}
3213
# Fill in _two_ hashes, passed by reference as 2nd and 3rd argument:
# $from and $to each receive a 'file' entry and, where the file exists
# on that side, an 'href' entry linking to the blob view.
# For a combined diff ($diffinfo->{'nparents'} is true) the $from entries
# are array references with one element per parent, and @parents supplies
# the hash_base for each link; otherwise the global $hash_parent is used.
# The $to link always uses the global $hash as hash_base.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") {
                        # new (added) file: nothing to link to on the "from" side
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the result name when this parent has no own name
                        my $parent_file = $diffinfo->{'from_file'}[$i];
                        $parent_file = $diffinfo->{'to_file'}
                                unless defined $parent_file;
                        $from->{'file'}[$i] = $parent_file;

                        if ($diffinfo->{'status'}[$i] eq "A") {
                                # file was added relative to this parent
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3259
3260## ......................................................................
3261## parse to array of hashes functions
3262
# List refs under refs/<class> for each class in @classes (default:
# 'heads'), newest committer date first, via git-for-each-ref.
# If $limit is true, at most $limit+1 refs are requested.
# Each entry is a hash ref with the keys fullname, name, id, title,
# epoch and age.  Returns a list in list context, an array reference
# otherwise; returns nothing if the pipe cannot be opened.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @headslist;

        my @count_opt = $limit ? ('--count=' . ($limit + 1)) : ();
        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count_opt, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # "<ref info>\0<committer ident> <epoch> <tz>"
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $fullname, $title) = split(' ', $refinfo, 3);
                my (undef, $epoch) = ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

                # short name: strip the refs/heads/ or refs/remotes/ prefix
                (my $name = $fullname) =~ s!^refs/(?:head|remote)s/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'name'     => $name,
                        'id'       => $hash,
                        'title'    => $title || '(no commit message)',
                        'epoch'    => $epoch,
                );
                if ($epoch) {
                        $ref_item{'age'} = age_string(time - $epoch);
                } else {
                        $ref_item{'age'} = "unknown";
                }

                push @headslist, \%ref_item;
        }
        close $fd;

        return \@headslist unless wantarray;
        return @headslist;
}
3301
# List refs under refs/tags, newest creator date first, via
# git-for-each-ref.  If $limit is true, at most $limit+1 refs are requested.
# Each entry is a hash ref with fullname, name, type, id, reftype and
# refid; tag objects additionally get 'subject', and tag or commit
# entries get 'epoch' and 'age'.
# Returns a list in list context, an array reference otherwise; returns
# nothing if the pipe cannot be opened.
sub git_get_tags_list {
        my ($limit) = @_;
        my @tagslist;

        my @count_opt = $limit ? ('--count=' . ($limit + 1)) : ();
        my $format_opt =
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)';
        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count_opt, '--sort=-creatordate',
                $format_opt,
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # "<ref info>\0<creator ident> <epoch> <tz>"
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $fullname, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my (undef, $epoch) = ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

                (my $name = $fullname) =~ s!^refs/tags/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'type'     => $type,
                        'id'       => $id,
                        'name'     => $name,
                );

                my $is_tag_object = ($type eq "tag");
                if ($is_tag_object) {
                        # tag object: record what it points at
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # the ref points directly at the object
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($is_tag_object || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = $epoch
                                ? age_string(time - $epoch)
                                : "unknown";
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return \@tagslist unless wantarray;
        return @tagslist;
}
3350
3351## ----------------------------------------------------------------------
3352## filesystem-related functions
3353
# Return the owner of $path as a UTF-8 string: the GECOS field of the
# owning user's passwd entry, truncated at the first ',' or ';'.
# Returns undef when $path cannot be stat()ed or the uid has no GECOS
# information.  (Without the stat check a failed stat() left the uid
# undefined, which getpwuid() treats as 0, reporting root's name as the
# owner of a nonexistent path.)
sub get_file_owner {
        my $path = shift;

        my $st_uid = (stat($path))[4];
        return undef unless defined $st_uid;

        my $gcos = (getpwuid($st_uid))[6];
        return undef unless defined $gcos;

        (my $owner = $gcos) =~ s/[,;].*$//;
        return to_utf8($owner);
}
3366
# Print the contents of $filename to the currently selected output
# handle, passing each line through to_utf8().
# The file is expected to exist, but if it cannot be opened (for example
# it became unreadable after the caller checked it) nothing is printed,
# instead of reading from an unopened handle.
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        while (my $line = <$fd>) {
                print to_utf8($line);
        }
        close $fd;
}
3375
3376## ......................................................................
3377## mimetype related functions
3378
# Look up the MIME type for $filename's extension (the text after the
# last '.') in the mime.types-style file $mimemap.
# Each non-comment line of the map is "<mimetype> <ext> <ext> ...";
# fields may be separated by any run of whitespace (tabs or spaces), so
# space-separated entries are recognised as well as tab-separated ones.
# When an extension is listed more than once the last entry wins.
# Returns undef if the map is unreadable, $filename has no extension, or
# the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # take the extension from the match itself; reading $1 after an
        # unchecked match could pick up a stale capture
        my ($ext) = $filename =~ /\.([^.]*)$/
                or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        while (my $entry = <$mh>) {
                next if $entry =~ m/^#/; # skip comments
                # split(' ') ignores leading whitespace and the trailing newline
                my ($mimetype, @exts) = split(' ', $entry);
                next unless defined $mimetype;
                foreach my $known_ext (@exts) {
                        $mimemap{$known_ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$ext};
}
3401
# Guess the MIME type of $filename from its extension.
# The map named by the global $mimetypes_file is consulted first (a
# relative path is taken relative to the project directory), then
# /etc/mime.types.  Returns undef for names without a '.' or when no
# map yields a type.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # a relative path is relative to the project
                my $map_path = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $map_path);
        }
        $mime = mimetype_guess_file($filename, '/etc/mime.types')
                unless $mime;
        return $mime;
}
3418
# Determine the MIME type of a blob.
#   $fd       - filehandle of the blob contents (may be false)
#   $filename - name of the blob (may be false)
# Order of precedence: mimetype_guess() on the name; the global
# $default_blob_plain_mimetype when there is no handle; 'text/plain' if
# -T reports text; a few image types by extension; otherwise
# 'application/octet-stream'.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;

        # binary content: recognise the common image extensions
        if ($filename) {
                return 'image/png'  if $filename =~ m/\.png$/i;
                return 'image/gif'  if $filename =~ m/\.gif$/i;
                return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        }
        return 'application/octet-stream';
}
3445
# Build the Content-Type value for a blob.
# $type, if true, is used as the MIME type; otherwise blob_mimetype()
# decides.  For 'text/plain' the charset from the global
# $default_text_plain_charset is appended when that global is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless $type eq 'text/plain' && defined $default_text_plain_charset;
        return "$type; charset=$default_text_plain_charset";
}
3456
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
#   $highlight - true if highlighting is enabled
#   $mimetype  - accepted but not used here
#   $file_name - name of the file; a trailing '.in' is ignored
# The basename is looked up in %highlight_basename first, then its
# extension (text after the last '.') in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # Capture the extension from the match itself: reading $1 after an
        # unchecked match would, for a basename without a '.', pick up a
        # stale capture left by the caller's last successful match.
        my ($ext) = $basename =~ /\.([^.]*)$/;
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3473
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# When highlighting applies, $fd is closed and reopened as a shell
# pipeline: "git cat-file blob <global $hash>" piped into the global
# $highlight_bin with the given $syntax.  Calls die_error(500, ...) if
# the pipeline cannot be started.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        if (!$highlight || !defined $syntax) {
                return $fd;
        }

        close $fd;
        my $blob_cmd = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $highlight_cmd = quote_command($highlight_bin) .
                " --replace-tabs=8 --fragment --syntax $syntax";
        open $fd, "$blob_cmd | $highlight_cmd |"
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3487
3488## ======================================================================
3489## functions printing HTML: header, footer, error page
3490
# Compose the page title from the globals $site_name, $project, $action
# and $file_name: "<site>[ - <project>[/<action>[ - <file>[/]]]]".
# Each later part is added only when all earlier ones are defined; for
# the "tree" action a trailing '/' is appended to the file name unless
# it already ends in one.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        }

        return $title;
}
3508
# Print the <link rel="alternate"> elements for the page head.
# With a project selected: for each of RSS and Atom, one link to the
# feed and one to its "--no-merges" variant, based on get_feed_info().
# Without a project: links to the plain-text project index and the OPML
# list of project feeds.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # Work on a per-format copy of the parameters: setting
                        # 'extra_options' on the shared hash made the "plain"
                        # link of the second format a --no-merges link as well.
                        my %feed_params = (%href_params, 'action' => $type);

                        $link_attr{'-href'} = href(%feed_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        $feed_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%feed_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3553
# Print the HTTP header (unless suppressed) and the top of the HTML page:
# document head, optional site header file, breadcrumb line and, when a
# project is selected and the 'search' feature is on, the search form.
#   $status  - HTTP status line (false => "200 OK")
#   $expires - value for the Expires header
#   %opts    - '-no_http_header' suppresses the HTTP header;
#              '-action_extra' is appended to the breadcrumb line and
#              turns the action name into a link
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();

        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');
        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;
        my $content_type = $wants_xhtml ? 'application/xhtml+xml' : 'text/html';

        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        print <<HTML_HEAD;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
HTML_HEAD

        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        print '<base href="' . esc_url($base_url) . '" />' . "\n"
                if $ENV{'PATH_INFO'};

        # print out each stylesheet that exist, providing backwards capability
        # for those people who defined $stylesheet in a config file
        my @css_urls = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $css_url (@css_urls) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($css_url).'"/>'."\n";
        }

        # feed links are only advertised on successful pages
        if ($status eq '200 OK') {
                print_feed_meta();
        }
        if (defined $favicon) {
                print '<link rel="shortcut icon" href="' . esc_url($favicon) .
                      '" type="image/png" />' . "\n";
        }

        print "</head>\n<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        # breadcrumb line: logo, home link, project, action, extra
        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $cgi->img({-src => esc_url($logo),
                                         -width => 72, -height => 27,
                                         -alt => "git",
                                         -class => "logo"}));
        }
        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                my $have_extra = defined $opts{-action_extra};

                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        # the action becomes a link only when something follows it
                        my $action_print = $have_extra
                                ? $cgi->a({-href => href(action=>$action)}, $action)
                                : $action;
                        print " / $action_print";
                }
                print " / $opts{-action_extra}" if $have_extra;
                print "\n";
        }
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                $searchtext = "" unless defined $searchtext;

                # search from the most specific revision known for this page
                my $search_hash =
                        defined $hash_base ? $hash_base :
                        defined $hash      ? $hash :
                                             "HEAD";

                my $form_action = $my_uri;
                my $use_pathinfo = gitweb_check_feature('pathinfo');
                $form_action .= "/".esc_url($project) if $use_pathinfo;

                # with path_info the project is part of the form's action URL,
                # otherwise it travels as the hidden "p" field
                print $cgi->startform(-method => "get", -action => $form_action) .
                      "<div class=\"search\">\n" .
                      (!$use_pathinfo &&
                      $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
                      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
                      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
                      $cgi->popup_menu(-name => 'st', -default => 'commit',
                                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
                      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
                      " search:\n",
                      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
                      "<span title=\"Extended regular expression\">" .
                      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                     -checked => $search_use_regexp) .
                      "</span>" .
                      "</div>" .
                      $cgi->end_form() . "\n";
        }
}
3680
# Print the bottom of the HTML page: the footer div (project description
# and feed links, or OPML/TXT links when no project is selected),
# optional timing information, the optional site footer file, the
# JavaScript includes, and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # no feed info for this page: mark the links as generic
                $feed_class .= ' generic' unless %href_params;
                $href_params{'-title'} ||= 'log';

                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took <span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span> and <span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands  to generate.'."\n";
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print '<script type="text/javascript" src="' . esc_url($javascript) . '"></script>' . "\n";
        if (defined $action && $action eq 'blame_incremental') {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } elsif (gitweb_check_feature('javascript-actions')) {
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = fixLinks;\n!.
                      qq!</script>\n!;
        }

        print "</body>\n</html>";
}
3746
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# Prints a complete error page (header, "<status> - <message>", optional
# extra HTML, footer) and then jumps to DONE_GITWEB, unless the
# '-error_handler' option is set.  The message is HTML-escaped; the
# detailed description is printed as given.  Remaining arguments are
# options, which are also passed on to git_header_html().
# A status code outside the list above is sent with the 500 status line.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # An unlisted code used to pass undef here, which git_header_html()
        # replaces with "200 OK" -- an error page served as a success.
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
3790
3791## ----------------------------------------------------------------------
3792## functions printing or outputting HTML: navigation
3793
# Print the navigation bar (<div class="page_nav">) of a project page.
#   $current  - name of the view being shown; printed as text, not as a link
#   $suppress - view to leave out of the bar (optional)
#   $head     - hash for the 'commit' and 'commitdiff' links, and also for
#               'shortlog' and 'log' when $current is one of tree, log,
#               shortlog, commit, commitdiff or search (optional)
#   $treehead - 'hash' parameter of the 'tree' link (optional)
#   $treebase - 'hash_base' parameter of the 'tree' link (optional)
#   $extra    - HTML printed on the second line of the bar (pager or formats)
# The 'actions' feature supplies (label, link, position) triplets: each label
# is added right after the view named by its position and points to its
# link, in which %n, %f, %h, %b and %% are expanded.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters of every view shown in the bar
        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;
        if (defined $head) {
                $arg{$_}{'hash'} = $head foreach qw(commit commitdiff);
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        $arg{$_}{'hash'} = $head foreach qw(shortlog log);
                }
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        my @actions = gitweb_get_feature('actions');
        my %expansion_for = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # put the custom label right behind the view it follows
                my @extended;
                foreach my $nav (@navs) {
                        push @extended, $nav;
                        push @extended, $label if $nav eq $pos;
                }
                @navs = @extended;

                # expand the %-placeholders of the link
                $link =~ s/%([%nfhb])/$expansion_for{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @entries, $nav;
                        next;
                }
                push @entries,
                        $cgi->a({-href => ($arg{$nav}{_href} || href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
3843
# Returns the submenu for navigating between the refs views: "tags",
# "heads" and, only if the 'remote_heads' feature is enabled, "remotes".
# The entries are joined with " | "; the one equal to $current is plain
# text, every other one is a link to the action of the same name.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        push @ref_views, 'remotes' if gitweb_check_feature('remote_heads');

        my @entries;
        foreach my $view (@ref_views) {
                push @entries, ($view eq $current)
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view);
        }
        return join " | ", @entries;
}
3856
# Return the "first &sdot; prev &sdot; next" pager of a paginated view.
#   $action        - accepted but not used by this function
#   $page          - number of the page being shown
#   $has_next_link - true if there is a following page
# "first" and "prev" are links only when $page > 0, "next" only when
# $has_next_link is true.  The links replay the current request with a
# different 'page' parameter; "prev" and "next" get the access keys p and n.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        # plain-text entries, replaced by links where a target page exists
        my ($first, $prev, $next) = ("first", "prev", "next");

        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                  -accesskey => "p", -title => "Alt-p"}, "prev");
        }
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
3882
3883## ......................................................................
3884## functions printing or outputting HTML: div
3885
# Print a <div class="header"> that holds one link of class "title".
#   $action    - action the link points to; also the link text when no
#                title is given
#   $title     - link text (a false value falls back to $action)
#   $hash      - 'hash' parameter of the link, used only when true
#   $hash_base - 'hash_base' parameter of the link, used only when true
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (action => $action);
        $args{'hash'} = $hash if $hash;
        $args{'hash_base'} = $hash_base if $hash_base;

        my $text = $title || $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $text) .
              "\n</div>\n";
}
3899
# Return one table row of class "metadata_url": $name fills the first cell
# and $url the second.  Both values are inserted as given, without escaping.
sub format_repo_url {
        my ($name, $url) = @_;
        return join('',
                '<tr class="metadata_url">',
                "<td>$name</td>",
                "<td>$url</td>",
                "</tr>\n");
}
3904
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content, which comes next, can be:
#  - a scalar, which is output as-is;
#  - a scalar reference, which is output after html escaping;
#  - a filehandle, passed as *handle, \*handle, *handle{IO}, a lexical
#    filehandle or a filehandle object; everything that can still be read
#    from it is output;
#  - a function reference; in this case all following parameters will be
#    taken as arguments to the content function call.
# Any other content (undef, array or hash reference) outputs nothing between
# the header and the end of the DIV.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        # Recognize filehandles by their underlying type rather than by class
        # name: *handle{IO} is blessed into IO::File on perl >= 5.12 (and into
        # IO::Handle or FileHandle before that), filehandle objects are
        # blessed glob references, and a bare *handle is a glob that is not a
        # reference at all.
        require Scalar::Util;
        my $reftype = Scalar::Util::reftype($content) || '';
        my $is_handle = $reftype eq 'GLOB'
                     || $reftype eq 'IO'
                     || ref(\$content) eq 'GLOB';

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
3942
# Print the local-time annotation built by format_local_time(); takes the
# same %date key/value list and passes it on unchanged.
sub print_local_time {
        my $annotation = format_local_time(@_);
        print $annotation;
}
3946
# Return " (HH:MM TZ)" built from the 'hour_local', 'minute_local' and
# 'tz_local' entries of the %date key/value list passed in.  When the local
# hour is below 6 the HH:MM part is wrapped in <span class="atnight">.
sub format_local_time {
        my %date = @_;

        my $clock = ($date{'hour_local'} < 6)
                ? "<span class=\"atnight\">%02d:%02d</span>"
                : "%02d:%02d";

        return sprintf(" ($clock %s)",
                $date{'hour_local'}, $date{'minute_local'}, $date{'tz_local'});
}
3960
# Outputs the author name and date in long form: the author name as an
# author-search link, the RFC 2822 date in square brackets and the avatar
# for the author's email, all inside one element of class "author_date".
#   $co   - parsed commit (hash reference); its author_name, author_epoch,
#           author_tz and author_email entries are used
#   %opts - -tag       => name of the wrapping element (default: 'div')
#           -localtime => if true, the local time is added after the date
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};
        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $author_link = format_search_author($author, "author", esc_html($author));
        print "<$tag class=\"author_date\">" . $author_link . " [$ad{'rfc2822'}";

        print format_local_time(%ad) if $opts{-localtime};

        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);
        print "]" . $avatar . "</$tag>\n";
}
3976
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
#   $co     - parsed commit (hash reference)
#   @people - who to print rows for ('author', 'committer'); an empty list
#             means both, in that order
# Each person takes two rows: the first one holds the role, the name and the
# "<email>" (both as search links) and the double-size avatar, which spans
# both rows; the second one holds the RFC 2822 date followed by the local
# time.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = qw(author committer) unless @people;

        foreach my $who (@people) {
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link  = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                         esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');

                print "<tr><td>$who</td><td>" . $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" . $avatar . "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td> $wd{'rfc2822'}";
                print format_local_time(%wd);
                print "</td>" .
                      "</tr>\n";
        }
}
4004
# Print the <div class="page_path"> breadcrumb of a path inside a tree: a
# "[project]" link to the tree root, one 'tree' link for every leading
# directory of $name, and finally the last path component.
#   $name - path relative to the top tree (optional; without it only the
#           root link is printed)
#   $type - 'blob' links the last component to the 'blob_plain' view,
#           'tree' links it to the 'tree' view and appends " / ";
#           with any other value it is printed as plain text
#   $hb   - hash_base used for all the links
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # check the length, not the truth, of the path built so
                        # far: a leading directory named "0" is a false value
                        # but still has to be followed by a separator
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # the last component links to the path that was passed in, the
                # same one its title and text are taken from
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4042
# Print a commit message as HTML, every printed line followed by "<br/>".
#   $log  - reference to the array of message lines; NOTE: the title (if
#           requested) and leading empty lines are removed from this very
#           array, so the caller's data is modified
#   %opts - -remove_title     => drop the first line of the message
#           -remove_signoff   => do not print signoff-like lines
#           -final_empty_line => end the output with an empty line, unless
#                                the last printed line already was empty
# Signoff-like lines (Signed-off-by, Acked-by, Cc) are printed inside
# <span class="signoff">.  Consecutive empty lines are printed as a single
# empty line, and empty lines directly after a signoff-like line are not
# printed at all.
sub git_print_log {
        my ($log, %opts) = @_;

        # remove title, i.e. first line of log
        shift @$log if $opts{'-remove_title'};

        # remove leading empty lines
        shift @$log while (defined $log->[0] && $log->[0] eq "");

        # print log
        my $signoff = 0; # last non-empty line was a signoff-like line
        my $empty = 0;   # last printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n"
                                unless $opts{'-remove_signoff'};
                        next;
                }

                if ($line eq "") {
                        # print only one empty line
                        # do not print empty line after signoff
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        # only ordinary text ends the "after signoff" state, so
                        # that the empty-line check above can still see it
                        $empty = 0;
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4091
# return link target (what link points to)
# The target is the complete output of "git cat-file blob" for $hash.
# Returns nothing (undef in scalar context) if the command cannot be
# started, or if closing the pipe to it reports a failure.
sub git_get_link_target {
        my ($hash) = @_;

        my $fd;
        unless (open $fd, "-|", git_cmd(), "cat-file", "blob", $hash) {
                return;
        }

        # read link: slurp everything the command prints
        my $link_target = do { local $/; <$fd> };

        unless (close $fd) {
                return;
        }
        return $link_target;
}
4109
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#   $link_target - content of the symbolic link
#   $basedir     - directory holding the link, relative to the top tree;
#                  undef or '' for the top tree itself
# Empty and '.' components are dropped, and every '..' removes the component
# before it; a '..' with nothing left to remove means that the link leads
# outside the top tree.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # test for the empty string, so that a directory named "0" counts
        my $path = (defined($basedir) && length($basedir))
                ? $basedir . '/' . $link_target
                : $link_target;

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' (but keep a component named "0")
                next if ($part eq '' || $part eq '.');

                if ($part eq '..') {
                        # link leads outside repository (outside top dir)
                        return unless @path_parts;
                        pop @path_parts;
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
4149
# print tree entry (row of git_tree), but without encompassing <tr> element
#   $t          - parsed tree entry (hash reference); its 'mode', 'type',
#                 'hash', 'name' and, if present, 'size' entries are used
#   $basedir    - prefix put, as it is, in front of the entry name to build
#                 the file_name parameter of the links
#   $hash_base  - hash_base of the links (optional); "history" links are
#                 printed only when it is defined
#   $have_blame - if true, blobs get a "blame" link
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = ();
        $base_key{'hash_base'} = $hash_base if defined $hash_base;

        # path of the entry, as used for the file_name parameter of the links
        my $path = "$basedir$t->{'name'}";

        # The format of a table row is: mode list link.  Where mode is
        # the mode of the entry, list is the name of the entry, an href,
        # and link is the action links of the entry.

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        if (exists $t->{'size'}) {
                print "<td class=\"size\">$t->{'size'}</td>\n";
        }
        if ($t->{'type'} eq "blob") {
                print "<td class=\"list\">" .
                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                               file_name=>$path, %base_key),
                                -class => "list"}, esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        my $link_target = git_get_link_target($t->{'hash'});
                        # test the length, not the truth: "0" is a valid target
                        if (defined($link_target) && length($link_target)) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                if (defined $norm_target) {
                                        print " -> " .
                                              $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                     file_name=>$norm_target),
                                                       -title => $norm_target}, esc_path($link_target));
                                } else {
                                        # target cannot be expressed as a path
                                        # inside the tree: show it without a link
                                        print " -> " . esc_path($link_target);
                                }
                        }
                }
                print "</td>\n";
                print "<td class=\"link\">";
                print $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                             file_name=>$path, %base_key)},
                              "blob");
                if ($have_blame) {
                        print " | " .
                              $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                     file_name=>$path, %base_key)},
                                      "blame");
                }
                if (defined $hash_base) {
                        print " | " .
                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                     hash=>$t->{'hash'}, file_name=>$path)},
                                      "history");
                }
                print " | " .
                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                               file_name=>$path)},
                                "raw");
                print "</td>\n";

        } elsif ($t->{'type'} eq "tree") {
                print "<td class=\"list\">";
                print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                             file_name=>$path,
                                             %base_key)},
                              esc_path($t->{'name'}));
                print "</td>\n";
                print "<td class=\"link\">";
                print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                             file_name=>$path,
                                             %base_key)},
                              "tree");
                if (defined $hash_base) {
                        print " | " .
                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                     file_name=>$path)},
                                      "history");
                }
                print "</td>\n";
        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";
                print "<td class=\"link\">";
                if (defined $hash_base) {
                        print $cgi->a({-href => href(action=>"history",
                                                     hash_base=>$hash_base,
                                                     file_name=>$path)},
                                      "history");
                }
                print "</td>\n";
        }
}
4242
4243## ......................................................................
4244## functions printing large fragments of HTML
4245
# get pre-image filenames for merge (combined) diff
#   $diff    - parsed combined diff line (hash reference) with 'nparents'
#              and the per-parent arrays 'status' and 'from_id'
#   @parents - the parents, in the same order as those arrays
# Stores an array with 'nparents' entries in $diff->{'from_file'}: for a
# parent with status 'R' or 'C' the entry is what git_get_path_by_hash()
# returns for that parent and its 'from_id'; all other entries stay
# undefined.  Returns $diff.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $from_file = $diff->{'from_file'} = [ ];
        # give the array its full length right away
        $from_file->[$diff->{'nparents'} - 1] = undef;

        foreach my $i (0 .. $diff->{'nparents'} - 1) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4262
# is current raw difftree line of file deletion
# $diffinfo - hashref of parsed raw diff format; the line counts as a
#             deletion when its 'to_id' consists of forty "0" characters
sub is_deleted {
        my ($diffinfo) = @_;

        my $null_id = '0' x 40;
        return $diffinfo->{'to_id'} eq $null_id;
}
4269
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# True only if both are defined and their 'to_file' entries are equal.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_given = defined $diffinfo && defined $patchinfo;
        return $both_given
                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4280
4281
4282sub git_difftree_body {
4283        my ($difftree, $hash, @parents) = @_;
4284        my ($parent) = $parents[0];
4285        my $have_blame = gitweb_check_feature('blame');
4286        print "<div class=\"list_head\">\n";
4287        if ($#{$difftree} > 10) {
4288                print(($#{$difftree} + 1) . " files changed:\n");
4289        }
4290        print "</div>\n";
4291
4292        print "<table class=\"" .
4293              (@parents > 1 ? "combined " : "") .
4294              "diff_tree\">\n";
4295
4296        # header only for combined diff in 'commitdiff' view
4297        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
4298        if ($has_header) {
4299                # table header
4300                print "<thead><tr>\n" .
4301                       "<th></th><th></th>\n"; # filename, patchN link
4302                for (my $i = 0; $i < @parents; $i++) {
4303                        my $par = $parents[$i];
4304                        print "<th>" .
4305                              $cgi->a({-href => href(action=>"commitdiff",
4306                                                     hash=>$hash, hash_parent=>$par),
4307                                       -title => 'commitdiff to parent number ' .
4308                                                  ($i+1) . ': ' . substr($par,0,7)},
4309                                      $i+1) .
4310                              "&nbsp;</th>\n";
4311                }
4312                print "</tr></thead>\n<tbody>\n";
4313        }
4314
4315        my $alternate = 1;
4316        my $patchno = 0;
4317        foreach my $line (@{$difftree}) {
4318                my $diff = parsed_difftree_line($line);
4319
4320                if ($alternate) {
4321                        print "<tr class=\"dark\">\n";
4322                } else {
4323                        print "<tr class=\"light\">\n";
4324                }
4325                $alternate ^= 1;
4326
4327                if (exists $diff->{'nparents'}) { # combined diff
4328
4329                        fill_from_file_info($diff, @parents)
4330                                unless exists $diff->{'from_file'};
4331
4332                        if (!is_deleted($diff)) {
4333                                # file exists in the result (child) commit
4334                                print "<td>" .
4335                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4336                                                             file_name=>$diff->{'to_file'},
4337                                                             hash_base=>$hash),
4338                                              -class => "list"}, esc_path($diff->{'to_file'})) .
4339                                      "</td>\n";
4340                        } else {
4341                                print "<td>" .
4342                                      esc_path($diff->{'to_file'}) .
4343                                      "</td>\n";
4344                        }
4345
4346                        if ($action eq 'commitdiff') {
4347                                # link to patch
4348                                $patchno++;
4349                                print "<td class=\"link\">" .
4350                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
4351                                              "patch") .
4352                                      " | " .
4353                                      "</td>\n";
4354                        }
4355
4356                        my $has_history = 0;
4357                        my $not_deleted = 0;
4358                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
4359                                my $hash_parent = $parents[$i];
4360                                my $from_hash = $diff->{'from_id'}[$i];
4361                                my $from_path = $diff->{'from_file'}[$i];
4362                                my $status = $diff->{'status'}[$i];
4363
4364                                $has_history ||= ($status ne 'A');
4365                                $not_deleted ||= ($status ne 'D');
4366
4367                                if ($status eq 'A') {
4368                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
4369                                } elsif ($status eq 'D') {
4370                                        print "<td class=\"link\">" .
4371                                              $cgi->a({-href => href(action=>"blob",
4372                                                                     hash_base=>$hash,
4373                                                                     hash=>$from_hash,
4374                                                                     file_name=>$from_path)},
4375                                                      "blob" . ($i+1)) .
4376                                              " | </td>\n";
4377                                } else {
4378                                        if ($diff->{'to_id'} eq $from_hash) {
4379                                                print "<td class=\"link nochange\">";
4380                                        } else {
4381                                                print "<td class=\"link\">";
4382                                        }
4383                                        print $cgi->a({-href => href(action=>"blobdiff",
4384                                                                     hash=>$diff->{'to_id'},
4385                                                                     hash_parent=>$from_hash,
4386                                                                     hash_base=>$hash,
4387                                                                     hash_parent_base=>$hash_parent,
4388                                                                     file_name=>$diff->{'to_file'},
4389                                                                     file_parent=>$from_path)},
4390                                                      "diff" . ($i+1)) .
4391                                              " | </td>\n";
4392                                }
4393                        }
4394
4395                        print "<td class=\"link\">";
4396                        if ($not_deleted) {
4397                                print $cgi->a({-href => href(action=>"blob",
4398                                                             hash=>$diff->{'to_id'},
4399                                                             file_name=>$diff->{'to_file'},
4400                                                             hash_base=>$hash)},
4401                                              "blob");
4402                                print " | " if ($has_history);
4403                        }
4404                        if ($has_history) {
4405                                print $cgi->a({-href => href(action=>"history",
4406                                                             file_name=>$diff->{'to_file'},
4407                                                             hash_base=>$hash)},
4408                                              "history");
4409                        }
4410                        print "</td>\n";
4411
4412                        print "</tr>\n";
4413                        next; # instead of 'else' clause, to avoid extra indent
4414                }
4415                # else ordinary diff
4416
4417                my ($to_mode_oct, $to_mode_str, $to_file_type);
4418                my ($from_mode_oct, $from_mode_str, $from_file_type);
4419                if ($diff->{'to_mode'} ne ('0' x 6)) {
4420                        $to_mode_oct = oct $diff->{'to_mode'};
4421                        if (S_ISREG($to_mode_oct)) { # only for regular file
4422                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
4423                        }
4424                        $to_file_type = file_type($diff->{'to_mode'});
4425                }
4426                if ($diff->{'from_mode'} ne ('0' x 6)) {
4427                        $from_mode_oct = oct $diff->{'from_mode'};
4428                        if (S_ISREG($from_mode_oct)) { # only for regular file
4429                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
4430                        }
4431                        $from_file_type = file_type($diff->{'from_mode'});
4432                }
4433
4434                if ($diff->{'status'} eq "A") { # created
4435                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
4436                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
4437                        $mode_chng   .= "]</span>";
4438                        print "<td>";
4439                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4440                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
4441                                      -class => "list"}, esc_path($diff->{'file'}));
4442                        print "</td>\n";
4443                        print "<td>$mode_chng</td>\n";
4444                        print "<td class=\"link\">";
4445                        if ($action eq 'commitdiff') {
4446                                # link to patch
4447                                $patchno++;
4448                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4449                                              "patch") .
4450                                      " | ";
4451                        }
4452                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4453                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
4454                                      "blob");
4455                        print "</td>\n";
4456
4457                } elsif ($diff->{'status'} eq "D") { # deleted
4458                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
4459                        print "<td>";
4460                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4461                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
4462                                       -class => "list"}, esc_path($diff->{'file'}));
4463                        print "</td>\n";
4464                        print "<td>$mode_chng</td>\n";
4465                        print "<td class=\"link\">";
4466                        if ($action eq 'commitdiff') {
4467                                # link to patch
4468                                $patchno++;
4469                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4470                                              "patch") .
4471                                      " | ";
4472                        }
4473                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4474                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
4475                                      "blob") . " | ";
4476                        if ($have_blame) {
4477                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
4478                                                             file_name=>$diff->{'file'})},
4479                                              "blame") . " | ";
4480                        }
4481                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
4482                                                     file_name=>$diff->{'file'})},
4483                                      "history");
4484                        print "</td>\n";
4485
4486                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
4487                        my $mode_chnge = "";
4488                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4489                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
4490                                if ($from_file_type ne $to_file_type) {
4491                                        $mode_chnge .= " from $from_file_type to $to_file_type";
4492                                }
4493                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
4494                                        if ($from_mode_str && $to_mode_str) {
4495                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
4496                                        } elsif ($to_mode_str) {
4497                                                $mode_chnge .= " mode: $to_mode_str";
4498                                        }
4499                                }
4500                                $mode_chnge .= "]</span>\n";
4501                        }
4502                        print "<td>";
4503                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4504                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
4505                                      -class => "list"}, esc_path($diff->{'file'}));
4506                        print "</td>\n";
4507                        print "<td>$mode_chnge</td>\n";
4508                        print "<td class=\"link\">";
4509                        if ($action eq 'commitdiff') {
4510                                # link to patch
4511                                $patchno++;
4512                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4513                                              "patch") .
4514                                      " | ";
4515                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4516                                # "commit" view and modified file (not onlu mode changed)
4517                                print $cgi->a({-href => href(action=>"blobdiff",
4518                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4519                                                             hash_base=>$hash, hash_parent_base=>$parent,
4520                                                             file_name=>$diff->{'file'})},
4521                                              "diff") .
4522                                      " | ";
4523                        }
4524                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4525                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
4526                                       "blob") . " | ";
4527                        if ($have_blame) {
4528                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4529                                                             file_name=>$diff->{'file'})},
4530                                              "blame") . " | ";
4531                        }
4532                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4533                                                     file_name=>$diff->{'file'})},
4534                                      "history");
4535                        print "</td>\n";
4536
4537                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
4538                        my %status_name = ('R' => 'moved', 'C' => 'copied');
4539                        my $nstatus = $status_name{$diff->{'status'}};
4540                        my $mode_chng = "";
4541                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4542                                # mode also for directories, so we cannot use $to_mode_str
4543                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
4544                        }
4545                        print "<td>" .
4546                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
4547                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
4548                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
4549                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
4550                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
4551                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
4552                                      -class => "list"}, esc_path($diff->{'from_file'})) .
4553                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
4554                              "<td class=\"link\">";
4555                        if ($action eq 'commitdiff') {
4556                                # link to patch
4557                                $patchno++;
4558                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4559                                              "patch") .
4560                                      " | ";
4561                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4562                                # "commit" view and modified file (not only pure rename or copy)
4563                                print $cgi->a({-href => href(action=>"blobdiff",
4564                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4565                                                             hash_base=>$hash, hash_parent_base=>$parent,
4566                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
4567                                              "diff") .
4568                                      " | ";
4569                        }
4570                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4571                                                     hash_base=>$parent, file_name=>$diff->{'to_file'})},
4572                                      "blob") . " | ";
4573                        if ($have_blame) {
4574                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4575                                                             file_name=>$diff->{'to_file'})},
4576                                              "blame") . " | ";
4577                        }
4578                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4579                                                    file_name=>$diff->{'to_file'})},
4580                                      "history");
4581                        print "</td>\n";
4582
4583                } # we should not encounter Unmerged (U) or Unknown (X) status
4584                print "</tr>\n";
4585        }
4586        print "</tbody>" if $has_header;
4587        print "</table>\n";
4588}
4589
# Print the patches read from $fd as the HTML "patchset" section.
#
# Parameters:
#   $fd           - filehandle yielding patch text; lines starting with
#                   "diff " mark the start of each patch
#   $difftree     - array ref of raw difftree lines; the entry at index N
#                   is rendered under the anchor id "patch<N+1>"
#   $hash         - accepted for the callers' sake, not used in this body
#   @hash_parents - parent ids; more than one enables combined diff handling
#
# Output goes to the currently selected filehandle via print.
sub git_patchset_body {
	my ($fd, $difftree, $hash, @hash_parents) = @_;

	my $is_combined = (@hash_parents > 1);
	my $patch_idx = 0;      # index into @$difftree of the current raw line
	my $patch_number = 0;   # count of patches (incl. simplified ones) emitted
	my $patch_line;
	my $diffinfo;
	my $to_name;
	my (%from, %to);

	print "<div class=\"patchset\">\n";

	# skip to first patch
	while ($patch_line = <$fd>) {
		chomp $patch_line;

		last if ($patch_line =~ m/^diff /);
	}

	# At the top of each iteration $patch_line is either a chomp-ed
	# "diff ..." header line, or undef when the input is exhausted.
 PATCH:
	while (defined $patch_line) {

		# parse "git diff" header line
		if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
			# $1 is from_name, which we do not use
			$to_name = unquote($2);
			$to_name =~ s!^b/!!;
		} elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
			# $1 is 'cc' or 'combined', which we do not use
			$to_name = unquote($2);
		} else {
			$to_name = undef;
		}

		# check if current patch belong to current raw line
		# and parse raw git-diff line if needed
		if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
			# this is continuation of a split patch
			print "<div class=\"patch cont\">\n";
		} else {
			# advance raw git-diff output if needed
			$patch_idx++ if defined $diffinfo;

			# read and prepare patch information
			$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

			# compact combined diff output can have some patches skipped
			# find which patch (using pathname of result) we are at now;
			if ($is_combined) {
				while ($to_name ne $diffinfo->{'to_file'}) {
					print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
					      format_diff_cc_simplified($diffinfo, @hash_parents) .
					      "</div>\n";  # class="patch"

					$patch_idx++;
					$patch_number++;

					last if $patch_idx > $#$difftree;
					$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
				}
			}

			# modifies %from, %to hashes
			parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

			# this is first patch for raw difftree line with $patch_idx index
			# we index @$difftree array from 0, but number patches from 1
			print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
		}

		# git diff header
		#assert($patch_line =~ m/^diff /) if DEBUG;
		#assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
		$patch_number++;
		# print "git diff" header
		print format_git_diff_header_line($patch_line, $diffinfo,
		                                  \%from, \%to);

		# print extended diff header
		print "<div class=\"diff extended_header\">\n";
	EXTENDED_HEADER:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

			print format_extended_diff_header_line($patch_line, $diffinfo,
			                                       \%from, \%to);
		}
		print "</div>\n"; # class="diff extended_header"

		# from-file/to-file diff header
		if (!defined $patch_line) {
			# input ended inside the extended header; "last" skips the
			# continue block, so close the patch div here
			print "</div>\n"; # class="patch"
			last PATCH;
		}
		next PATCH if ($patch_line =~ m/^diff /);
		#assert($patch_line =~ m/^---/) if DEBUG;

		my $last_patch_line = $patch_line;
		$patch_line = <$fd>;
		if (!defined $patch_line) {
			# input ended right after the "--- " line: there is no "+++"
			# line to format, so do not chomp/pass undef; just close the
			# patch div (the continue block is skipped by "last")
			print "</div>\n"; # class="patch"
			last PATCH;
		}
		chomp $patch_line;
		#assert($patch_line =~ m/^\+\+\+/) if DEBUG;

		print format_diff_from_to_header($last_patch_line, $patch_line,
		                                 $diffinfo, \%from, \%to,
		                                 @hash_parents);

		# the patch itself
	LINE:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			next PATCH if ($patch_line =~ m/^diff /);

			print format_diff_line($patch_line, \%from, \%to);
		}

	} continue {
		# runs on "next PATCH" and on falling off the end of the body,
		# but not on "last PATCH"
		print "</div>\n"; # class="patch"
	}

	# for compact combined (--cc) format, with chunk and patch simplification
	# the patchset might be empty, but there might be unprocessed raw lines
	for (++$patch_idx if $patch_number > 0;
	     $patch_idx < @$difftree;
	     ++$patch_idx) {
		# read and prepare patch information
		$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

		# generate anchor for "patch" links in difftree / whatchanged part
		print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
		      format_diff_cc_simplified($diffinfo, @hash_parents) .
		      "</div>\n";  # class="patch"

		$patch_number++;
	}

	if ($patch_number == 0) {
		if (@hash_parents > 1) {
			print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
		} else {
			print "<div class=\"diff nodifferences\">No differences found</div>\n";
		}
	}

	print "</div>\n"; # class="patchset"
}
4740
4741# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4742
# Fills project list info (age, description, owner, forks, ctags) for each
# project in the list, and returns the list of projects for which
# git_get_last_activity() returned something; the others are left out of
# the returned list.
#
# Parameters:
#   $projlist    - array ref of project hashes, each with at least 'path'
#   $check_forks - when true, the 'forks' field is filled in as well
#
# NOTE: modifies the hashes in $projlist in place, but does not remove
# entries from $projlist itself.
sub fill_project_list_info {
	my ($projlist, $check_forks) = @_;
	my @projects;

	my $show_ctags = gitweb_check_feature('ctags');
 PROJECT:
	foreach my $pr (@$projlist) {
		my (@activity) = git_get_last_activity($pr->{'path'});
		unless (@activity) {
			next PROJECT;
		}
		($pr->{'age'}, $pr->{'age_string'}) = @activity;
		if (!defined $pr->{'descr'}) {
			my $descr = git_get_project_description($pr->{'path'}) || "";
			$descr = to_utf8($descr);
			$pr->{'descr_long'} = $descr;
			$pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
		} elsif (!defined $pr->{'descr_long'}) {
			# description was supplied by the caller: make sure the long
			# form, which the project list sorts and searches on, is set
			$pr->{'descr_long'} = $pr->{'descr'};
		}
		if (!defined $pr->{'owner'}) {
			$pr->{'owner'} = git_get_project_owner($pr->{'path'}) || "";
		}
		if ($check_forks) {
			# "foo.git" is marked as having forks when a directory "foo"
			# exists next to it under $projectroot
			my $pname = $pr->{'path'};
			if (($pname =~ s/\.git$//) &&
			    ($pname !~ /\/$/) &&
			    (-d "$projectroot/$pname")) {
				$pr->{'forks'} = "-d $projectroot/$pname";
			} else {
				$pr->{'forks'} = 0;
			}
		}
		$show_ctags and $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
		push @projects, $pr;
	}

	return @projects;
}
4783
# Output the 'sort by' <th> element built by format_sort_th(); all
# arguments are handed over to it unchanged.
sub print_sort_th {
	my @th_args = @_;
	print format_sort_th(@th_args);
}
4789
# Build a 'sort by' <th> element as a string.
#
#   $name   - sort order this column stands for
#   $order  - sort order currently in effect
#   $header - column caption; defaults to ucfirst($name) when false
#
# When $order is $name the caption is plain text, otherwise it is
# a replay link that selects ordering by $name.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header ||= ucfirst($name);

	# column of the active ordering: no link needed
	return "<th>$header</th>\n" if $order eq $name;

	my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
	                         -class => "header"}, $header);
	return "<th>" . $sort_link . "</th>\n";
}
4806
# Print the HTML table of projects, preceded by the tag cloud when the
# 'ctags' feature is enabled.
#
# Parameters:
#   $projlist  - array ref of project hashes, handed to fill_project_list_info()
#   $order     - sort order name (a key of %order_info below: 'project',
#                'descr', 'owner' or 'age'); $default_projects_order is
#                used when it is false.  With any other value the list is
#                shown in the order fill_project_list_info() returned it.
#   $from, $to - inclusive index range into the sorted list; default is
#                the whole list
#   $extra     - optional HTML put into an additional last row
#   $no_header - when true, the header row with sort links is left out
sub git_project_list_body {
	# actually uses global variable $project
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;

	my $check_forks = gitweb_check_feature('forks');
	my @projects = fill_project_list_info($projlist, $check_forks);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects if (!defined $to || $#projects < $to);

	my %order_info = (
		project => { key => 'path', type => 'str' },
		descr => { key => 'descr_long', type => 'str' },
		owner => { key => 'owner', type => 'str' },
		age => { key => 'age', type => 'num' }
	);
	# sort only for known orders; for an unknown one there is no key to
	# compare on, so leave the list as it is
	my $oi = defined $order ? $order_info{$order} : undef;
	if (defined $oi) {
		my $sort_key = $oi->{'key'};
		if ($oi->{'type'} eq 'str') {
			@projects = sort {$a->{$sort_key} cmp $b->{$sort_key}} @projects;
		} else {
			@projects = sort {$a->{$sort_key} <=> $b->{$sort_key}} @projects;
		}
	}

	my $show_ctags = gitweb_check_feature('ctags');
	if ($show_ctags) {
		# sum up per-tag values over all projects for the tag cloud
		my %ctags;
		foreach my $p (@projects) {
			foreach my $ct (keys %{$p->{'ctags'}}) {
				$ctags{$ct} += $p->{'ctags'}->{$ct};
			}
		}
		my $cloud = git_populate_project_tagcloud(\%ctags);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	unless ($no_header) {
		print "<tr>\n";
		if ($check_forks) {
			print "<th></th>\n";
		}
		print_sort_th('project', $order, 'Project');
		print_sort_th('descr', $order, 'Description');
		print_sort_th('owner', $order, 'Owner');
		print_sort_th('age', $order, 'Last Change');
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}
	my $alternate = 1;
	my $tagfilter = $cgi->param('by_tag');
	for (my $i = $from; $i <= $to; $i++) {
		my $pr = $projects[$i];

		# skip projects not carrying the requested tag (case-insensitive)
		next if $tagfilter and $show_ctags and not grep { lc $_ eq lc $tagfilter } keys %{$pr->{'ctags'}};
		# skip projects matching the search text neither in path
		# nor in long description
		next if $searchtext and not $pr->{'path'} =~ /$searchtext/
			and not $pr->{'descr_long'} =~ /$searchtext/;
		# Weed out forks or non-matching entries of search
		if ($check_forks) {
			my $forkbase = $project; $forkbase ||= ''; $forkbase =~ s#\.git$#/#;
			$forkbase="^$forkbase" if $forkbase;
			next if not $searchtext and not $tagfilter and $show_ctags
				and $pr->{'path'} =~ m#$forkbase.*/.*#; # regexp-safe
		}

		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		if ($check_forks) {
			print "<td>";
			if ($pr->{'forks'}) {
				print "<!-- $pr->{'forks'} -->\n";
				print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "+");
			}
			print "</td>\n";
		}
		print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		                        -class => "list"}, esc_html($pr->{'path'})) . "</td>\n" .
		      "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		                        -class => "list", -title => $pr->{'descr_long'}},
		                        esc_html($pr->{'descr'})) . "</td>\n" .
		      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
		print "<td class=\"". age_class($pr->{'age'}) . "\">" .
		      (defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits") . "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary")}, "summary")   . " | " .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"shortlog")}, "shortlog") . " | " .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"log")}, "log") . " | " .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"tree")}, "tree") .
		      ($pr->{'forks'} ? " | " . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks") : '') .
		      "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n";
		if ($check_forks) {
			print "<td></td>\n";
		}
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4913
# Print the "log" view entries for commits $from..$to of @$commitlist.
#
# Parameters:
#   $commitlist - array ref of parsed commit hashes (empty ones are skipped)
#   $from, $to  - inclusive index range; default is the whole list, and
#                 $to is clamped to the last index
#   $refs       - passed to format_ref_marker() for each commit
#   $extra      - optional HTML printed in a "page_nav" div after the entries
sub git_log_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# start at $from, like the other *_body subroutines do
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		# separate statements, not a continuation of the print above
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
4952
# Print the "shortlog" table: one row per commit with indices $from..$to
# of @$commitlist (whole list by default, $to clamped to the last index),
# followed by an optional row holding $extra.
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	my $last_idx = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_idx if (!defined $to || $last_idx < $to);

	print "<table class=\"shortlog\">\n";
	my $dark_row = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		# rows alternate between "dark" and "light", starting with "dark"
		print "<tr class=\"" . ($dark_row ? "dark" : "light") . "\">\n";
		$dark_row = !$dark_row;

		# date cell (age shown as tooltip), then author cell
		my $date_cell =
			"<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n";
		print $date_cell . format_author_html('td', \%co, 10) . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		# per-commit navigation links
		my $commit_link     = $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
		my $commitdiff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		my $tree_link       = $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
		print "</td>\n<td class=\"link\">" .
		      join(" | ", $commit_link, $commitdiff_link, $tree_link);

		my $snapshot_links = format_snapshot_links($commit);
		print " | " . $snapshot_links if defined $snapshot_links;

		print "</td>\n</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n<td colspan=\"4\">$extra</td>\n</tr>\n";
	}
	print "</table>\n";
}
4996
# Print the "history" table for $file_name: one row per non-empty commit
# with indices $from..$to of @$commitlist, then an optional $extra row.
# For $ftype 'blob' a "diff to current" link is added when the blob at
# that commit differs from $file_hash.
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	my $last_idx = $#{$commitlist};
	$from = 0 unless defined $from;
	if (!defined $to || $to > $last_idx) {
		$to = $last_idx;
	}

	print "<table class=\"history\">\n";
	my $dark_row = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		# empty entries produce no row and do not affect row colouring
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($dark_row ? "dark" : "light") . "\">\n";
		$dark_row = !$dark_row;

		# date cell (age shown as tooltip), then author cell;
		# shortlog uses format_author_html('td', \%co, 10) here
		my $date_cell =
			"<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n";
		print $date_cell . format_author_html('td', \%co, 15, 3) . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $view_link       = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
		my $commitdiff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		print "</td>\n<td class=\"link\">" . $view_link . " | " . $commitdiff_link;

		if ($ftype eq 'blob') {
			my $blob_parent = git_get_hash_by_path($commit, $file_name);
			my $blob_changed = defined $file_hash && defined $blob_parent
			                   && $file_hash ne $blob_parent;
			if ($blob_changed) {
				# $hash_base here is the global variable, not a parameter
				print " | " .
					$cgi->a({-href => href(action=>"blobdiff",
					                       hash=>$file_hash, hash_parent=>$blob_parent,
					                       hash_base=>$hash_base, hash_parent_base=>$commit,
					                       file_name=>$file_name)},
					        "diff to current");
			}
		}
		print "</td>\n</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n<td colspan=\"4\">$extra</td>\n</tr>\n";
	}
	print "</table>\n";
}
5056
# Print the "tags" table: one row per entry with indices $from..$to of
# @$taglist (whole list by default, $to clamped to the last index),
# followed by an optional row holding $extra.
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;

	my $last_idx = $#{$taglist};
	$from = 0 unless defined $from;
	$to = $last_idx if (!defined $to || $last_idx < $to);

	print "<table class=\"tags\">\n";
	my $dark_row = 1;
	foreach my $idx ($from .. $to) {
		my %tag = %{ $taglist->[$idx] };
		my $subject = $tag{'subject'};
		my $subject_short = defined $subject ? chop_str($subject, 30, 5) : undef;
		my $reftype = $tag{'reftype'};

		print "<tr class=\"" . ($dark_row ? "dark" : "light") . "\">\n";
		$dark_row = !$dark_row;

		# age cell stays empty when the age is not known
		my $age_cell = defined $tag{'age'}
			? "<td><i>$tag{'age'}</i></td>\n"
			: "<td></td>\n";
		print $age_cell;

		# name cell, linking to the object the ref points to
		print "<td>" .
		      $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'}),
		               -class => "list name"}, esc_html($tag{'name'})) .
		      "</td>\n<td>";
		if (defined $subject) {
			print format_subject_html($subject, $subject_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}

		# "tag" self link only for entries whose type is "tag"
		print "</td>\n<td class=\"selflink\">";
		if ($tag{'type'} ne "tag") {
			print "&nbsp;";
		} else {
			print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
		}

		print "</td>\n<td class=\"link\"> | " .
		      $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'})}, $reftype);
		if ($reftype eq "commit") {
			my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
			my $log_link      = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
			print " | " . $shortlog_link . " | " . $log_link;
		} elsif ($reftype eq "blob") {
			print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		# note: no newline after the closing </tr> here
		print "</td>\n</tr>";
	}
	if (defined $extra) {
		print "<tr>\n<td colspan=\"5\">$extra</td>\n</tr>\n";
	}
	print "</table>\n";
}
5119
# Print the "heads" table for entries $from..$to of the head list.
#
# Parameters:
#   $headlist - reference to an array of hash references, one per head; the
#               keys read here are 'id', 'age', 'name' and 'fullname'
#   $head     - id of the current HEAD commit; may be undefined (for example
#               when the caller could not resolve HEAD), in which case no row
#               is marked as the current head
#   $from     - index of the first entry to print (0 when undefined)
#   $to       - index of the last entry to print (the last index of the list
#               when undefined or past the end)
#   $extra    - optional HTML fragment printed in a trailing full-width row
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

	print "<table class=\"heads\">\n";
	my $alternate = 1;
	for (my $i = $from; $i <= $to; $i++) {
		my $entry = $headlist->[$i];
		my %ref = %$entry;
		# guard against an undefined $head so that the comparison does not
		# trigger an "uninitialized value" warning
		my $curr = defined $head && $ref{'id'} eq $head;
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td><i>$ref{'age'}</i></td>\n" .
		      ($curr ? "<td class=\"current_head\">" : "<td>") .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
		               -class => "list name"},esc_html($ref{'name'})) .
		      "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
		      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
		      "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5157
# Display a single remote block: a small table with the remote's URL(s),
# followed by the table of its heads.
#
# Parameters:
#   $remote - name of the remote (used for the "..." link)
#   $rdata  - hash reference for the remote; the keys read here are 'heads'
#             (array reference), 'fetch' and 'push' (URLs, either may be
#             undefined)
#   $limit  - optional maximum index passed on to git_heads_body(); when
#             there are more heads than $limit a "..." link to the remote's
#             own page is appended
#   $head   - id of the current HEAD commit, passed on to git_heads_body()
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# $push may be undefined here; only compare when it is set, to
		# avoid an "uninitialized value" warning
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
5191
# Display a list of remote names with the respective fetch and push URLs
#
# Parameters:
#   $remotedata - hash reference mapping remote name to a hash reference
#                 with optional 'fetch' and 'push' URLs
#   $limit      - optional maximum number of remotes to list; when there are
#                 more, the (sorted) list is cut to $limit entries and a
#                 "..." link to the full 'remotes' view is appended
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	$#remotes = $limit - 1 if $limited;

	# iterate with foreach rather than "while (shift)": the latter would
	# stop early on a remote whose name is false in boolean context ("0")
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# "fetch" / "push" are links only when the respective URL is known
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
5235
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
# Parameters:
#   $remotedata - hash reference mapping remote name to per-remote data
#   $limit      - optional limit; when set and smaller than the number of
#                 remotes, only the list of remote names is printed,
#                 otherwise it is passed on to git_remote_block()
#   $head       - id of the current HEAD commit, passed on to
#                 git_remote_block()
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;
	if ($limit and $limit < keys %$remotedata) {
		git_remotes_list($remotedata, $limit);
	} else {
		fill_remote_heads($remotedata);
		# walk the remotes in sorted order so that the page layout is
		# deterministic and matches the ordering of git_remotes_list()
		foreach my $remote (sort keys %$remotedata) {
			my $rdata = $remotedata->{$remote};
			git_print_section({-class=>"remote", -id=>$remote},
				["remotes", $remote, $remote], sub {
					git_remote_block($remote, $rdata, $limit, $head);
				});
		}
	}
}
5252
# Print the "commit_search" table for entries $from..$to of a commit list,
# showing for each commit the comment lines that match the global
# $search_regexp with the matching part highlighted.
#
# Parameters:
#   $commitlist - reference to an array of commit hash references; empty
#                 hashes are skipped
#   $from       - index of the first entry to print (0 when undefined)
#   $to         - index of the last entry to print (the last index of the
#                 list when undefined or past the end)
#   $extra      - optional HTML fragment printed in a trailing row
sub git_search_grep_body {
	my ($commitlist, $from, $to, $extra) = @_;
	my $last_index = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_index if (!defined $to || $last_index < $to);

	print "<table class=\"commit_search\">\n";
	my $dark_row = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;

		my $commit = $co{'id'};
		print "<tr class=\"" . ($dark_row ? "dark" : "light") . "\">\n";
		$dark_row ^= 1;

		# date, author and (linked) title of the commit
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 15, 5) .
		      "<td>" .
		      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
		               -class => "list subject"},
		              chop_and_escape_str($co{'title'}, 50) . "<br/>");

		# every matching comment line, shortened around the match
		my $comment_lines = $co{'comment'};
		foreach my $text (@$comment_lines) {
			next unless $text =~ m/^(.*?)($search_regexp)(.*)$/i;
			my ($before, $hit, $after) = ($1, $2, $3);

			$hit = chop_str($hit, 70, 5, 'center');
			# share what is left of 80 characters between both sides,
			# at most 30 characters each
			my $context_len = int((80 - length($hit))/2);
			$context_len = 30 if ($context_len > 30);
			$before = chop_str($before, $context_len, 10, 'left');
			$after  = chop_str($after,  $context_len, 10, 'right');

			$before = esc_html($before);
			$hit    = esc_html($hit);
			$after  = esc_html($after);

			print "$before<span class=\"match\">$hit</span>$after<br />";
		}

		# links to the other views of this commit
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
		print "</td>\n" .
		      "</tr>\n";
	}

	print "<tr>\n" .
	      "<td colspan=\"3\">$extra</td>\n" .
	      "</tr>\n"
		if defined $extra;
	print "</table>\n";
}
5312
5313## ======================================================================
5314## ======================================================================
5315## actions
5316
# 'project_list' action: print the page listing all projects, preceded by
# the optional $home_text include and a project search form.
#
# Reads the 'order' input parameter; anything other than one of the known
# sort keys is rejected with a 400 error. A 404 error is reported when no
# projects are found.
sub git_project_list {
	my $order = $input_params{'order'};
	# the whole value has to be one of the known keys; an unanchored match
	# would also accept strings that merely contain one (e.g. "page")
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list();
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}
	# start_form() is the supported spelling in CGI.pm (startform() is a
	# deprecated alias) and pairs with the end_form() call below
	print $cgi->start_form(-method => "get") .
	      "<p class=\"projsearch\">Search:\n" .
	      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
	      "</p>" .
	      $cgi->end_form() . "\n";
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5342
# 'forks' action: print the page listing the projects returned by
# git_get_projects_list() for the current $project.
#
# Reads the 'order' input parameter; anything other than one of the known
# sort keys is rejected with a 400 error. A 404 error is reported when the
# list is empty.
sub git_forks {
	my $order = $input_params{'order'};
	# the whole value has to be one of the known keys; an unanchored match
	# would also accept strings that merely contain one (e.g. "page")
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	git_print_header_div('summary', "$project forks");
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5360
# 'project_index' action: print a text/plain list with one
# "<path> <owner>" line per project.
#
# Both fields are percent-encoded, except that letters, digits, '_', '.',
# '-' and '/' are kept as they are and spaces are written as '+'.
sub git_project_index {
	my @projects = git_get_projects_list($project);

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	foreach my $pr (@projects) {
		# look the owner up only when the list entry does not carry one
		$pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
			unless exists $pr->{'owner'};

		my ($path, $owner) = @{$pr}{'path', 'owner'};
		foreach my $field ($path, $owner) {
			# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
			$field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
			$field =~ s/ /\+/g;
		}

		print "$path $owner\n";
	}
}
5384
# 'summary' action: print the summary page of the current $project.
#
# The page consists of a metadata table (description, owner, last change,
# repository URLs and, if the 'ctags' feature is on, content tags), the
# optional README.html, and abbreviated shortlog / tags / heads / remotes /
# forks sections, each followed by a "..." link when there are more entries
# than shown.
sub git_summary {
	my $descr = git_get_project_description($project) || "none";
	my %co = parse_commit("HEAD");
	my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
	# undefined when HEAD could not be parsed into a commit
	my $head = $co{'id'};
	my $remote_heads = gitweb_check_feature('remote_heads');

	my $owner = git_get_project_owner($project);

	my $refs = git_get_references();
	# These get_*_list functions return one more to allow us to see if
	# there are more ...
	my @taglist  = git_get_tags_list(16);
	my @headlist = git_get_heads_list(16);
	my %remotedata = $remote_heads ? git_get_remotes_list() : ();
	my @forklist;
	my $check_forks = gitweb_check_feature('forks');

	if ($check_forks) {
		@forklist = git_get_projects_list($project);
	}

	git_header_html();
	git_print_page_nav('summary','', $head);

	print "<div class=\"title\">&nbsp;</div>\n";
	print "<table class=\"projects_list\">\n" .
	      "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
	      "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
	if (defined $cd{'rfc2822'}) {
		print "<tr id=\"metadata_lchange\"><td>last change</td><td>$cd{'rfc2822'}</td></tr>\n";
	}

	# use per project git URL list in $projectroot/$project/cloneurl
	# or make project git URL from git base URL and project name
	my $url_tag = "URL";
	my @url_list = git_get_project_url_list($project);
	@url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
	foreach my $git_url (@url_list) {
		next unless $git_url;
		print format_repo_url($url_tag, $git_url);
		# only the first URL row is labelled
		$url_tag = "";
	}

	# Tag cloud
	my $show_ctags = gitweb_check_feature('ctags');
	if ($show_ctags) {
		my $ctags = git_get_project_ctags($project);
		my $cloud = git_populate_project_tagcloud($ctags);
		print "<tr id=\"metadata_ctags\"><td>Content tags:<br />";
		print "</td>\n<td>" unless %$ctags;
		# the project name goes into an HTML attribute, so it is escaped
		# like the other values printed on this page
		print "<form action=\"$show_ctags\" method=\"post\">" .
		      "<input type=\"hidden\" name=\"p\" value=\"" . esc_html($project) . "\" />" .
		      "Add: <input type=\"text\" name=\"t\" size=\"8\" /></form>";
		print "</td>\n<td>" if %$ctags;
		print git_show_project_tagcloud($cloud, 48);
		print "</td></tr>";
	}

	print "</table>\n";

	# If XSS prevention is on, we don't include README.html.
	# TODO: Allow a readme in some safe format.
	if (!$prevent_xss && -s "$projectroot/$project/README.html") {
		print "<div class=\"title\">readme</div>\n" .
		      "<div class=\"readme\">\n";
		insert_file("$projectroot/$project/README.html");
		print "\n</div>\n"; # class="readme"
	}

	# we need to request one more than 16 (0..15) to check if
	# those 16 are all
	my @commitlist = $head ? parse_commits($head, 17) : ();
	if (@commitlist) {
		git_print_header_div('shortlog');
		git_shortlog_body(\@commitlist, 0, 15, $refs,
		                  $#commitlist <=  15 ? undef :
		                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
	}

	if (@taglist) {
		git_print_header_div('tags');
		git_tags_body(\@taglist, 0, 15,
		              $#taglist <=  15 ? undef :
		              $cgi->a({-href => href(action=>"tags")}, "..."));
	}

	if (@headlist) {
		git_print_header_div('heads');
		git_heads_body(\@headlist, $head, 0, 15,
		               $#headlist <= 15 ? undef :
		               $cgi->a({-href => href(action=>"heads")}, "..."));
	}

	if (%remotedata) {
		git_print_header_div('remotes');
		git_remotes_body(\%remotedata, 15, $head);
	}

	if (@forklist) {
		git_print_header_div('forks');
		git_project_list_body(\@forklist, 'age', 0, 15,
		                      $#forklist <= 15 ? undef :
		                      $cgi->a({-href => href(action=>"forks")}, "..."),
		                      'no_header');
	}

	git_footer_html();
}
5492
# 'tag' action: print the page for the tag object named by the global
# $hash: a header table with a link to the tagged object and, when known,
# the tag's authorship rows, followed by the tag message.
#
# Reports a 404 error when parse_tag() returns nothing for $hash.
sub git_tag {
	my %tag = parse_tag($hash);
	die_error(404, "Unknown tag object") unless %tag;

	my $head = git_get_head_hash($project);
	git_header_html();
	git_print_page_nav('','', $head,undef,$head);
	git_print_header_div('commit', esc_html($tag{'name'}), $hash);

	# header table: tagged object (as id and as type link), then authorship
	print "<div class=\"title_text\">\n" .
	      "<table class=\"object_header\">\n" .
	      "<tr>\n" .
	      "<td>object</td>\n" .
	      "<td>" . $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
	                       $tag{'object'}) . "</td>\n" .
	      "<td class=\"link\">" . $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
	                                      $tag{'type'}) . "</td>\n" .
	      "</tr>\n";
	git_print_authorship_rows(\%tag, 'author')
		if defined($tag{'author'});
	print "</table>\n\n" .
	      "</div>\n";

	# tag message, one escaped line at a time
	print "<div class=\"page_body\">";
	my $message_lines = $tag{'comment'};
	foreach my $text (@$message_lines) {
		chomp $text;
		print esc_html($text, -nbsp=>1) . "<br/>\n";
	}
	print "</div>\n";
	git_footer_html();
}
5527
# Shared implementation of the 'blame', 'blame_incremental' and 'blame_data'
# actions.
#
# The optional first argument selects the output format:
#   'porcelain'   (default) - HTML page built from "git blame -p"
#   'incremental'           - HTML page listing the file contents (read with
#                             "git cat-file blob") with empty commit cells,
#                             plus a progress bar and progress info block
#   'data'                  - text/plain copy of "git blame --incremental"
#                             output, terminated by an "END" line
# A 'porcelain' request with a true 'js' CGI parameter is switched to
# 'incremental'.
#
# Works on the globals $file_name, $hash and $hash_base ($hash, $hash_base
# and $action may be assigned here); problems are reported via die_error().
sub git_blame_common {
	my $format = shift || 'porcelain';
	if ($format eq 'porcelain' && $cgi->param('js')) {
		$format = 'incremental';
		$action = 'blame_incremental'; # for page title etc
	}

	# permissions
	unless (gitweb_check_feature('blame')) {
		die_error(403, "Blame view not allowed");
	}

	# error checking
	die_error(400, "No file name given") unless $file_name;
	$hash_base ||= git_get_head_hash($project);
	die_error(404, "Couldn't find base commit") unless $hash_base;
	my %co = parse_commit($hash_base)
		or die_error(404, "Commit not found");
	my $ftype = "blob";
	if (defined $hash) {
		$ftype = git_get_type($hash);
		die_error(400, "Object is not a blob")
			if ($ftype !~ "blob");
	} else {
		$hash = git_get_hash_by_path($hash_base, $file_name, "blob")
			or die_error(404, "Error looking up file");
	}

	# pick the git command (and the matching error message) for the format
	my (@git_args, $open_failure);
	if ($format eq 'incremental') {
		# get file contents (as base)
		@git_args = ('cat-file', 'blob', $hash);
		$open_failure = "Open git-cat-file failed";
	} elsif ($format eq 'data') {
		# run git-blame --incremental
		@git_args = ("blame", "--incremental", $hash_base, "--", $file_name);
		$open_failure = "Open git-blame --incremental failed";
	} else {
		# run git-blame --porcelain
		@git_args = ("blame", '-p', $hash_base, '--', $file_name);
		$open_failure = "Open git-blame --porcelain failed";
	}
	open my $fd, "-|", git_cmd(), @git_args
		or die_error(500, $open_failure);

	# incremental blame data returns early
	if ($format eq 'data') {
		print $cgi->header(
			-type=>"text/plain", -charset => "utf-8",
			-status=> "200 OK");
		local $| = 1; # output autoflush
		print while <$fd>;
		close $fd
			or print "ERROR $!\n";

		# end marker, optionally followed by timing information
		print 'END';
		if (defined $t0 && gitweb_check_feature('timed')) {
			print ' '.
			      tv_interval($t0, [ gettimeofday() ]).
			      ' '.$number_of_git_cmds;
		}
		print "\n";

		return;
	}

	# page header
	git_header_html();
	my $formats_nav =
		$cgi->a({-href => href(action=>"blob", -replay=>1)},
		        "blob") .
		" | ";
	# offer the blame flavour that is not currently shown
	$formats_nav .= ($format eq 'incremental')
		? $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
		          "blame") . " (non-incremental)"
		: $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
		          "blame") . " (incremental)";
	$formats_nav .=
		" | " .
		$cgi->a({-href => href(action=>"history", -replay=>1)},
		        "history") .
		" | " .
		$cgi->a({-href => href(action=>$action, file_name=>$file_name)},
		        "HEAD");
	git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
	git_print_page_path($file_name, $ftype, $hash_base);

	# page body
	if ($format eq 'incremental') {
		print "<noscript>\n<div class=\"error\"><center><b>\n".
		      "This page requires JavaScript to run.\n Use ".
		      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
		              'this page').
		      " instead.\n".
		      "</b></center></div>\n</noscript>\n";

		print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
	}

	print qq!<div class="page_body">\n!;
	if ($format eq 'incremental') {
		print qq!<div id="progress_info">... / ...</div>\n!;
	}
	print qq!<table id="blame_table" class="blame" width="100%">\n!.
	      #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
	      qq!<thead>\n!.
	      qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
	      qq!</thead>\n!.
	      qq!<tbody>\n!;

	my @rev_color = qw(light dark);
	my $num_colors = scalar(@rev_color);
	my $current_color = 0;

	if ($format eq 'incremental') {
		my $color_class = $rev_color[$current_color];

		# contents of a file: one row per line, commit cell left empty
		my $linenr = 0;
		while (my $line = <$fd>) {
			chomp $line;
			$linenr++;

			print qq!<tr id="l$linenr" class="$color_class">!.
			      qq!<td class="sha1"><a href=""> </a></td>!.
			      qq!<td class="linenr">!.
			      qq!<a class="linenr" href="">$linenr</a></td>!.
			      qq!<td class="pre">! . esc_html($line) . "</td>\n".
			      qq!</tr>\n!;
		}

	} else { # porcelain, i.e. ordinary blame
		my %metainfo = (); # saves information about commits

		# blame data
		while (my $line = <$fd>) {
			chomp $line;
			# the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
			# no <lines in group> for subsequent lines in group of lines
			my ($full_rev, $orig_lineno, $lineno, $group_size) =
			   ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
			$metainfo{$full_rev} = { 'nprevious' => 0 }
				unless exists $metainfo{$full_rev};
			my $meta = $metainfo{$full_rev};

			# read the "<key> <value>" lines that follow the header, up to
			# the tab-prefixed line holding the contents of the line
			my $data;
			while ($data = <$fd>) {
				chomp $data;
				last if ($data =~ s/^\t//); # contents of line
				if ($data =~ /^(\S+)(?: (.*))?$/) {
					# first value seen for a key wins
					$meta->{$1} = $2 unless exists $meta->{$1};
				}
				$meta->{'nprevious'}++
					if ($data =~ /^previous /);
			}

			my $short_rev = substr($full_rev, 0, 8);
			my $author = $meta->{'author'};
			my %date =
				parse_date($meta->{'author-time'}, $meta->{'author-tz'});
			my $date = $date{'iso-tz'};

			# a header with <lines in group> starts a new group of lines
			my $starts_group = $group_size;
			if ($starts_group) {
				$current_color = ($current_color + 1) % $num_colors;
			}
			my $tr_class = $rev_color[$current_color];
			$tr_class .= ' boundary' if (exists $meta->{'boundary'});
			$tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
			$tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
			print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";

			# commit cell, printed once per group and spanning its rows
			if ($starts_group) {
				print "<td class=\"sha1\"";
				print " title=\"". esc_html($author) . ", $date\"";
				print " rowspan=\"$group_size\"" if ($group_size > 1);
				print ">";
				print $cgi->a({-href => href(action=>"commit",
				                             hash=>$full_rev,
				                             file_name=>$file_name)},
				              esc_html($short_rev));
				if ($group_size >= 2) {
					my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
					if (@author_initials) {
						print "<br />" .
						      esc_html(join('', @author_initials));
						#           or join('.', ...)
					}
				}
				print "</td>\n";
			}

			# 'previous' <sha1 of parent commit> <filename at commit>
			if (exists $meta->{'previous'} &&
			    $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
				$meta->{'parent'} = $1;
				$meta->{'file_parent'} = unquote($2);
			}

			# the line number links to the blame of the parent commit when
			# one is known, otherwise to the blame of this commit
			my $linenr_commit =
				exists($meta->{'parent'}) ?
				$meta->{'parent'} : $full_rev;
			my $linenr_filename =
				exists($meta->{'file_parent'}) ?
				$meta->{'file_parent'} : unquote($meta->{'filename'});
			my $blamed = href(action => 'blame',
			                  file_name => $linenr_filename,
			                  hash_base => $linenr_commit);
			print "<td class=\"linenr\">";
			print $cgi->a({ -href => "$blamed#l$orig_lineno",
			                -class => "linenr" },
			              esc_html($lineno));
			print "</td>";
			print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
			print "</tr>\n";
		} # end while

	}

	# footer
	print "</tbody>\n".
	      "</table>\n"; # class="blame"
	print "</div>\n";   # class="page_body"
	close $fd
		or print "Reading blob failed\n";

	git_footer_html();
}
5757
# 'blame' action: git_blame_common() with its default format.
sub git_blame {
	return git_blame_common();
}
5761
# 'blame_incremental' action: git_blame_common() in 'incremental' format.
sub git_blame_incremental {
	return git_blame_common('incremental');
}
5765
# 'blame_data' action: git_blame_common() in 'data' format.
sub git_blame_data {
	return git_blame_common('data');
}
5769
# 'tags' action: print the page with the full table of tags of $project.
# The table is omitted when the project has no tags.
sub git_tags {
	my $head = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
	git_print_header_div('summary', $project);

	my @all_tags = git_get_tags_list();
	git_tags_body(\@all_tags) if @all_tags;

	git_footer_html();
}
5782
# 'heads' action: print the page with the full table of heads of $project.
# The table is omitted when the project has no heads.
sub git_heads {
	my $head = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
	git_print_header_div('summary', $project);

	my @all_heads = git_get_heads_list();
	git_heads_body(\@all_heads, $head) if @all_heads;

	git_footer_html();
}
5795
5796# used both for single remote view and for list of all the remotes
# 'remotes' action.  The remote to show is taken from the 'hash' input
# parameter; when it is not given, all remotes are listed.
# Ends with die_error() when the 'remote_heads' feature is off, when the
# remote information cannot be obtained, or when nothing was found.
sub git_remotes {
        die_error(403, "Remote heads view is disabled")
                unless gitweb_check_feature('remote_heads');

        my $head_hash = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        if (!defined $remotedata) {
                die_error(500, "Unable to get remote information");
        }

        if (!%$remotedata) {
                my $message = defined $remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $message);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                format_ref_views($remote ? '' : 'remotes'));

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                # list of all the remotes
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head_hash);
        } else {
                # single remote view
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head_hash);
        }

        git_footer_html();
}
5828
# 'blob_plain' action: send the raw contents of a blob to the client.
#
# Parameters:
#   $type - optional content type; it is passed on to blob_contenttype(),
#           whose return value is the content type actually sent
#
# The blob is named by the global $hash; when $hash is not set it is
# looked up from $file_name in $hash_base (or in the project's HEAD).
# Ends with die_error() when the blob cannot be identified or when
# git-cat-file cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name ends up inside a quoted-string of the Content-Disposition
        # header, so '"' and '\' have to be backslash-escaped (the same
        # escaping git_snapshot applies to its filename).
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        #
        # $type can carry parameters (e.g. "; charset=..."), so the safe
        # media type must be allowed to be followed by ' ' or ';' and not
        # only by the end of the string.
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp mode: the blob is copied to the client as-is
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
5881
# 'blob' action: HTML view of a single blob.
#
# The blob is named by the global $hash, or found from $file_name in
# $hash_base (or in the project's HEAD).  Content that is neither text nor
# one of the inlinable image types, and that looks binary, is handed over
# to git_blob_plain().  Images are shown via an <img> pointing at the
# 'blob_plain' view; everything else is printed line by line with line
# number anchors, optionally run through the highlighter.
sub git_blob {
        my $expires;

        if (defined $hash) {
                # blobs defined by non-textual hash id's can be cached
                if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = "+1d";
                }
        } elsif (defined $file_name) {
                my $base = $hash_base || git_get_head_hash($project);
                $hash = git_get_hash_by_path($base, $file_name, "blob")
                        or die_error(404, "Cannot find file");
        } else {
                die_error(400, "No file name defined");
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);

        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        my $displayable = ($mimetype =~ m!^(?:text/|image/(?:gif|png|jpeg)$)!);
        if (!$displayable && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }

        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        if ($syntax) {
                $fd = run_highlighter($fd, $highlight, $syntax);
        }

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                # collect the individual links, then join them with ' | '
                my @links;
                if (defined $file_name) {
                        if ($have_blame) {
                                my $blame_link =
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame");
                                push @links, $blame_link;
                        }
                        my $history_link =
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history");
                        my $raw_link =
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                        my $head_link =
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                        push @links, $history_link, $raw_link, $head_link;
                } else {
                        my $raw_link =
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                        push @links, $raw_link;
                }
                $formats_nav .= join(" | ", @links);

                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable commit: empty navigation, title is the blob id
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">" . esc_html($hash) . "</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";

        if ($mimetype =~ m!^image/!) {
                print '<img type="' . esc_attr($mimetype) . '"';
                if ($file_name) {
                        print ' alt="' . esc_attr($file_name) .
                              '" title="' . esc_attr($file_name) . '"';
                }
                print ' src="' .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        } else {
                my $lineno = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $lineno++;
                        $line = untabify($line);
                        # highlighter output is printed as-is, plain text is escaped
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $lineno, esc_attr(href(-replay => 1)), $lineno, $lineno,
                               $syntax ? $line : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
5973
# 'tree' action: HTML listing of a tree object.
#
# $hash_base defaults to "HEAD".  The tree is named by $hash, or found
# from $file_name in $hash_base, or is $hash_base itself.  Ends with
# die_error() when no tree can be determined or git-ls-tree fails.
sub git_tree {
        $hash_base = "HEAD" unless defined $hash_base;
        if (!defined $hash) {
                $hash = defined $file_name
                        ? git_get_hash_by_path($hash_base, $file_name, "tree")
                        : $hash_base;
        }
        defined($hash)
                or die_error(404, "No such tree");

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # "ls-tree -z" output is NUL-separated
                local $/ = "\0";
                my @ls_tree = (git_cmd(), "ls-tree", '-z',
                               ($show_sizes ? '-l' : ()), @extra_options, $hash);
                open my $fd, "-|", @ls_tree
                        or die_error(500, "Open git-ls-tree failed");
                while (my $entry = <$fd>) {
                        chomp $entry;
                        push @entries, $entry;
                }
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                # FIXME: Should be available when we have no hash base as well.
                push @views_nav, $snapshot_links
                        if defined $snapshot_links;

                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base is not a usable commit; forget it for the rest of the page
                undef $hash_base;
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">" . esc_html($hash) . "</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                # make sure a non-empty base directory ends with a slash
                $basedir .= '/'
                        if ($basedir ne '' && substr($basedir, -1) ne '/');
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";

        # rows alternate between "dark" and "light", starting with "dark"
        my $alternate = 1;
        my $start_row = sub {
                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;
        };

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                $start_row->();

                # strip the last path component; an empty result means top level
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                $up = undef if !$up;

                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                if ($show_sizes) {
                        print '<td class="size">&nbsp;</td>' . "\n";
                }
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n" .
                      "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $entry (@entries) {
                my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

                $start_row->();
                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);
                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
6083
# Build the base name of a snapshot as "<project>-<version>".
#
# Parameters:
#   $project - project path, e.g. "path/to/project.git"
#   $hash    - object name: hexadecimal id or a ref name
#
# Returns the name in scalar context, and the pair ($name, $name) in list
# context (git_snapshot uses the pair as file name and archive prefix).
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s{([^/])/*\.git$}{$1};
        $name = basename($name);
        # sanitize name
        $name =~ s/[[:cntrl:]]/?/g;

        # version string; the object name itself unless one of the cases
        # below applies
        my $ver = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                my $full_hash = git_get_full_hash($project, $hash);
                if ($full_hash =~ /^$hash/ && length($hash) > 7) {
                        $ver = git_get_short_hash($project, $hash);
                }
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $ver = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                $ver = $1
                        if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!);
                $ver = $ver . '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $ver =~ tr!/!.!;

        # name = project-version_string
        $name .= "-$ver";

        if (wantarray) {
                return ($name, $name);
        }
        return $name;
}
6120
# 'snapshot' action: send an archive of a tree-ish, produced by
# "git archive" and, when the format defines one, piped through its
# compressor.
#
# Input (globals): $input_params{'snapshot_format'} selects the format and
# defaults to the first entry of @snapshot_fmts; $hash names the object.
#
# Ends with die_error() when snapshots are disabled, when the format is
# invalid, unknown, disabled or not among @snapshot_fmts, when the object
# does not exist or is a blob, or when the command cannot be started.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # "^{}" peels tags, so the type is the one of the object pointed to
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the command before any output is produced, so that a failure
        # to run it is still reported as a proper error page and not appended
        # to an already sent "200 OK" header.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # the name goes into a quoted-string: escape '"' and '\'
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # copy the archive in fixed-size chunks instead of reading all of it
        # into memory first
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6168
# Common implementation of log-like views (git_log calls it with 'log').
#
# Parameters:
#   $fmt_name  - name of the view; passed to format_paging_nav() and
#                git_print_page_nav()
#   $body_subr - code reference that prints the list of commits; it is
#                called with (\@commitlist, 0, 99, $refs, $next_link,
#                $file_name, $file_hash, $ftype)
#   $base      - commit to start from; defaults to the project's HEAD hash
#   $parent    - optional; when defined the range "$parent..$base" is shown
#   $file_name - optional path limiting the log to the history of that path
#   $file_hash - optional id of the object at $file_name; searched for in
#                the listed commits when not given
#
# One page holds 100 commits; 101 are requested so that the existence of a
# next page can be detected.  Ends with die_error() when the type of the
# path cannot be determined or $base cannot be parsed as a commit.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # List assignment, as git_commitdiff does: this takes the first
        # value returned by gitweb_get_feature() whatever it returns in
        # scalar context.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # a negative limit means "no limit"
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project);
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6242
# 'log' action: git_log_generic() with the 'log' view name, git_log_body()
# as the body printer, and $hash / $hash_parent as base and parent.
sub git_log {
        my $body_printer = \&git_log_body;
        return git_log_generic('log', $body_printer, $hash, $hash_parent);
}
6247
# 'commit' action: page describing a single commit -- authorship, tree and
# parent links, the log message and the list of changed files.
#
# The commit is named by $hash, falling back to $hash_base and then "HEAD".
# Ends with die_error() when the commit cannot be parsed or git-diff-tree
# fails.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # link to the 'commit' view of an id, labelled with its first 7 chars
        my $short_commit_link = sub {
                my ($id) = @_;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav = '(parent: ' . $short_commit_link->($parent) . ')';
        } else {
                # merge commit
                $formats_nav =
                        '(merge: ' .
                        join(' ', map { $short_commit_link->($_) } @$parents) .
                        ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # what to diff against: the only parent, "--root" for a commit
        # without parents, or the combined ('-c') form for a merge
        my $diff_against = '-c';
        if (@$parents <= 1) {
                $diff_against = defined $parent ? $parent : "--root";
        }
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                $diff_against,
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree;
        while (my $line = <$fd>) {
                chomp $line;
                push @difftree, $line;
        }
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
        } else {
                git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
        }

        # object header table: authorship, commit id, tree and parents
        print "<div class=\"title_text\">\n";
        print "<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print '<tr><td>commit</td><td class="sha1">' . $co{'id'} . "</td></tr>\n";

        my @tree_view = (action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
        print '<tr><td>tree</td><td class="sha1">' .
              $cgi->a({-href => href(@tree_view),
                       class => "list"}, $co{'tree'}) .
              '</td><td class="link">' .
              $cgi->a({-href => href(@tree_view)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        if (defined $snapshot_links) {
                print " | " . $snapshot_links;
        }
        print "</td></tr>\n";

        foreach my $par (@$parents) {
                my @commit_view = (action=>"commit", hash=>$par);
                print '<tr><td>parent</td><td class="sha1">' .
                      $cgi->a({-href => href(@commit_view),
                               class => "list"}, $par) .
                      '</td><td class="link">' .
                      $cgi->a({-href => href(@commit_view)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
                      "</td></tr>\n";
        }
        print "</table></div>\n";

        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
6361
# 'object' action: find out the type of an object and redirect (302) to
# the view named after that type.
#
# The object is defined by:
# - hash or hash_base alone
# - hash_base and file_name
#
# Ends with die_error() when the object (or the path in the given base)
# does not exist, or when there is not enough information to find it.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                close $fd
                        or die_error(404, "Object does not exist");
                # nothing was printed: there is no type to redirect to
                # (and chomp would warn about an undefined value)
                defined $type
                        or die_error(404, "Object does not exist");
                chomp $type;

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                # trailing slashes are not part of the path to look up
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
6408
# 'blobdiff' action: diff of a single file between two commits.
#
# Parameters:
#   $format - 'html' (default) or 'plain'; anything else ends with
#             die_error(400)
#
# Only the "new style" URI is supported: $hash_base and $hash_parent_base
# must be defined, together with either $file_name or a 40-digit $hash from
# which the file is found in the raw diff-tree output.  Ends with
# die_error() when parameters are missing, the specification is ambiguous,
# or git-diff-tree fails.
sub git_blobdiff {
        my $format = shift || 'html';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever was not given explicitly from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # NOTE(review): numeric status code, like every other
                # die_error() call; the former '404 Not Found' string looks
                # like a leftover -- confirm against die_error().
                die_error(404, "Missing one of the blob diff parameters")
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # the name goes into a quoted-string of the header, so '"'
                # and '\' are backslash-escaped (as git_snapshot does)
                my $patch_name = "$file_name";
                $patch_name =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # up to and including the "+++" line, object ids that follow
                # "a/" or "b/" are replaced with the escaped file names
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is copied through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
6540
# 'blobdiff_plain' action: same as git_blobdiff(), but asking for the
# 'plain' output format.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
6544
# Output the changes introduced by commit $hash, or the difference
# between $hash_parent and $hash when a parent is given.
#
# Named parameters:
#   -format => 'html' (default), 'plain' or 'patch'
#   -single => if true (and no parent is given), limit 'patch' output
#              to a single patch
#
# Works on the request globals $hash, $hash_base and $hash_parent; $hash
# and $hash_parent may be given default values here.  Ends in die_error()
# when the 'patch' format is requested but the 'patches' feature is off
# (403), when the commit cannot be parsed (404), when the git command
# cannot be opened (500), or when the format is unknown (400).
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                # the "patch" link is offered only for non-merge commits
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of the commit's parents
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$hash_parent)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$co{'parent'})},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit: offer a link to the other combined diff style
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$_)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                # consume only the raw part here; the patch part is left
                # on $fd for git_patchset_body() below
                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                # '-c' and '--cc' are diff-tree options (the latter is the
                # default chosen above for merge commits), not revisions, so
                # they must never be used to build a "parent..commit" range.
                my $have_parent_rev = $hash_parent &&
                        $hash_parent ne '-c' && $hash_parent ne '--cc';
                if ($have_parent_rev) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # NOTE(review): $refs is not used below; kept because it is
                # unclear from here whether the call is relied on elsewhere.
                my $refs = git_get_references("tags");
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                # mail-like header block followed by the commit message
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit parent revision, diff against the
                # commit's own parents
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # slurp the rest of the command output in one go
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
6769
# 'commitdiff_plain' action: git_commitdiff() in the 'plain' format.
sub git_commitdiff_plain {
        return git_commitdiff('-format', 'plain');
}
6773
6774# format-patch-style patches
# 'patch' action: git_commitdiff() in the 'patch' format, with the
# -single flag set.
sub git_patch {
        return git_commitdiff(
                '-format' => 'patch',
                '-single' => 1,
        );
}
6778
# 'patches' action: git_commitdiff() in the 'patch' format, without
# the -single flag.
sub git_patches {
        return git_commitdiff('-format', 'patch');
}
6782
# 'history' action: hand over to git_log_generic() with
# git_history_body() as the body printer, passing the base hashes,
# the file name and the object hash of the current request.
sub git_history {
        my $body_printer = \&git_history_body;

        return git_log_generic('history', $body_printer,
                               $hash_base, $hash_parent_base,
                               $file_name, $hash);
}
6788
# 'search' action: search the project starting from commit $hash
# (the project's head when $hash is not given).
#
# Uses the request globals $searchtext, $searchtype, $search_use_regexp,
# $search_regexp, $page and $hash.  Supported values of $searchtype:
#   commit, author, committer - paged search through the commit log
#   pickaxe                   - commits found by "git log -S<text>"
#   grep                      - "git grep" in the tree of the commit
#
# Ends in die_error() when searching (or the requested search type) is
# disabled (403), when no search text was given (400) or when the
# commit cannot be parsed (404).
sub git_search {
        gitweb_check_feature('search') or die_error(403, "Search is disabled");
        if (!defined $searchtext) {
                die_error(400, "Text field is empty");
        }
        if (!defined $hash) {
                $hash = git_get_head_hash($project);
        }
        my %co = parse_commit($hash);
        if (!%co) {
                die_error(404, "Unknown commit object");
        }
        if (!defined $page) {
                $page = 0;
        }

        $searchtype ||= 'commit';
        if ($searchtype eq 'pickaxe') {
                # pickaxe may take all resources of your box and run for several minutes
                # with every query - so decide by yourself how public you make this feature
                gitweb_check_feature('pickaxe')
                    or die_error(403, "Pickaxe is disabled");
        }
        if ($searchtype eq 'grep') {
                gitweb_check_feature('grep')
                    or die_error(403, "Grep is disabled");
        }

        git_header_html();

        if ($searchtype eq 'commit' or $searchtype eq 'author' or $searchtype eq 'committer') {
                my $greptype;
                if ($searchtype eq 'commit') {
                        $greptype = "--grep=";
                } elsif ($searchtype eq 'author') {
                        $greptype = "--author=";
                } elsif ($searchtype eq 'committer') {
                        $greptype = "--committer=";
                }
                $greptype .= $searchtext;
                # ask for 101 commits: 100 to show, plus one to know
                # whether there is a next page
                my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                               $greptype, '--regexp-ignore-case',
                                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

                my $paging_nav = '';
                if ($page > 0) {
                        $paging_nav .=
                                $cgi->a({-href => href(action=>"search", hash=>$hash,
                                                       searchtext=>$searchtext,
                                                       searchtype=>$searchtype)},
                                        "first");
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                } else {
                        $paging_nav .= "first";
                        $paging_nav .= " &sdot; prev";
                }
                my $next_link = '';
                if ($#commitlist >= 100) {
                        $next_link =
                                $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                         -accesskey => "n", -title => "Alt-n"}, "next");
                        $paging_nav .= " &sdot; $next_link";
                } else {
                        $paging_nav .= " &sdot; next";
                }

                git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);
                if ($page == 0 && !@commitlist) {
                        print "<p>No match.</p>\n";
                } else {
                        git_search_grep_body(\@commitlist, 0, 99, $next_link);
                }
        }

        if ($searchtype eq 'pickaxe') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"pickaxe search\">\n";
                my $alternate = 1;
                local $/ = "\n";
                open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                        '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                        ($search_use_regexp ? '--pickaxe-regex' : ());
                # from here on %co holds the commit whose table row is
                # currently open (empty before the first commit line)
                undef %co;
                my @files;
                while (my $line = <$fd>) {
                        chomp $line;
                        next unless $line;

                        my %set = parse_difftree_raw_line($line);
                        if (defined $set{'commit'}) {
                                # finish previous commit
                                if (%co) {
                                        print "</td>\n" .
                                              "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                                              " | " .
                                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                                        print "</td>\n" .
                                              "</tr>\n";
                                }

                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                %co = parse_commit($set{'commit'});
                                my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                                      "<td><i>$author</i></td>\n" .
                                      "<td>" .
                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                              -class => "list subject"},
                                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        } elsif (defined $set{'to_id'}) {
                                # an all-zero id: there is no resulting blob to link to
                                next if ($set{'to_id'} =~ m/^0{40}$/);

                                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                              -class => "list"},
                                              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                                      "<br/>\n";
                        }
                }
                close $fd;

                # finish last commit (warning: repetition!)
                if (%co) {
                        print "</td>\n" .
                              "<td class=\"link\">" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                              " | " .
                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                        print "</td>\n" .
                              "</tr>\n";
                }

                print "</table>\n";
        }

        if ($searchtype eq 'grep') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"grep_search\">\n";
                my $alternate = 1;
                my $matches = 0;
                local $/ = "\n";
                open my $fd, "-|", git_cmd(), 'grep', '-n',
                        $search_use_regexp ? ('-E', '-i') : '-F',
                        $searchtext, $co{'tree'};
                my $lastfile = '';
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($file, $lno, $ltext, $binary);
                        # stop listing once the match limit is exceeded
                        last if ($matches++ > 1000);
                        if ($line =~ /^Binary file (.+) matches$/) {
                                $file = $1;
                                $binary = 1;
                        } else {
                                # the first field is discarded; the rest is
                                # file name, line number and line text
                                (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
                        }
                        if ($file ne $lastfile) {
                                # new file: close the previous row, open the next one
                                $lastfile and print "</td></tr>\n";
                                # toggle the row class, like the pickaxe table does
                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                # link to the file as of the searched commit
                                print "<td class=\"list\">".
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file"),
                                                -class => "list"}, esc_path($file));
                                print "</td><td>\n";
                                $lastfile = $file;
                        }
                        if ($binary) {
                                print "<div class=\"binary\">Binary file</div>\n";
                        } else {
                                $ltext = untabify($ltext);
                                # highlight the matched part of the line
                                if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                        $ltext = esc_html($1, -nbsp=>1);
                                        $ltext .= '<span class="match">';
                                        $ltext .= esc_html($2, -nbsp=>1);
                                        $ltext .= '</span>';
                                        $ltext .= esc_html($3, -nbsp=>1);
                                } else {
                                        $ltext = esc_html($ltext, -nbsp=>1);
                                }
                                print "<div class=\"pre\">" .
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file").'#l'.$lno,
                                                -class => "linenr"}, sprintf('%4i', $lno))
                                        . ' ' .  $ltext . "</div>\n";
                        }
                }
                if ($lastfile) {
                        print "</td></tr>\n";
                        if ($matches > 1000) {
                                print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                        }
                } else {
                        print "<div class=\"diff nodifferences\">No matches found</div>\n";
                }
                close $fd;

                print "</table>\n";
        }
        git_footer_html();
}
7005
# 'search_help' action: print a page describing the search types.
# The 'grep' and 'pickaxe' entries are printed only when
# gitweb_check_feature() reports the respective feature as enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general introduction and the 'commit' search type
        print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        # optional: 'grep' search type
        if (gitweb_check_feature('grep')) {
                print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        # 'author' and 'committer' search types
        print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        # optional: 'pickaxe' search type
        if (gitweb_check_feature('pickaxe')) {
                print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7049
# 'shortlog' action: hand over to git_log_generic() with
# git_shortlog_body() as the body printer, for the requested
# $hash and $hash_parent.
sub git_shortlog {
        my $body_printer = \&git_shortlog_body;

        return git_log_generic('shortlog', $body_printer,
                               $hash, $hash_parent);
}
7054
7055## ......................................................................
7056## feeds (RSS, Atom; OPML)
7057
7058sub git_feed {
7059        my $format = shift || 'atom';
7060        my $have_blame = gitweb_check_feature('blame');
7061
7062        # Atom: http://www.atomenabled.org/developers/syndication/
7063        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
7064        if ($format ne 'rss' && $format ne 'atom') {
7065                die_error(400, "Unknown web feed format");
7066        }
7067
7068        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
7069        my $head = $hash || 'HEAD';
7070        my @commitlist = parse_commits($head, 150, 0, $file_name);
7071
7072        my %latest_commit;
7073        my %latest_date;
7074        my $content_type = "application/$format+xml";
7075        if (defined $cgi->http('HTTP_ACCEPT') &&
7076                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
7077                # browser (feed reader) prefers text/xml
7078                $content_type = 'text/xml';
7079        }
7080        if (defined($commitlist[0])) {
7081                %latest_commit = %{$commitlist[0]};
7082                my $latest_epoch = $latest_commit{'committer_epoch'};
7083                %latest_date   = parse_date($latest_epoch, $latest_commit{'comitter_tz'});
7084                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
7085                if (defined $if_modified) {
7086                        my $since;
7087                        if (eval { require HTTP::Date; 1; }) {
7088                                $since = HTTP::Date::str2time($if_modified);
7089                        } elsif (eval { require Time::ParseDate; 1; }) {
7090                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
7091                        }
7092                        if (defined $since && $latest_epoch <= $since) {
7093                                print $cgi->header(
7094                                        -type => $content_type,
7095                                        -charset => 'utf-8',
7096                                        -last_modified => $latest_date{'rfc2822'},
7097                                        -status => '304 Not Modified');
7098                                return;
7099                        }
7100                }
7101                print $cgi->header(
7102                        -type => $content_type,
7103                        -charset => 'utf-8',
7104                        -last_modified => $latest_date{'rfc2822'});
7105        } else {
7106                print $cgi->header(
7107                        -type => $content_type,
7108                        -charset => 'utf-8');
7109        }
7110
7111        # Optimization: skip generating the body if client asks only
7112        # for Last-Modified date.
7113        return if ($cgi->request_method() eq 'HEAD');
7114
7115        # header variables
7116        my $title = "$site_name - $project/$action";
7117        my $feed_type = 'log';
7118        if (defined $hash) {
7119                $title .= " - '$hash'";
7120                $feed_type = 'branch log';
7121                if (defined $file_name) {
7122                        $title .= " :: $file_name";
7123                        $feed_type = 'history';
7124                }
7125        } elsif (defined $file_name) {
7126                $title .= " - $file_name";
7127                $feed_type = 'history';
7128        }
7129        $title .= " $feed_type";
7130        my $descr = git_get_project_description($project);
7131        if (defined $descr) {
7132                $descr = esc_html($descr);
7133        } else {
7134                $descr = "$project " .
7135                         ($format eq 'rss' ? 'RSS' : 'Atom') .
7136                         " feed";
7137        }
7138        my $owner = git_get_project_owner($project);
7139        $owner = esc_html($owner);
7140
7141        #header
7142        my $alt_url;
7143        if (defined $file_name) {
7144                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
7145        } elsif (defined $hash) {
7146                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
7147        } else {
7148                $alt_url = href(-full=>1, action=>"summary");
7149        }
7150        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
7151        if ($format eq 'rss') {
7152                print <<XML;
7153<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
7154<channel>
7155XML
7156                print "<title>$title</title>\n" .
7157                      "<link>$alt_url</link>\n" .
7158                      "<description>$descr</description>\n" .
7159                      "<language>en</language>\n" .
7160                      # project owner is responsible for 'editorial' content
7161                      "<managingEditor>$owner</managingEditor>\n";
7162                if (defined $logo || defined $favicon) {
7163                        # prefer the logo to the favicon, since RSS
7164                        # doesn't allow both
7165                        my $img = esc_url($logo || $favicon);
7166                        print "<image>\n" .
7167                              "<url>$img</url>\n" .
7168                              "<title>$title</title>\n" .
7169                              "<link>$alt_url</link>\n" .
7170                              "</image>\n";
7171                }
7172                if (%latest_date) {
7173                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
7174                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
7175                }
7176                print "<generator>gitweb v.$version/$git_version</generator>\n";
7177        } elsif ($format eq 'atom') {
7178                print <<XML;
7179<feed xmlns="http://www.w3.org/2005/Atom">
7180XML
7181                print "<title>$title</title>\n" .
7182                      "<subtitle>$descr</subtitle>\n" .
7183                      '<link rel="alternate" type="text/html" href="' .
7184                      $alt_url . '" />' . "\n" .
7185                      '<link rel="self" type="' . $content_type . '" href="' .
7186                      $cgi->self_url() . '" />' . "\n" .
7187                      "<id>" . href(-full=>1) . "</id>\n" .
7188                      # use project owner for feed author
7189                      "<author><name>$owner</name></author>\n";
7190                if (defined $favicon) {
7191                        print "<icon>" . esc_url($favicon) . "</icon>\n";
7192                }
7193                if (defined $logo) {
7194                        # not twice as wide as tall: 72 x 27 pixels
7195                        print "<logo>" . esc_url($logo) . "</logo>\n";
7196                }
7197                if (! %latest_date) {
7198                        # dummy date to keep the feed valid until commits trickle in:
7199                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
7200                } else {
7201                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
7202                }
7203                print "<generator version='$version/$git_version'>gitweb</generator>\n";
7204        }
7205
7206        # contents
7207        for (my $i = 0; $i <= $#commitlist; $i++) {
7208                my %co = %{$commitlist[$i]};
7209                my $commit = $co{'id'};
7210                # we read 150, we always show 30 and the ones more recent than 48 hours
7211                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
7212                        last;
7213                }
7214                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});
7215
7216                # get list of changed files
7217                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7218                        $co{'parent'} || "--root",
7219                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
7220                        or next;
7221                my @difftree = map { chomp; $_ } <$fd>;
7222                close $fd
7223                        or next;
7224
7225                # print element (entry, item)
7226                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
7227                if ($format eq 'rss') {
7228                        print "<item>\n" .
7229                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
7230                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
7231                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
7232                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
7233                              "<link>$co_url</link>\n" .
7234                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
7235                              "<content:encoded>" .
7236                              "<![CDATA[\n";
7237                } elsif ($format eq 'atom') {
7238                        print "<entry>\n" .
7239                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
7240                              "<updated>$cd{'iso-8601'}</updated>\n" .
7241                              "<author>\n" .
7242                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
7243                        if ($co{'author_email'}) {
7244                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
7245                        }
7246                        print "</author>\n" .
7247                              # use committer for contributor
7248                              "<contributor>\n" .
7249                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
7250                        if ($co{'committer_email'}) {
7251                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
7252                        }
7253                        print "</contributor>\n" .
7254                              "<published>$cd{'iso-8601'}</published>\n" .
7255                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
7256                              "<id>$co_url</id>\n" .
7257                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
7258                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
7259                }
7260                my $comment = $co{'comment'};
7261                print "<pre>\n";
7262                foreach my $line (@$comment) {
7263                        $line = esc_html($line);
7264                        print "$line\n";
7265                }
7266                print "</pre><ul>\n";
7267                foreach my $difftree_line (@difftree) {
7268                        my %difftree = parse_difftree_raw_line($difftree_line);
7269                        next if !$difftree{'from_id'};
7270
7271                        my $file = $difftree{'file'} || $difftree{'to_file'};
7272
7273                        print "<li>" .
7274                              "[" .
7275                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
7276                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
7277                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
7278                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
7279                                      -title => "diff"}, 'D');
7280                        if ($have_blame) {
7281                                print $cgi->a({-href => href(-full=>1, action=>"blame",
7282                                                             file_name=>$file, hash_base=>$commit),
7283                                              -title => "blame"}, 'B');
7284                        }
7285                        # if this is not a feed of a file history
7286                        if (!defined $file_name || $file_name ne $file) {
7287                                print $cgi->a({-href => href(-full=>1, action=>"history",
7288                                                             file_name=>$file, hash=>$commit),
7289                                              -title => "history"}, 'H');
7290                        }
7291                        $file = esc_path($file);
7292                        print "] ".
7293                              "$file</li>\n";
7294                }
7295                if ($format eq 'rss') {
7296                        print "</ul>]]>\n" .
7297                              "</content:encoded>\n" .
7298                              "</item>\n";
7299                } elsif ($format eq 'atom') {
7300                        print "</ul>\n</div>\n" .
7301                              "</content>\n" .
7302                              "</entry>\n";
7303                }
7304        }
7305
7306        # end of feed
7307        if ($format eq 'rss') {
7308                print "</channel>\n</rss>\n";
7309        } elsif ($format eq 'atom') {
7310                print "</feed>\n";
7311        }
7312}
7313
# Thin wrapper around git_feed(): requests the feed in 'rss' format
# and hands back whatever git_feed() returns.
sub git_rss {
        return git_feed('rss');
}
7317
# Thin wrapper around git_feed(): requests the feed in 'atom' format
# and hands back whatever git_feed() returns.
sub git_atom {
        return git_feed('atom');
}
7321
# Print an OPML 1.0 document with one <outline type="rss"> entry per
# project returned by git_get_projects_list().
#
# Takes no arguments.  Writes the HTTP header (text/xml, utf-8, inline
# "opml.xml") followed by the XML document to the default output handle.
#
# A project is left out of the listing when git_get_head_hash() returns
# undef for it, or when parse_commit() yields an empty hash for its head.
#
# Side effect: the global $git_dir is reassigned for every project whose
# head hash could be resolved, and is left pointing at the last such one.
sub git_opml {
        my @list = git_get_projects_list();

        # The site name is free-form configured text, not markup.  Escape it
        # before embedding it in the document so that characters such as
        # '&' or '<' cannot make the generated XML malformed.
        my $title = esc_html($site_name);

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;

                # skip projects without a resolvable head
                my $head = git_get_head_hash($proj{'path'});
                next if !defined $head;

                # $git_dir is set before parse_commit() is called
                # NOTE(review): presumably parse_commit() reads the repository
                # named by $git_dir -- confirm against its definition
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                next if !%co;

                # shortened, escaped project path used as the outline label
                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}