6651946f54f8fbfd8b96701753caa028f9814232
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
# Apply the ':utf8' output layer to STDOUT.
binmode STDOUT, ':utf8';

# $t0 is a timestamp taken when the script starts; $number_of_git_cmds is
# a running counter of git commands executed (evaluate_git_version()
# increments it).  Presumably both feed the 'timed' feature -- confirm
# against the code that reports them.
our $t0 = [ gettimeofday() ];
our $number_of_git_cmds = 0;

# When running under mod_perl (MOD_PERL set in the environment), call
# CGI->compile() at compile time -- presumably to precompile CGI.pm's
# methods once up front.
BEGIN {
        CGI->compile() if $ENV{'MOD_PERL'};
}

# gitweb version string.
# NOTE(review): "++GIT_VERSION++" looks like a placeholder substituted
# at build time -- confirm against the build system.
our $version = "++GIT_VERSION++";
  31
  32our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  33sub evaluate_uri {
  34        our $cgi;
  35
  36        our $my_url = $cgi->url();
  37        our $my_uri = $cgi->url(-absolute => 1);
  38
  39        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  40        # needed and used only for URLs with nonempty PATH_INFO
  41        our $base_url = $my_url;
  42
  43        # When the script is used as DirectoryIndex, the URL does not contain the name
  44        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  45        # have to do it ourselves. We make $path_info global because it's also used
  46        # later on.
  47        #
  48        # Another issue with the script being the DirectoryIndex is that the resulting
  49        # $my_url data is not the full script URL: this is good, because we want
  50        # generated links to keep implying the script name if it wasn't explicitly
  51        # indicated in the URL we're handling, but it means that $my_url cannot be used
  52        # as base URL.
  53        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  54        # to build the base URL ourselves:
  55        our $path_info = $ENV{"PATH_INFO"};
  56        if ($path_info) {
  57                if ($my_url =~ s,\Q$path_info\E$,, &&
  58                    $my_uri =~ s,\Q$path_info\E$,, &&
  59                    defined $ENV{'SCRIPT_NAME'}) {
  60                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  61                }
  62        }
  63
  64        # target of the home link on top of all pages
  65        our $home_link = $my_uri || "/";
  66}
  67
# Site configuration defaults.
# NOTE(review): the "++NAME++" strings in this section look like
# placeholders substituted at build time -- confirm against the build system.

# core git executable to use
# this can just be "git" if your webserver has a sensible PATH
our $GIT = "++GIT_BINDIR++/git";

# absolute filesystem path which will be prepended to the project path
#our $projectroot = "/pub/scm";
our $projectroot = "++GITWEB_PROJECTROOT++";

# filesystem traversal depth limit used when getting the project list;
# the depth is counted relative to $projectroot
our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";

# text of the home link shown on top of all pages
our $home_link_str = "++GITWEB_HOME_LINK_STR++";

# name of your site or organization to appear in page titles;
# replace this with something more descriptive for clearer bookmarks.
# Falls back to "<SERVER_NAME> Git", or "Untitled Git" if SERVER_NAME
# is not set in the environment.
our $site_name = "++GITWEB_SITENAME++"
                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";

# filename of html text to include at top of each page
our $site_header = "++GITWEB_SITE_HEADER++";
# html text to include at home page
our $home_text = "++GITWEB_HOMETEXT++";
# filename of html text to include at bottom of each page
our $site_footer = "++GITWEB_SITE_FOOTER++";

# URIs of stylesheets
our @stylesheets = ("++GITWEB_CSS++");
# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
our $stylesheet = undef;
# URI of GIT logo (72x27 size)
our $logo = "++GITWEB_LOGO++";
# URI of GIT favicon, assumed to be image/png type
our $favicon = "++GITWEB_FAVICON++";
# URI of gitweb.js (JavaScript code for gitweb)
our $javascript = "++GITWEB_JS++";

# URI and label (title) of GIT logo link
#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
#our $logo_label = "git documentation";
our $logo_url = "http://git-scm.com/";
our $logo_label = "git homepage";

# source of projects list
our $projects_list = "++GITWEB_LIST++";

# the width (in characters) of the projects list "Description" column
our $projects_list_description_width = 25;

# default order of projects list
# valid values are none, project, descr, owner, and age
our $default_projects_order = "project";

# show repository only if this file exists
# (only effective if this variable evaluates to true)
our $export_ok = "++GITWEB_EXPORT_OK++";

# show repository only if this subroutine returns true
# when given the path to the project, for example:
#    sub { return -e "$_[0]/git-daemon-export-ok"; }
our $export_auth_hook = undef;

# only allow viewing of repositories also shown on the overview page
our $strict_export = "++GITWEB_STRICT_EXPORT++";

# list of git base URLs used to build the URLs a project can be fetched from,
# i.e. full URL is "$git_base_url/$project"; empty entries are dropped
our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");

# default blob_plain mimetype and default charset for text/plain blob
our $default_blob_plain_mimetype = 'text/plain';
our $default_text_plain_charset  = undef;

# file to use for guessing MIME types before trying /etc/mime.types
# (relative to the current git repository)
our $mimetypes_file = undef;

# assume this charset if a line contains non-UTF-8 characters;
# it should be a valid encoding (see Encode::Supported(3pm) for the list)
# in which all byte sequences are valid, for example
# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
# could even be 'utf-8' for the old behavior)
our $fallback_encoding = 'latin1';

# rename detection options for git-diff and git-diff-tree
# - default is '-M', with the cost proportional to
#   (number of removed files) * (number of new files).
# - more costly is '-C' (which implies '-M'), with the cost proportional to
#   (number of changed files + number of removed files) * (number of new files)
# - even more costly is '-C', '--find-copies-harder' with cost
#   (number of files in the original tree) * (number of new files)
# - one might want to include '-B' option, e.g. '-B', '-M'
our @diff_opts = ('-M'); # taken from git_commit

# Disables features that would allow repository owners to inject script into
# the gitweb domain.
our $prevent_xss = 0;

# Path to the highlight executable to use (must be the one from
# http://www.andre-simon.de due to assumptions about parameters and output).
# Useful if highlight is not installed on your webserver's PATH.
# [Default: highlight]
our $highlight_bin = "++HIGHLIGHT_BIN++";
 172
# information about snapshot formats that gitweb is capable of serving
our %known_snapshot_formats = (
        # name => {
        #       'display' => display name,
        #       'type' => mime type,
        #       'suffix' => filename suffix,
        #       'format' => --format for git-archive,
        #       'compressor' => [compressor command and arguments]
        #                       (array reference, optional)
        #       'disabled' => boolean (optional)}
        #
        'tgz' => {
                'display' => 'tar.gz',
                'type' => 'application/x-gzip',
                'suffix' => '.tar.gz',
                'format' => 'tar',
                'compressor' => ['gzip']},

        'tbz2' => {
                'display' => 'tar.bz2',
                'type' => 'application/x-bzip2',
                'suffix' => '.tar.bz2',
                'format' => 'tar',
                'compressor' => ['bzip2']},

        # known, but disabled by default
        'txz' => {
                'display' => 'tar.xz',
                'type' => 'application/x-xz',
                'suffix' => '.tar.xz',
                'format' => 'tar',
                'compressor' => ['xz'],
                'disabled' => 1},

        # no 'compressor': the archive is served as produced
        'zip' => {
                'display' => 'zip',
                'type' => 'application/x-zip',
                'suffix' => '.zip',
                'format' => 'zip'},
);

# Aliases so we understand old gitweb.snapshot values in repository
# configuration.
our %known_snapshot_format_aliases = (
        'gzip'  => 'tgz',
        'bzip2' => 'tbz2',
        'xz'    => 'txz',

        # backward compatibility: legacy gitweb config support;
        # these names are recognized but map to no format (undef)
        'x-gzip' => undef, 'gz' => undef,
        'x-bzip2' => undef, 'bz2' => undef,
        'x-zip' => undef, '' => undef,
);

# Pixel sizes for icons and avatars. If the default font sizes or line
# heights are changed, it may be appropriate to change these values too via
# $GITWEB_CONFIG.
our %avatar_size = (
        'default' => 16,
        'double'  => 32
);

# Used to set the maximum load that we will still respond to gitweb queries.
# If server load exceeds this value then return a "503 server busy" error.
# If gitweb cannot determine the server load, it is taken to be 0.
# Leave it undefined (or set to 'undef') to turn off load checking.
our $maxload = 300;

# configuration for 'highlight' (http://www.andre-simon.de/)
# match by basename
our %highlight_basename = (
        #'Program' => 'py',
        #'Library' => 'py',
        'SConstruct' => 'py', # SCons equivalent of Makefile
        'Makefile' => 'make',
);
# match by extension
our %highlight_ext = (
        # main extensions, defining name of syntax;
        # see files in /usr/share/highlight/langDefs/ directory
        map { $_ => $_ }
                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
        # alternate extensions, see /etc/highlight/filetypes.conf
        'h' => 'c',
        map { $_ => 'sh'  } qw(bash zsh ksh),
        map { $_ => 'cpp' } qw(cxx c++ cc),
        map { $_ => 'php' } qw(php3 php4 php5 phps),
        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
        map { $_ => 'make'} qw(mak mk),
        map { $_ => 'xml' } qw(xhtml html htm),
);
 263
# You define site-wide feature defaults here; override them with
# $GITWEB_CONFIG as necessary.
our %feature = (
        # feature => {
        #       'sub' => feature-sub (subroutine),
        #       'override' => allow-override (boolean),
        #       'default' => [ default options...] (array reference)}
        #
        # if feature is overridable (it means that allow-override has true value),
        # then feature-sub will be called with default options as parameters;
        # the return value of feature-sub becomes the value of the feature
        #
        # if there is no 'sub' key (no feature-sub), then feature cannot be
        # overridden
        #
        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
        # is enabled

        # Enable the 'blame' blob view, showing the last commit that modified
        # each line in the file. This can be very CPU-intensive.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'blame'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'blame'}{'override'} = 1;
        # and in project config gitweb.blame = 0|1;
        'blame' => {
                'sub' => sub { feature_bool('blame', @_) },
                'override' => 0,
                'default' => [0]},

        # Enable the 'snapshot' link, providing a compressed archive of any
        # tree. This can potentially generate high traffic if you have a large
        # project.

        # Value is a list of formats defined in %known_snapshot_formats that
        # you wish to offer.
        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'snapshot'}{'default'} = [];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'snapshot'}{'override'} = 1;
        # and in project config, a comma-separated list of formats or "none"
        # to disable.  Example: gitweb.snapshot = tbz2,zip;
        'snapshot' => {
                'sub' => \&feature_snapshot,
                'override' => 0,
                'default' => ['tgz']},

        # Enable text search, which will list the commits which match author,
        # committer or commit text to a given string.  Enabled by default.
        # Project specific override is not supported.
        'search' => {
                'override' => 0,
                'default' => [1]},

        # Enable grep search, which will list the files in currently selected
        # tree containing the given string. Enabled by default. This can be
        # potentially CPU-intensive, of course.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'grep'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'grep'}{'override'} = 1;
        # and in project config gitweb.grep = 0|1;
        'grep' => {
                'sub' => sub { feature_bool('grep', @_) },
                'override' => 0,
                'default' => [1]},

        # Enable the pickaxe search, which will list the commits that modified
        # a given string in a file. This can be a practical and much faster
        # alternative to 'blame', but is still potentially CPU-intensive.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'override'} = 1;
        # and in project config gitweb.pickaxe = 0|1;
        'pickaxe' => {
                'sub' => sub { feature_bool('pickaxe', @_) },
                'override' => 0,
                'default' => [1]},

        # Enable showing size of blobs in a 'tree' view, in a separate
        # column, similar to what 'ls -l' does.  This costs a bit of IO.

        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'default'} = [0];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'override'} = 1;
        # and in project config gitweb.showsizes = 0|1;
        'show-sizes' => {
                'sub' => sub { feature_bool('showsizes', @_) },
                'override' => 0,
                'default' => [1]},

        # Make gitweb use an alternative format of the URLs which can be
        # more readable and natural-looking: project name is embedded
        # directly in the path and the query string contains other
        # auxiliary information. All gitweb installations recognize
        # URL in either format; this configures in which formats gitweb
        # generates links.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'pathinfo'}{'default'} = [1];
        # Project specific override is not supported.

        # Note that you will need to change the default location of CSS,
        # favicon, logo and possibly other files to an absolute URL. Also,
        # if gitweb.cgi serves as your indexfile, you will need to force
        # $my_uri to contain the script name in your $GITWEB_CONFIG.
        'pathinfo' => {
                'override' => 0,
                'default' => [0]},

        # Make gitweb consider projects in project root subdirectories
        # to be forks of existing projects. Given project $projname.git,
        # projects matching $projname/*.git will not be shown in the main
        # projects list, instead a '+' mark will be added to $projname
        # there and a 'forks' view will be enabled for the project, listing
        # all the forks. If project list is taken from a file, forks have
        # to be listed after the main project.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'forks'}{'default'} = [1];
        # Project specific override is not supported.
        'forks' => {
                'override' => 0,
                'default' => [0]},

        # Insert custom links to the action bar of all project pages.
        # This enables you mainly to link to third-party scripts integrating
        # into gitweb; e.g. git-browser for graphical history representation
        # or custom web-based repository administration interface.

        # The 'default' value consists of a list of triplets in the form
        # (label, link, position) where position is the label after which
        # to insert the link and link is a format string where %n expands
        # to the project name, %f to the project path within the filesystem,
        # %h to the current hash (h gitweb parameter) and %b to the current
        # hash base (hb gitweb parameter); %% expands to %.

        # To enable system wide have in $GITWEB_CONFIG e.g.
        # $feature{'actions'}{'default'} = [('graphiclog',
        #       '/git-browser/by-commit.html?r=%n', 'summary')];
        # Project specific override is not supported.
        'actions' => {
                'override' => 0,
                'default' => []},

        # Allow gitweb to scan project content tags described in ctags/
        # of project repository, and display the popular Web 2.0-ish
        # "tag cloud" near the project list. Note that this is something
        # COMPLETELY different from the normal Git tags.

        # gitweb by itself can show existing tags, but it does not handle
        # tagging itself; you need an external application for that.
        # For an example script, check Girocco's cgi/tagproj.cgi.
        # You may want to install the HTML::TagCloud Perl module to get
        # a pretty tag cloud instead of just a list of tags.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'ctags'}{'default'} = ['path_to_tag_script'];
        # Project specific override is not supported.
        'ctags' => {
                'override' => 0,
                'default' => [0]},

        # The maximum number of patches in a patchset generated in patch
        # view. Set this to 0 or undef to disable patch view, or to a
        # negative number to remove any limit.

        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'patches'}{'default'} = [0];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'patches'}{'override'} = 1;
        # and in project config gitweb.patches = 0|n;
        # where n is the maximum number of patches allowed in a patchset.
        'patches' => {
                'sub' => \&feature_patches,
                'override' => 0,
                'default' => [16]},

        # Avatar support. When this feature is enabled, views such as
        # shortlog or commit will display an avatar associated with
        # the email of the committer(s) and/or author(s).

        # Currently available providers are gravatar and picon.
        # If an unknown provider is specified, the feature is disabled.

        # Gravatar depends on Digest::MD5.
        # Picon currently relies on the indiana.edu database.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'avatar'}{'default'} = ['<provider>'];
        # where <provider> is either gravatar or picon.
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'avatar'}{'override'} = 1;
        # and in project config gitweb.avatar = <provider>;
        'avatar' => {
                'sub' => \&feature_avatar,
                'override' => 0,
                'default' => ['']},

        # Enable displaying how much time and how many git commands
        # it took to generate and display page.  Disabled by default.
        # Project specific override is not supported.
        'timed' => {
                'override' => 0,
                'default' => [0]},

        # Enable turning some links into links to actions which require
        # JavaScript to run (like 'blame_incremental').  Not enabled by
        # default.  Project specific override is currently not supported.
        'javascript-actions' => {
                'override' => 0,
                'default' => [0]},

        # Syntax highlighting support. This is based on Daniel Svensson's
        # and Sham Chukoury's work in gitweb-xmms2.git.
        # It requires the 'highlight' program present in $PATH,
        # and therefore is disabled by default.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'highlight'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'highlight'}{'override'} = 1;
        # and in project config gitweb.highlight = 0|1;

        'highlight' => {
                'sub' => sub { feature_bool('highlight', @_) },
                'override' => 0,
                'default' => [0]},

        # Enable displaying of remote heads in the heads list

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'remote_heads'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'remote_heads'}{'override'} = 1;
        # and in project config gitweb.remote_heads = 0|1;
        # NOTE(review): git config variable names normally cannot contain
        # underscores -- confirm how git_get_project_config() maps this key.
        'remote_heads' => {
                'sub' => sub { feature_bool('remote_heads', @_) },
                'override' => 0,
                'default' => [0]},
);
 508
 509sub gitweb_get_feature {
 510        my ($name) = @_;
 511        return unless exists $feature{$name};
 512        my ($sub, $override, @defaults) = (
 513                $feature{$name}{'sub'},
 514                $feature{$name}{'override'},
 515                @{$feature{$name}{'default'}});
 516        # project specific override is possible only if we have project
 517        our $git_dir; # global variable, declared later
 518        if (!$override || !defined $git_dir) {
 519                return @defaults;
 520        }
 521        if (!defined $sub) {
 522                warn "feature $name is not overridable";
 523                return @defaults;
 524        }
 525        return $sub->(@defaults);
 526}
 527
 528# A wrapper to check if a given feature is enabled.
 529# With this, you can say
 530#
 531#   my $bool_feat = gitweb_check_feature('bool_feat');
 532#   gitweb_check_feature('bool_feat') or somecode;
 533#
 534# instead of
 535#
 536#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 537#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 538#
 539sub gitweb_check_feature {
 540        return (gitweb_get_feature(@_))[0];
 541}
 542
 543
 544sub feature_bool {
 545        my $key = shift;
 546        my ($val) = git_get_project_config($key, '--bool');
 547
 548        if (!defined $val) {
 549                return ($_[0]);
 550        } elsif ($val eq 'true') {
 551                return (1);
 552        } elsif ($val eq 'false') {
 553                return (0);
 554        }
 555}
 556
 557sub feature_snapshot {
 558        my (@fmts) = @_;
 559
 560        my ($val) = git_get_project_config('snapshot');
 561
 562        if ($val) {
 563                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 564        }
 565
 566        return @fmts;
 567}
 568
 569sub feature_patches {
 570        my @val = (git_get_project_config('patches', '--int'));
 571
 572        if (@val) {
 573                return @val;
 574        }
 575
 576        return ($_[0]);
 577}
 578
 579sub feature_avatar {
 580        my @val = (git_get_project_config('avatar'));
 581
 582        return @val ? @val : @_;
 583}
 584
 585# checking HEAD file with -e is fragile if the repository was
 586# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 587# and then pruned.
 588sub check_head_link {
 589        my ($dir) = @_;
 590        my $headfile = "$dir/HEAD";
 591        return ((-e $headfile) ||
 592                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 593}
 594
 595sub check_export_ok {
 596        my ($dir) = @_;
 597        return (check_head_link($dir) &&
 598                (!$export_ok || -e "$dir/$export_ok") &&
 599                (!$export_auth_hook || $export_auth_hook->($dir)));
 600}
 601
 602# process alternate names for backward compatibility
 603# filter out unsupported (unknown) snapshot formats
 604sub filter_snapshot_fmts {
 605        my @fmts = @_;
 606
 607        @fmts = map {
 608                exists $known_snapshot_format_aliases{$_} ?
 609                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 610        @fmts = grep {
 611                exists $known_snapshot_formats{$_} &&
 612                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 613}
 614
# If this is set to a code reference, that code is run once per request,
# allowing configuration that changes with each request to be updated,
# while the other code in the config file is run only once.
#
# Otherwise, if it is false then gitweb processes the config file only once;
# if it is true then the gitweb config is run for each request.
our $per_request_config = 1;
 622
 623our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);
 624sub evaluate_gitweb_config {
 625        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 626        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 627        # die if there are errors parsing config file
 628        if (-e $GITWEB_CONFIG) {
 629                do $GITWEB_CONFIG;
 630                die $@ if $@;
 631        } elsif (-e $GITWEB_CONFIG_SYSTEM) {
 632                do $GITWEB_CONFIG_SYSTEM;
 633                die $@ if $@;
 634        }
 635}
 636
 637# Get loadavg of system, to compare against $maxload.
 638# Currently it requires '/proc/loadavg' present to get loadavg;
 639# if it is not present it returns 0, which means no load checking.
 640sub get_loadavg {
 641        if( -e '/proc/loadavg' ){
 642                open my $fd, '<', '/proc/loadavg'
 643                        or return 0;
 644                my @load = split(/\s+/, scalar <$fd>);
 645                close $fd;
 646
 647                # The first three columns measure CPU and IO utilization of the last one,
 648                # five, and 10 minute periods.  The fourth column shows the number of
 649                # currently running processes and the total number of processes in the m/n
 650                # format.  The last column displays the last process ID used.
 651                return $load[0] || 0;
 652        }
 653        # additional checks for load average should go here for things that don't export
 654        # /proc/loadavg
 655
 656        return 0;
 657}
 658
 659# version of the core git binary
 660our $git_version;
 661sub evaluate_git_version {
 662        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 663        $number_of_git_cmds++;
 664}
 665
 666sub check_loadavg {
 667        if (defined $maxload && get_loadavg() > $maxload) {
 668                die_error(503, "The load average on the server is too high");
 669        }
 670}
 671
 672# ======================================================================
 673# input validation and dispatch
 674
# input parameters can be collected from a variety of sources (presently, CGI
# and PATH_INFO), so we define an %input_params hash that collects them all
# together during validation: this allows subsequent uses (e.g. href()) to be
# agnostic of the parameter origin

our %input_params = ();

# input parameters are stored with the long parameter name as key. This will
# also be used in the href subroutine to convert parameters to their CGI
# equivalent, and since the href() usage is the most frequent one, we store
# the name -> CGI key mapping here, instead of the reverse.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

# Ordered list of (long name => CGI key) pairs; the order is kept here,
# while the hash built from it below is used for lookups by long name.
our @cgi_param_mapping = (
        project => "p",
        action => "a",
        file_name => "f",
        file_parent => "fp",
        hash => "h",
        hash_parent => "hp",
        hash_base => "hb",
        hash_parent_base => "hpb",
        page => "pg",
        order => "o",
        searchtext => "s",
        searchtype => "st",
        snapshot_format => "sf",
        extra_options => "opt",
        search_use_regexp => "sr",
        # this must be last entry (for manipulation from JavaScript)
        javascript => "js"
);
our %cgi_param_mapping = @cgi_param_mapping;

# we will also need to know the possible actions, for validation;
# each action name maps to the subroutine implementing it
our %actions = (
        "blame" => \&git_blame,
        "blame_incremental" => \&git_blame_incremental,
        "blame_data" => \&git_blame_data,
        "blobdiff" => \&git_blobdiff,
        "blobdiff_plain" => \&git_blobdiff_plain,
        "blob" => \&git_blob,
        "blob_plain" => \&git_blob_plain,
        "commitdiff" => \&git_commitdiff,
        "commitdiff_plain" => \&git_commitdiff_plain,
        "commit" => \&git_commit,
        "forks" => \&git_forks,
        "heads" => \&git_heads,
        "history" => \&git_history,
        "log" => \&git_log,
        "patch" => \&git_patch,
        "patches" => \&git_patches,
        "remotes" => \&git_remotes,
        "rss" => \&git_rss,
        "atom" => \&git_atom,
        "search" => \&git_search,
        "search_help" => \&git_search_help,
        "shortlog" => \&git_shortlog,
        "summary" => \&git_summary,
        "tag" => \&git_tag,
        "tags" => \&git_tags,
        "tree" => \&git_tree,
        "snapshot" => \&git_snapshot,
        "object" => \&git_object,
        # those below don't need $project
        "opml" => \&git_opml,
        "project_list" => \&git_project_list,
        "project_index" => \&git_project_index,
);

# finally, we have the hash of allowed extra_options for the commands that
# allow them: option => list of actions accepting that option
our %allowed_options = (
        "--no-merges" => [ qw(rss atom log shortlog history) ],
);
 752
 753# fill %input_params with the CGI parameters. All values except for 'opt'
 754# should be single values, but opt can be an array. We should probably
 755# build an array of parameters that can be multi-valued, but since for the time
 756# being it's only this one, we just single it out
 757sub evaluate_query_params {
 758        our $cgi;
 759
 760        while (my ($name, $symbol) = each %cgi_param_mapping) {
 761                if ($symbol eq 'opt') {
 762                        $input_params{$name} = [ $cgi->param($symbol) ];
 763                } else {
 764                        $input_params{$name} = $cgi->param($symbol);
 765                }
 766        }
 767}
 768
 769# now read PATH_INFO and update the parameter list for missing parameters
 770sub evaluate_path_info {
 771        return if defined $input_params{'project'};
 772        return if !$path_info;
 773        $path_info =~ s,^/+,,;
 774        return if !$path_info;
 775
 776        # find which part of PATH_INFO is project
 777        my $project = $path_info;
 778        $project =~ s,/+$,,;
 779        while ($project && !check_head_link("$projectroot/$project")) {
 780                $project =~ s,/*[^/]*$,,;
 781        }
 782        return unless $project;
 783        $input_params{'project'} = $project;
 784
 785        # do not change any parameters if an action is given using the query string
 786        return if $input_params{'action'};
 787        $path_info =~ s,^\Q$project\E/*,,;
 788
 789        # next, check if we have an action
 790        my $action = $path_info;
 791        $action =~ s,/.*$,,;
 792        if (exists $actions{$action}) {
 793                $path_info =~ s,^$action/*,,;
 794                $input_params{'action'} = $action;
 795        }
 796
 797        # list of actions that want hash_base instead of hash, but can have no
 798        # pathname (f) parameter
 799        my @wants_base = (
 800                'tree',
 801                'history',
 802        );
 803
 804        # we want to catch, among others
 805        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 806        my ($parentrefname, $parentpathname, $refname, $pathname) =
 807                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 808
 809        # first, analyze the 'current' part
 810        if (defined $pathname) {
 811                # we got "branch:filename" or "branch:dir/"
 812                # we could use git_get_type(branch:pathname), but:
 813                # - it needs $git_dir
 814                # - it does a git() call
 815                # - the convention of terminating directories with a slash
 816                #   makes it superfluous
 817                # - embedding the action in the PATH_INFO would make it even
 818                #   more superfluous
 819                $pathname =~ s,^/+,,;
 820                if (!$pathname || substr($pathname, -1) eq "/") {
 821                        $input_params{'action'} ||= "tree";
 822                        $pathname =~ s,/$,,;
 823                } else {
 824                        # the default action depends on whether we had parent info
 825                        # or not
 826                        if ($parentrefname) {
 827                                $input_params{'action'} ||= "blobdiff_plain";
 828                        } else {
 829                                $input_params{'action'} ||= "blob_plain";
 830                        }
 831                }
 832                $input_params{'hash_base'} ||= $refname;
 833                $input_params{'file_name'} ||= $pathname;
 834        } elsif (defined $refname) {
 835                # we got "branch". In this case we have to choose if we have to
 836                # set hash or hash_base.
 837                #
 838                # Most of the actions without a pathname only want hash to be
 839                # set, except for the ones specified in @wants_base that want
 840                # hash_base instead. It should also be noted that hand-crafted
 841                # links having 'history' as an action and no pathname or hash
 842                # set will fail, but that happens regardless of PATH_INFO.
 843                if (defined $parentrefname) {
 844                        # if there is parent let the default be 'shortlog' action
 845                        # (for http://git.example.com/repo.git/A..B links); if there
 846                        # is no parent, dispatch will detect type of object and set
 847                        # action appropriately if required (if action is not set)
 848                        $input_params{'action'} ||= "shortlog";
 849                }
 850                if ($input_params{'action'} &&
 851                    grep { $_ eq $input_params{'action'} } @wants_base) {
 852                        $input_params{'hash_base'} ||= $refname;
 853                } else {
 854                        $input_params{'hash'} ||= $refname;
 855                }
 856        }
 857
 858        # next, handle the 'parent' part, if present
 859        if (defined $parentrefname) {
 860                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 861                # someproject/blobdiff/oldrev..newrev:/filename
 862                if ($parentpathname) {
 863                        $parentpathname =~ s,^/+,,;
 864                        $parentpathname =~ s,/$,,;
 865                        $input_params{'file_parent'} ||= $parentpathname;
 866                } else {
 867                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 868                }
 869                # we assume that hash_parent_base is wanted if a path was specified,
 870                # or if the action wants hash_base instead of hash
 871                if (defined $input_params{'file_parent'} ||
 872                        grep { $_ eq $input_params{'action'} } @wants_base) {
 873                        $input_params{'hash_parent_base'} ||= $parentrefname;
 874                } else {
 875                        $input_params{'hash_parent'} ||= $parentrefname;
 876                }
 877        }
 878
 879        # for the snapshot action, we allow URLs in the form
 880        # $project/snapshot/$hash.ext
 881        # where .ext determines the snapshot and gets removed from the
 882        # passed $refname to provide the $hash.
 883        #
 884        # To be able to tell that $refname includes the format extension, we
 885        # require the following two conditions to be satisfied:
 886        # - the hash input parameter MUST have been set from the $refname part
 887        #   of the URL (i.e. they must be equal)
 888        # - the snapshot format MUST NOT have been defined already (e.g. from
 889        #   CGI parameter sf)
 890        # It's also useless to try any matching unless $refname has a dot,
 891        # so we check for that too
 892        if (defined $input_params{'action'} &&
 893                $input_params{'action'} eq 'snapshot' &&
 894                defined $refname && index($refname, '.') != -1 &&
 895                $refname eq $input_params{'hash'} &&
 896                !defined $input_params{'snapshot_format'}) {
 897                # We loop over the known snapshot formats, checking for
 898                # extensions. Allowed extensions are both the defined suffix
 899                # (which includes the initial dot already) and the snapshot
 900                # format key itself, with a prepended dot
 901                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 902                        my $hash = $refname;
 903                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 904                                next;
 905                        }
 906                        my $sfx = $1;
 907                        # a valid suffix was found, so set the snapshot format
 908                        # and reset the hash parameter
 909                        $input_params{'snapshot_format'} = $fmt;
 910                        $input_params{'hash'} = $hash;
 911                        # we also set the format suffix to the one requested
 912                        # in the URL: this way a request for e.g. .tgz returns
 913                        # a .tgz instead of a .tar.gz
 914                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 915                        last;
 916                }
 917        }
 918}
 919
 920our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 921     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 922     $searchtext, $search_regexp);
 923sub evaluate_and_validate_params {
 924        our $action = $input_params{'action'};
 925        if (defined $action) {
 926                if (!validate_action($action)) {
 927                        die_error(400, "Invalid action parameter");
 928                }
 929        }
 930
 931        # parameters which are pathnames
 932        our $project = $input_params{'project'};
 933        if (defined $project) {
 934                if (!validate_project($project)) {
 935                        undef $project;
 936                        die_error(404, "No such project");
 937                }
 938        }
 939
 940        our $file_name = $input_params{'file_name'};
 941        if (defined $file_name) {
 942                if (!validate_pathname($file_name)) {
 943                        die_error(400, "Invalid file parameter");
 944                }
 945        }
 946
 947        our $file_parent = $input_params{'file_parent'};
 948        if (defined $file_parent) {
 949                if (!validate_pathname($file_parent)) {
 950                        die_error(400, "Invalid file parent parameter");
 951                }
 952        }
 953
 954        # parameters which are refnames
 955        our $hash = $input_params{'hash'};
 956        if (defined $hash) {
 957                if (!validate_refname($hash)) {
 958                        die_error(400, "Invalid hash parameter");
 959                }
 960        }
 961
 962        our $hash_parent = $input_params{'hash_parent'};
 963        if (defined $hash_parent) {
 964                if (!validate_refname($hash_parent)) {
 965                        die_error(400, "Invalid hash parent parameter");
 966                }
 967        }
 968
 969        our $hash_base = $input_params{'hash_base'};
 970        if (defined $hash_base) {
 971                if (!validate_refname($hash_base)) {
 972                        die_error(400, "Invalid hash base parameter");
 973                }
 974        }
 975
 976        our @extra_options = @{$input_params{'extra_options'}};
 977        # @extra_options is always defined, since it can only be (currently) set from
 978        # CGI, and $cgi->param() returns the empty array in array context if the param
 979        # is not set
 980        foreach my $opt (@extra_options) {
 981                if (not exists $allowed_options{$opt}) {
 982                        die_error(400, "Invalid option parameter");
 983                }
 984                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
 985                        die_error(400, "Invalid option parameter for this action");
 986                }
 987        }
 988
 989        our $hash_parent_base = $input_params{'hash_parent_base'};
 990        if (defined $hash_parent_base) {
 991                if (!validate_refname($hash_parent_base)) {
 992                        die_error(400, "Invalid hash parent base parameter");
 993                }
 994        }
 995
 996        # other parameters
 997        our $page = $input_params{'page'};
 998        if (defined $page) {
 999                if ($page =~ m/[^0-9]/) {
1000                        die_error(400, "Invalid page parameter");
1001                }
1002        }
1003
1004        our $searchtype = $input_params{'searchtype'};
1005        if (defined $searchtype) {
1006                if ($searchtype =~ m/[^a-z]/) {
1007                        die_error(400, "Invalid searchtype parameter");
1008                }
1009        }
1010
1011        our $search_use_regexp = $input_params{'search_use_regexp'};
1012
1013        our $searchtext = $input_params{'searchtext'};
1014        our $search_regexp;
1015        if (defined $searchtext) {
1016                if (length($searchtext) < 2) {
1017                        die_error(403, "At least two characters are required for search parameter");
1018                }
1019                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
1020        }
1021}
1022
# path to the current git repository
our $git_dir;

# Set $git_dir to "$projectroot/$project" for the current request.  When the
# request has no project the variable is reset to undef: run() can serve
# many requests from one process, and the path derived for an earlier
# request must not be carried over.
sub evaluate_git_dir {
        our $git_dir = $project ? "$projectroot/$project" : undef;
}
1028
our (@snapshot_fmts, $git_avatar);

# Evaluate the 'snapshot' and 'avatar' features and store the result in
# the globals @snapshot_fmts and $git_avatar.
sub configure_gitweb_features {
        # snapshot formats: the configured list, passed through
        # filter_snapshot_fmts()
        our @snapshot_fmts;
        @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # avatar provider: only 'gravatar' and 'picon' are known names.
        # 'gravatar' additionally requires Digest::MD5 to be loadable,
        # 'picon' has no dependencies.  An unknown name or an unmet
        # dependency resets $git_avatar to the empty string.
        our ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'gravatar') {
                eval { require Digest::MD5; 1; }
                        or $git_avatar = '';
        } elsif ($git_avatar ne 'picon') {
                $git_avatar = '';
        }
}
1048
# Error handler registered with CGI::Carp's set_message(): an uncaught
# 'die <message>' is shown as an Internal Server Error page by die_error.
sub handle_errors_html {
        my ($msg) = @_; # it is already HTML escaped

        # die_error itself might die; replace this handler with a plain
        # message first, so that such a failure cannot recurse endlessly
        set_message("Error occured when inside die_error:\n$msg");

        # the subroutine set via CGI::Carp::set_message is called _after_
        # HTTP headers are already written, so die_error is told not to
        # write them again, and that it runs as error handler (you cannot
        # jump out of die_error in that situation)
        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1063
# dispatch
#
# Pick the action for the current request and run its handler from %actions.
# Without an explicit action the default is derived from the other
# parameters: the type of the object named by $hash, or by
# "$hash_base:$file_name", as reported by git_get_type(); else 'summary'
# when a project is known and 'project_list' otherwise.
# Ends the request with a 400 error for an unknown action, or when an action
# other than opml, project_list and project_index has no project.
sub dispatch {
        if (!defined $action) {
                if (defined $hash) {
                        $action = git_get_type($hash);
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name");
                } elsif (defined $project) {
                        $action = 'summary';
                } else {
                        $action = 'project_list';
                }
        }
        # $action is still undefined here if git_get_type() did not return
        # a type; check that before using it as a hash key
        if (!defined $action || !defined($actions{$action})) {
                die_error(400, "Unknown action");
        }
        if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
            !$project) {
                die_error(400, "Project needed");
        }
        $actions{$action}->();
}
1086
# Restart the per-request bookkeeping: take a new start timestamp (only if
# $t0 is defined at all) and zero the counter of git commands.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1092
our $first_request = 1;

# Handle a single request from start to finish: reset the timer, work out
# URLs and configuration, collect and validate the parameters, and finally
# dispatch to the requested action.
sub run_request {
        reset_timer();

        evaluate_uri();

        # configuration and git version are evaluated for the first request
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }
        # $per_request_config is either a code reference, called for every
        # request, or a true value, asking for the config to be evaluated
        # again on every request after the first
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }
        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        # parameters: query string first, then PATH_INFO for what is missing
        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1123
# State of the request loop in run(): by default the first request is also
# the last one, no hooks are installed and requests are plain CGI objects.
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: load CGI::Fast, use it as the request class,
# and replace $is_last_request with a counter that ends the request loop
# after a limited number of requests.
sub configure_as_fcgi {
        require CGI::Fast;
        our $CGI = 'CGI::Fast';

        # let each child service 100 requests
        my $served = 0;
        our $is_last_request = sub { return ++$served > 100 };
}
# Decide how gitweb is run.  FastCGI mode is selected when the script name
# ends in '.fcgi' or the --fastcgi (--fcgi, -f) option is given; --nproc=N
# (-n N) additionally installs the FCGI::ProcManager hooks, provided that
# module can be loaded.  Options are only parsed if @ARGV is not empty.
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # handler for --nproc: wire the process manager into the three hooks
        my $use_proc_manager = sub {
                my ($arg, $val) = @_;
                return unless eval { require FCGI::ProcManager; 1; };
                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $val,
                });
                our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1158
# Main loop: evaluate the command line, then create and serve request
# objects until $is_last_request says stop.  The optional hooks are called
# before listening and around every request.
sub run {
        evaluate_argv();

        $first_request = 1;
        $pre_listen_hook and $pre_listen_hook->();

 REQUEST:
        while ($cgi = $CGI->new()) {
                $pre_dispatch_hook and $pre_dispatch_hook->();

                run_request();

                $post_dispatch_hook and $post_dispatch_hook->();
                $first_request = 0;

                $is_last_request->() and last REQUEST;
        }

        # NOTE(review): this label is not referenced within run(); presumably
        # it is a jump target for code elsewhere in the file - confirm before
        # renaming or removing it
 DONE_GITWEB:
        1;
}
1183
run();

# pure CGI script, serving single request: nothing called us, so just exit
exit unless defined caller;

# wrapped in a subroutine processing requests,
# e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
return;
1194
1195## ======================================================================
1196## action links
1197
# Build a gitweb URL from a list of name => value parameters and return it
# as a string.  Ordinary names are the parameter names of @cgi_param_mapping
# ('project', 'action', 'hash', ...); 'project' defaults to the current
# $project unless the key is passed explicitly.  With the 'pathinfo' feature
# (or -path_info => 1) as many parameters as possible are put into the path
# part of the URL, the remaining ones go into the query string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over every parameter of the current request that the
                # caller did not pass explicitly
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot;
                # links without any action are legitimate, so the action has
                # to be checked for definedness before it is compared
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing '..' would clash with the
                                                # parent..current separator and is left for
                                                # the query string
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly; walking the array (not the
        # hash) keeps the parameters in the order of @cgi_param_mapping
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1327
1328
1329## ======================================================================
1330## validation, quoting/unquoting and escaping
1331
# Return the given action name if it is a key of %actions; return undef
# for an unknown action and for an empty (false) argument.
sub validate_action {
        my ($input) = @_;

        return undef unless $input && exists $actions{$input};
        return $input;
}
1337
# Return the project name if it can be served, undef otherwise.  A project
# is accepted when its name is a valid pathname, "$projectroot/$name" is a
# directory, check_export_ok() allows it and, with $strict_export set, it
# is also found by project_in_list().
sub validate_project {
        my ($input) = @_;
        return undef unless $input;

        # the checks run in this order and stop at the first failure
        return undef unless validate_pathname($input);
        return undef unless -d "$projectroot/$input";
        return undef unless check_export_ok("$projectroot/$input");
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1349
# Return the pathname if it is acceptable, undef otherwise (also for an
# empty or otherwise false argument).
sub validate_pathname {
        my ($input) = @_;
        return undef unless $input;

        # a path component must not be empty, '.' or '..'; this rules out
        # leading, trailing and doubled slashes as well
        my $bad_component = ($input =~ m!(^|/)(|\.|\.\.)(/|$)!);
        # no null characters
        my $has_nul = ($input =~ m!\0!);

        return undef if $bad_component || $has_nul;
        return $input;
}
1365
# Return the given revision name if it is acceptable, undef otherwise (also
# for an empty or otherwise false argument).  Accepted are a full
# 40-character hexadecimal object name, or a valid pathname that also obeys
# the ref name restrictions checked below.
sub validate_refname {
        my $input = shift || return undef;

        # textual hashes are O.K.; anchored with \A and \z, because '$' would
        # also accept a hash followed by a newline
        if ($input =~ m/\A[0-9a-fA-F]{40}\z/) {
                return $input;
        }
        # it must be correct pathname
        $input = validate_pathname($input)
                or return undef;
        # restrictions on ref name according to git-check-ref-format
        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
                return undef;
        }
        return $input;
}
1382
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Returns undef for undef.  A string that is already a character string
# (utf8 flag set) is returned as is; octets that are valid UTF-8 are
# decoded; anything else is decoded using $fallback_encoding.
sub to_utf8 {
        my $str = shift;
        return undef unless defined $str;

        # utf8::valid() cannot be used to make this decision: it only checks
        # the internal consistency of the scalar and is true for any string
        # of octets.  utf8::decode() decodes in place and returns false when
        # the octets are not valid UTF-8, leaving them for the fallback.
        if (utf8::is_utf8($str) || utf8::decode($str)) {
                return $str;
        } else {
                return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
        }
}
1396
# Escape a value for use in the query string of a URL: unsafe characters
# are escaped with CGI::escape() and spaces become '+'.  The slash is left
# alone on purpose, even though that is not strictly correct, because
# quoted slashes look too horrible in bookmarks.  Returns undef for undef.
sub esc_param {
        my ($str) = @_;
        defined $str or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1406
# Escape a value for use in the path_info part of a URL.  The rules differ
# slightly from esc_param(): path_info doesn't treat '+' as space
# (specially), so both are kept as they are, but '?' must be escaped.
# Returns undef for undef.
sub esc_path_info {
        my ($str) = @_;
        defined $str or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

        return $str;
}
1417
# Escape unsafe characters in a complete URL.  Characters that have a
# meaning within a URL cannot be quoted here; spaces become '+'.
# Returns undef for undef.
sub esc_url {
        my ($str) = @_;
        defined $str or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1426
# Escape a value for use inside an HTML attribute.  This takes the same
# arguments as esc_html() and simply hands them over: for XHTML
# conformance escaping '"' to '&quot;' is not enough.
sub esc_attr {
        my @args = @_;

        return esc_html(@args);
}
1433
# Turn a string into HTML text: it is converted with to_utf8(), escaped
# with escapeHTML() and has every control character except TAB replaced by
# the output of quot_cec().  With the option -nbsp => 1 spaces are turned
# into &nbsp; entities.  Returns undef for undef.
sub esc_html {
        my ($str, %opts) = @_;
        return undef unless defined $str;

        $str = $cgi->escapeHTML(scalar(to_utf8($str)));
        $str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        # tabs are kept as they are
        $str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;

        return $str;
}
1449
# Turn a filename into HTML text: like esc_html(), except that every
# control character, TAB included, is replaced by the output of quot_cec().
# With the option -nbsp => 1 spaces are turned into &nbsp; entities.
# Returns undef for undef.
sub esc_path {
        my ($str, %opts) = @_;
        return undef unless defined $str;

        $str = $cgi->escapeHTML(scalar(to_utf8($str)));
        $str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $str =~ s|([[:cntrl:]])|quot_cec($1)|eg;

        return $str;
}
1465
# Make control characters "printable", using character escape codes (CEC)
#
# Takes a single character and returns its escape sequence: one of the
# named sequences below, or a backslash followed by the two-digit
# hexadecimal character code.  The result is wrapped in
# <span class="cntrl">...</span> unless the option -nohtml => 1 is given.
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # %02x, not %2x: codes below 0x10 have to be padded with a zero,
        # a blank would tear the escape sequence apart ("\ 1")
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1490
# Alternative to quot_cec(): represent a control character by a decimal
# character reference to the code point 0x2400 + character code (the
# Unicode "control pictures", a "printable representation", PR).  The
# result is wrapped in <span class="cntrl">...</span> unless the option
# -nohtml => 1 is given.
sub quot_upr {
        my ($cntrl, %opts) = @_;

        my $picture = sprintf('&#%04d;', 0x2400+ord($cntrl));
        return $picture if $opts{-nohtml};
        return "<span class=\"cntrl\">$picture</span>";
}
1504
# Helper of unquote(): translate what follows a backslash in a quoted
# filename.  One to three octal digits give the character with that code,
# the letters listed below stand for the usual C escape sequences, and
# any other character stands for itself.
sub unq {
        my ($seq) = @_;

        # octal char sequence
        return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

        my %es = ( # character escape codes, aka escape sequences
                't' => "\t",   # tab            (HT, TAB)
                'n' => "\n",   # newline        (NL)
                'r' => "\r",   # return         (CR)
                'f' => "\f",   # form feed      (FF)
                'b' => "\b",   # backspace      (BS)
                'a' => "\a",   # alarm (bell)   (BEL)
                'e' => "\e",   # escape         (ESC)
                'v' => "\013", # vertical tab   (VT)
        );
        # C escape sequence, aka character escape code,
        # or else a quoted ordinary character
        return exists $es{$seq} ? $es{$seq} : $seq;
}

# git may return quoted and escaped filenames: a name enclosed in double
# quotes is returned without the quotes and with its backslash escapes
# expanded, any other name is returned unchanged
sub unquote {
        my ($str) = @_;

        return $str unless $str =~ m/^"(.*)"$/;

        # needs unquoting
        (my $name = $1) =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $name;
}
1540
# escape tabs: replace every tab by the number of spaces needed to reach
# the next multiple-of-8 column
sub untabify {
        my ($line) = @_;

        my $tab_at = index($line, "\t");
        while ($tab_at != -1) {
                # between 1 and 8 spaces, depending on the tab's column
                my $width = 8 - ($tab_at % 8);
                substr($line, $tab_at, 1, ' ' x $width);
                # earlier tabs are gone, so resume the search from here
                $tab_at = index($line, "\t", $tab_at);
        }

        return $line;
}
1554
# Returns the number of entries of the list obtained from
# git_get_projects_list() whose 'path' equals $project (zero, i.e. false,
# when there is none or the list is empty).
sub project_in_list {
        my ($project) = @_;
        my @projects = git_get_projects_list();

        # an empty list yields its own (zero) element count
        return scalar(@projects) unless @projects;

        my $matches = grep { $_->{'path'} eq $project } @projects;
        return $matches;
}
1560
1561## ----------------------------------------------------------------------
1562## HTML aware string manipulation
1563
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Parameters:
#   $str     - string to shorten (passed through to_utf8() first)
#   $len     - number of characters to keep
#   $add_len - extra word characters allowed so that a word is not cut
#              (defaults to 10)
#   $where   - which part is replaced by an ellipsis:
#              'left' | 'center' | 'right' (defaults to 'right')
# Returns the (possibly shortened) string.
sub chop_str {
        my $str = shift;
        my $len = shift;
        my $add_len = shift || 10;
        my $where = shift || 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # allow only $len chars, but don't cut a word if it would fit in $add_len
        # if it doesn't fit, cut it if it's still longer than the dots we would add
        # remove chopped character entities entirely

        # when chopping in the middle, distribute $len into left and right part
        # return early if chopping wouldn't make string shorter
        if ($where eq 'center') {
                return $str if ($len + 5 >= length($str)); # filler is length 5
                $len = int($len/2);
        } else {
                return $str if ($len + 4 >= length($str)); # filler is length 4
        }

        # regexps: ending and beginning with word part up to $add_len;
        # /s lets '.' match a newline too, so that an embedded newline
        # cannot make the matches below fail
        my $endre = qr/.{$len}\w{0,$add_len}/s;
        my $begre = qr/\w{0,$add_len}.{$len}/s;

        # Each match is checked and its captures are taken from the match
        # itself: after a failed match $1 and $2 would still hold the
        # captures of some earlier, unrelated match.
        if ($where eq 'left') {
                my ($lead, $body) = ($str =~ m/\A(.*?)($begre)\z/s)
                        or return $str;
                if (length($lead) > 4) {
                        $lead = " ...";
                }
                return "$lead$body";

        } elsif ($where eq 'center') {
                # One pattern for all three parts: the left part may give
                # back word characters when the right part would otherwise
                # not find its $len characters (e.g. one very long word),
                # instead of the right-hand match failing.
                my ($left, $mid, $right) =
                        ($str =~ m/\A($endre)(.*?)($begre)\z/s)
                        or return $str;
                if (length($mid) > 5) {
                        $mid = " ... ";
                }
                return "$left$mid$right";

        } else {
                my ($body, $tail) = ($str =~ m/\A($endre)(.*)\z/s)
                        or return $str;
                if (length($tail) > 4) {
                        $tail = "... ";
                }
                return "$body$tail";
        }
}
1623
# takes the same arguments as chop_str, but also wraps a <span> around the
# result with a title attribute if it does get chopped. Additionally, the
# string is HTML-escaped.
#
# The title attribute carries the full string, with every control
# character replaced by '?'.
sub chop_and_escape_str {
        my ($str) = @_;

        my $chopped = chop_str(@_);
        # chop_str() hands back its input passed through to_utf8(); bring
        # $str into the same form so that the "was it chopped?" comparison
        # and the title attribute both work on the converted string
        $str = to_utf8($str);
        if ($chopped eq $str) {
                return esc_html($chopped);
        } else {
                $str =~ s/[[:cntrl:]]/?/g;
                return $cgi->span({-title=>$str}, esc_html($chopped));
        }
}
1638
1639## ----------------------------------------------------------------------
1640## functions returning short strings
1641
# CSS class for given age value (in seconds):
# "noage" for an undefined age, "age0" below two hours, "age1" below two
# days, and "age2" for anything older
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1656
# convert age in seconds to "nn units ago" string
#
# The largest unit of which the age spans more than two is used; an age of
# two seconds or less gives " right now" (with its leading space).
sub age_string {
        my ($age) = @_;

        # [ exclusive lower bound in seconds,
        #   conversion of seconds to whole units,
        #   text appended to the number ]
        my @scales = (
                [ 60*60*24*365*2,
                  sub { int($_[0]/60/60/24/365) },      " years ago"  ],
                [ 60*60*24*(365/12)*2,
                  sub { int($_[0]/60/60/24/(365/12)) }, " months ago" ],
                [ 60*60*24*7*2,
                  sub { int($_[0]/60/60/24/7) },        " weeks ago"  ],
                [ 60*60*24*2,
                  sub { int($_[0]/60/60/24) },          " days ago"   ],
                [ 60*60*2,
                  sub { int($_[0]/60/60) },             " hours ago"  ],
                [ 60*2,
                  sub { int($_[0]/60) },                " min ago"    ],
                [ 2,
                  sub { int($_[0]) },                   " sec ago"    ],
        );

        foreach my $scale (@scales) {
                my ($bound, $to_units, $suffix) = @$scale;
                next unless $age > $bound;
                return $to_units->($age) . $suffix;
        }
        return " right now";
}
1688
# File type bit patterns defined here in addition to the S_IF* values
# imported from Fcntl.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference:
# true when the file type bits of $mode are exactly S_IFGITLINK
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = $mode & S_IFMT();
        return $type_bits == S_IFGITLINK;
}
1700
# convert file mode in octal to symbolic file mode string
# (one fixed ls-style string per file type; anything unrecognized gives
# '----------')
sub mode_str {
        my $bits = oct shift;

        return 'm---------' if S_ISGITLINK($bits);
        return 'drwxr-xr-x' if S_ISDIR($bits & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($bits);
        return '----------' unless S_ISREG($bits);

        # regular file: git cares only about the executable bit
        return ($bits & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1722
# convert file mode in octal to file type string
# ("submodule", "directory", "symlink", "file" or "unknown");
# an argument that is not a string of octal digits is returned as is
sub file_type {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;

        my $bits = oct $mode;
        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "file"      if S_ISREG($bits);
        return "unknown";
}
1745
# convert file mode in octal to file type description string
# ("submodule", "directory", "symlink", "executable", "file" or
# "unknown"); an argument that is not a string of octal digits is
# returned as is
sub file_type_long {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;

        my $bits = oct $mode;
        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "unknown"   unless S_ISREG($bits);

        # regular file: tell executables apart by the owner-execute bit
        return ($bits & S_IXUSR) ? "executable" : "file";
}
1772
1773
1774## ----------------------------------------------------------------------
1775## functions returning short HTML fragments, or transforming HTML fragments
1776## which don't belong to other sections
1777
# format line of commit message: HTML-escape it (spaces become &nbsp;)
# and turn every word of 8 to 40 hexadecimal digits into a link to the
# "object" action for that hash
sub format_log_line_html {
        my ($line) = @_;

        my $html = esc_html($line, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                my $id = $1;
                $cgi->a({-href => href(action=>"object", hash=>$id),
                         -class => "text"}, $id);
        }eg;

        return $html;
}
1790
# format marker of refs pointing to given object
#
# $refs is a hash reference mapping object ids to array references of ref
# names (e.g. "tags/v2.6.11" or "heads/next", with a trailing "^{}" on
# indirect refs); $id is the object to look up.  Returns the markers
# wrapped in <span class="refs">, or an empty string when no ref points
# to $id.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $listed_ref (@{$refs->{$id}}) {
                        # Work on a copy: the loop variable aliases the
                        # element of the caller's array, so stripping the
                        # "^{}" suffix in place would alter $refs and hide
                        # the indirection from any later call for this id.
                        my $ref = $listed_ref;

                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name);
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        # link target is the full ref name
                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, $name);

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1850
# format, perhaps shortened and with markers, title line
#
# Returns a link to $href followed by $extra (if given).  When $short is
# shorter than $long the link shows $short and carries $long, with control
# characters replaced by '?', as its title; otherwise it shows $long.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my %attr = (-href => $href, -class => "list subject");
        my $shown = $long;

        if (length($short) < length($long)) {
                (my $title = $long) =~ s/[[:cntrl:]]/?/g;
                $attr{-title} = to_utf8($title);
                $shown = $short;
        }

        return $cgi->a(\%attr, esc_html($shown)) . $extra;
}
1866
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is keyed by the lowercased email and shared by all avatar engines
# (gravatar and picon), which are free to use it as preferred. Since only one
# avatar engine is used for any given page, there's no risk for cache
# conflicts.
our %avatar_cache = ();
1874
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first and the resulting url is kept in
# %avatar_cache.
sub picon_url {
        my $email = lc shift;

        # build the url only on the first request for this address
        $avatar_cache{$email} ||= do {
                my ($user, $domain) = split('@', $email);
                "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                "$domain/$user/" .
                "users+domains+unknown/up/single";
        };

        return $avatar_cache{$email};
}
1888
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
sub gravatar_url {
        my ($address, $size) = @_;
        my $email = lc $address;

        unless ($avatar_cache{$email}) {
                my $digest = Digest::MD5::md5_hex($email);
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" . $digest . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1901
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
#
# Options: -size (key into %avatar_size, falling back to 'default'),
# -pad_before / -pad_after (put a &nbsp; before / after the image).
# Returns the <img> element, or an empty string when no avatar engine
# provided an url.
sub git_get_avatar {
        my ($email, %opts) = @_;

        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

        # Other providers can be added by extending the if chain, defining $url
        # as needed. If no variant puts something in $url, we assume avatars
        # are completely disabled/unavailable.
        my $url = "";
        if ($git_avatar eq 'gravatar') {
                $url = gravatar_url($email, $size);
        } elsif ($git_avatar eq 'picon') {
                $url = picon_url($email);
        }
        return "" unless $url;

        my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
        my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
        my $img = "<img width=\"$size\" " .
                  "class=\"avatar\" " .
                  "src=\"" . esc_url($url) . "\" " .
                  "alt=\"\" " .
                  "/>";

        return $pre_white . $img . $post_white;
}
1930
# Wrap $displaytext in a link that searches for commits by $author, where
# $searchtype is the kind of search ('author' or 'committer').  When the
# 'search' feature is not enabled, $displaytext is returned unchanged.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        # nothing to link to without the search feature
        return $displaytext unless gitweb_check_feature('search');

        # verb used in the link title
        my $performed = $searchtype eq 'author'    ? "authored"
                      : $searchtype eq 'committer' ? "committed"
                      :                              "";

        my $search_href = href(action=>"search", hash=>$hash,
                               searchtext=>$author,
                               searchtype=>$searchtype);

        return $cgi->a({-href => $search_href, class=>"list",
                        title=>"Search for commits $performed by $author"},
                       $displaytext);
}
1953
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str).
# The name is preceded by the author's avatar and wrapped in an author
# search link (see format_search_author).
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
        my $avatar    = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $link      = format_search_author($co->{'author_name'}, "author",
                                             $avatar . $name_html);

        return "<$tag class=\"author\">" . $link . "</$tag>";
}
1967
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# The file names of the original line are replaced by escaped names taken
# from $from / $to, linked to the respective 'href' when there is one.
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # escaped path of one side with the given prefix, as a link when
        # that side has an href (an added or deleted file has none)
        my $path_html = sub {
                my ($side, $prefix) = @_;
                my $text = $prefix . esc_path($side->{'file'});
                return $text unless $side->{'href'};
                return $cgi->a({-href => $side->{'href'}, -class => "path"},
                               $text);
        };

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $path_html->($to, '');
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $path_html->($from, 'a/');
                $line .= ' ';
                $line .= $path_html->($to, 'b/');
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2003
# format extended diff header line, before patch itself
#
# Depending on the kind of line this
# - replaces the path of a "copy/rename from/to" line by a link,
# - appends the file type description to a line ending in a file mode,
# - replaces the hashes of an "index" line by links showing the first
#   seven characters of each id (seven zeros for a side without href).
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # abbreviated object id, linked when there is an href for it
        my $hash_link = sub {
                my ($href, $id) = @_;
                return '0' x 7 unless $href;
                return $cgi->a({-href=>$href, -class=>"hash"},
                               substr($id,0,7));
        };

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                 esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                my @from_links;
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        push @from_links,
                                $hash_link->($from->{'href'}[$i],
                                             $diffinfo->{'from_id'}[$i]);
                }
                $line = 'index ' . join(',', @from_links) . '..' .
                        $hash_link->($to->{'href'}, $diffinfo->{'to_id'});

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff;
                # the two dots are literal, hence escaped
                my $from_link = $hash_link->($from->{'href'}, $diffinfo->{'from_id'});
                my $to_link   = $hash_link->($to->{'href'},   $diffinfo->{'to_id'});

                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                # \Q..\E: the ids are data, not patterns
                $line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2069
# format from-file/to-file diff header
#
# Returns one <div class="diff from_file"> per "---" line (a single one
# for an ordinary diff, one per parent for a combined diff) followed by a
# <div class="diff to_file"> for the "+++" line.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my @divs;

        #assert($from_line =~ m/^---/) if DEBUG;
        if (! $diffinfo->{'nparents'}) {
                # ordinary (single parent) diff
                my $line = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($line =~ m!^--- "?a/!) {
                        my $path = esc_path($from->{'file'});
                        if ($from->{'href'}) {
                                $path = $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                                $path);
                        }
                        $line = '--- a/' . $path;
                }
                push @divs, qq!<div class="diff from_file">$line</div>\n!;

        } else {
                # combined diff (merge commit)
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $line = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                # "<n>/<path>": the number links to the diff
                                # against parent n, the path to the file there
                                my $diff_href =
                                        href(action=>"blobdiff",
                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                             hash_parent_base=>$parents[$i],
                                             file_parent=>$from->{'file'}[$i],
                                             hash=>$diffinfo->{'to_id'},
                                             hash_base=>$hash,
                                             file_name=>$to->{'file'});
                                $line = '--- ' .
                                        $cgi->a({-href=>$diff_href,
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1) .
                                        '/' .
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                        }
                        push @divs, qq!<div class="diff from_file">$line</div>\n!;
                }
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        my $line = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($line =~ m!^\+\+\+ "?b/!) {
                my $path = esc_path($to->{'file'});
                if ($to->{'href'}) {
                        $path = $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                        $path);
                }
                $line = '+++ b/' . $path;
        }
        push @divs, qq!<div class="diff to_file">$line</div>\n!;

        return join('', @divs);
}
2135
# create note for patch simplified by combined diff:
# a "diff --cc <file>" header (the file name links to its blob unless the
# file was deleted) followed by a "Simple merge" note
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $path = esc_path($diffinfo->{'to_file'});
        unless (is_deleted($diffinfo)) {
                $path = $cgi->a({-href => href(action=>"blob",
                                               hash_base=>$hash,
                                               hash=>$diffinfo->{'to_id'},
                                               file_name=>$diffinfo->{'to_file'}),
                                 -class => "path"},
                                $path);
        }

        return join('',
                "<div class=\"diff header\">",
                "diff --cc ",
                $path,
                "</div>\n",                          # class="diff header"
                "<div class=\"diff nodifferences\">",
                "Simple merge",
                "</div>\n");                         # class="diff nodifferences"
}
2160
# format patch (diff) line (not to be used for diff headers)
#
# Parameters:
#   $line      - one line of patch text (a trailing newline is removed)
#   $from, $to - optional hash references for the two sides of the diff;
#                their 'href' entries are used as link targets, and an
#                array reference in $from->{'href'} marks a combined diff
# Returns the line as a <div class="diff ..."> element, where the extra
# class (add, rem, chunk_header, incomplete or none) depends on the
# leading character(s) of the line.  Chunk headers get their line ranges
# linked to the "#l<start>" anchor of the matching href.
sub format_diff_line {
        my $line = shift;
        my ($from, $to) = @_;
        my $diff_class = "";

        chomp $line;

        # the class is chosen from the raw line, before tabs are expanded
        if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
                # combined diff
                # the prefix is as many leading characters as there are
                # entries in $from->{'href'}
                my $prefix = substr($line, 0, scalar @{$from->{'href'}});
                if ($line =~ m/^\@{3}/) {
                        $diff_class = " chunk_header";
                } elsif ($line =~ m/^\\/) {
                        $diff_class = " incomplete";
                } elsif ($prefix =~ tr/+/+/) {
                        # tr counts the '+' characters without changing them
                        $diff_class = " add";
                } elsif ($prefix =~ tr/-/-/) {
                        $diff_class = " rem";
                }
        } else {
                # assume ordinary diff
                my $char = substr($line, 0, 1);
                if ($char eq '+') {
                        $diff_class = " add";
                } elsif ($char eq '-') {
                        $diff_class = " rem";
                } elsif ($char eq '@') {
                        $diff_class = " chunk_header";
                } elsif ($char eq "\\") {
                        $diff_class = " incomplete";
                }
        }
        $line = untabify($line);
        if ($from && $to && $line =~ m/^\@{2} /) {
                # chunk header of an ordinary diff:
                # "@@ -<start>[,<lines>] +<start>[,<lines>] @@<section>"
                my ($from_text, $from_start, $from_lines, $to_text, $to_start, $to_lines, $section) =
                        $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

                # NOTE(review): the line counts are defaulted here but not
                # used in the rest of this branch
                $from_lines = 0 unless defined $from_lines;
                $to_lines   = 0 unless defined $to_lines;

                if ($from->{'href'}) {
                        $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
                                             -class=>"list"}, $from_text);
                }
                if ($to->{'href'}) {
                        $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                             -class=>"list"}, $to_text);
                }
                $line = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
                        "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
                return "<div class=\"diff$diff_class\">$line</div>\n";
        } elsif ($from && $to && $line =~ m/^\@{3}/) {
                # chunk header of a combined diff:
                # "<@s> <range> ... <range> <@s><section>"
                my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;
                my (@from_text, @from_start, @from_nlines, $to_text, $to_start, $to_nlines);

                # split each range into start and line count, after dropping
                # its first character; the count defaults to 0 when absent
                @from_text = split(' ', $ranges);
                for (my $i = 0; $i < @from_text; ++$i) {
                        ($from_start[$i], $from_nlines[$i]) =
                                (split(',', substr($from_text[$i], 1)), 0);
                }

                # the last range is the "to" side, the others are the parents
                $to_text   = pop @from_text;
                $to_start  = pop @from_start;
                $to_nlines = pop @from_nlines;

                $line = "<span class=\"chunk_info\">$prefix ";
                for (my $i = 0; $i < @from_text; ++$i) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>"$from->{'href'}[$i]#l$from_start[$i]",
                                                  -class=>"list"}, $from_text[$i]);
                        } else {
                                $line .= $from_text[$i];
                        }
                        $line .= " ";
                }
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                          -class=>"list"}, $to_text);
                } else {
                        $line .= $to_text;
                }
                $line .= " $prefix</span>" .
                         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
                return "<div class=\"diff$diff_class\">$line</div>\n";
        }
        # any other line: just escape it
        return "<div class=\"diff$diff_class\">" . esc_html($line, -nbsp=>1) . "</div>\n";
}
2249
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# Which form is produced depends on the number of entries in @snapshot_fmts.
sub format_snapshot_links {
        my ($hash) = @_;
        my $num_fmts = @snapshot_fmts;

        # no snapshot format at all (an explicit undef, also in list context)
        return undef if $num_fmts == 0;

        if ($num_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                # i.e. "_snapshot_"
                my ($fmt) = @snapshot_fmts;
                my $snapshot_href = href(
                        action=>"snapshot",
                        hash=>$hash,
                        snapshot_format=>$fmt
                );
                return $cgi->a({
                        -href => $snapshot_href,
                        -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links = map {
                $cgi->a({
                        -href => href(
                                action=>"snapshot",
                                hash=>$hash,
                                snapshot_format=>$_
                        )
                }, $known_snapshot_formats{$_}{'display'})
        } @snapshot_fmts;

        return "snapshot (" . join(' ', @links) . ")";
}
2284
2285## ......................................................................
2286## functions returning values to be passed, perhaps after some
2287## transformation, to other functions; e.g. returning arguments to href()
2288
# Returns a hash of arguments for href() that generates the feed URL of the
# current view; the description of the link is stored under the -title key.
# The optional argument is the feed format name (default 'Atom'), whose
# lowercased form becomes the 'action'.
# Returns nothing when no project is selected or when the current action
# has no specific feed.
sub get_feed_info {
        my ($format) = @_;
        $format ||= 'Atom';

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branches refs uses 'refs/heads/' prefix (fullname) to differentiate
        # from tag links; this also makes possible to detect branch links.
        # $hash_base takes precedence over $hash.
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                next unless defined $ref;
                if ($ref =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $title;
        if (defined $file_name) {
                $title  = "history of $file_name";
                $title .= "/" if ($action eq 'tree');
                $title .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $title = "log of $branch";
        } else {
                $title = 'log';
        }

        my %res = (action => lc($format));
        $res{-title} = $title;
        $res{'hash'} = defined $branch ? "refs/heads/$branch" : undef;
        $res{'file_name'} = $file_name;

        return %res;
}
2324
2325## ----------------------------------------------------------------------
2326## git utility subroutines, invoking git commands
2327
# Returns, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Every call is counted in
# $number_of_git_cmds.
sub git_cmd {
        $number_of_git_cmds += 1;
        return ($GIT, "--git-dir=$git_dir");
}
2333
# Quote the given arguments so that they can be passed to the shell as one
# command line: every argument is wrapped in single quotes, and embedded
# ' and ! characters are moved outside the quotes and backslash-escaped.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $arg (@_) {
                # work on a copy so the caller's arguments stay untouched
                (my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'" . $escaped . "'";
        }
        return join(' ', @quoted);
}
2342
# get HEAD ref of given project as (full) hash
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2347
# Resolves a revision in the given project; all arguments are handed to
# git_get_hash unchanged, with no extra rev-parse options added.
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2351
# Like git_get_full_hash, but appends '--short=7' to the arguments handed
# to git_get_hash, which passes it on to rev-parse as an option.
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2355
# Runs 'git rev-parse --verify -q [options] <hash>' in the repository of
# $project and returns the first line of its output (chomped), or undef if
# the command could not be started or printed nothing.
# The global $git_dir is pointed at the project for the duration of the
# call and restored afterwards, but only if it was defined before.
sub git_get_hash {
        my ($project, $hash, @options) = @_;

        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        # git_cmd() reads $git_dir, so build the command after switching it
        my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);

        my $resolved;
        if (open my $fd, '-|', @cmd) {
                $resolved = <$fd>;
                chomp $resolved if defined $resolved;
                close $fd;
        }

        $git_dir = $saved_git_dir if defined $saved_git_dir;
        return $resolved;
}
2372
# Get the type of the given object, i.e. the first line printed by
# 'git cat-file -t <hash>'.  Returns nothing if the command cannot be
# started or if closing the pipe reports failure.
sub git_get_type {
        my ($hash) = @_;

        my @cmd = (git_cmd(), "cat-file", '-t', $hash);
        open(my $fd, "-|", @cmd) or return;
        my $type = <$fd>;
        return unless close $fd;

        chomp $type;
        return $type;
}
2383
# repository configuration
# $config_file names the "<git_dir>/config" that %config was last loaded
# for; git_get_project_config compares it with the current $git_dir to
# decide whether the cache has to be reloaded.
our $config_file = '';
# %config caches the result of git_parse_project_config('gitweb').
our %config;
2387
# Adds $value under $key in the hash referenced by $hash.
# A key seen for the first time stores the value directly (not as
# [ <value> ]); a second value turns the entry into an anonymous array of
# both values, and further values are appended to that array.
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                my $current = $hash->{$key};
                if (ref $current) {
                        # already multi-valued: extend the stored array
                        push @$current, $value;
                } else {
                        # second value: promote the scalar to an array
                        $hash->{$key} = [ $current, $value ];
                }
        } else {
                $hash->{$key} = $value;
        }
}
2401
# Return hash of git project configuration, read from the output of
# 'git config -z -l' for the current $git_dir.
# The optional argument is a regexp (as a string) limiting the result to
# keys of matching section(s), e.g. 'gitweb'.
# Keys that occur several times hold an array reference (see
# hash_set_multi); a key listed without a value maps to undef.
# Returns nothing if the git command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  The former /o modifier
        # compiled it once per process, so a later call with a different
        # section would silently have kept filtering with the first one.
        my $section_re = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # entries are NUL-terminated because of '-z'
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # with '-z' the key is separated from the value by a newline
                my ($key, $value) = split(/\n/, $keyval, 2);

                hash_set_multi(\%config, $key, $value)
                        if (!defined $section_re || $key =~ $section_re);
        }
        close $fh;

        return %config;
}
2424
# Convert config value to boolean: returns 1 for true, '' for false.
# no value, number > 0, 'true' and 'yes' values are true
# rest of values are treated as false (never as error)
#
# Leading and trailing whitespace is ignored.  Numbers are compared
# numerically, so all-zero strings such as "00" are false, as the rule
# above says.  The string itself used to be the truth value, and only "0"
# and "" are false strings in Perl.
sub config_to_bool {
        my $val = shift;

        return 1 if !defined $val;             # section.key

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        if ($val =~ /^\d+$/) {                 # section.key = 1
                return $val != 0 ? 1 : '';
        }
        return $val =~ /^(?:true|yes)$/i       # section.key = true
                ? 1 : '';
}
2440
# Convert config value to simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (in either case) will cause
# the value to be multiplied by 1024, 1048576, or 1073741824.
# Leading and trailing whitespace is ignored.  Values without such a
# suffix are returned as they are (after trimming); an undefined value
# (a key with no value) is returned as undef.
sub config_to_int {
        my $val = shift;

        # nothing to convert for "section.key" without a value
        return $val unless defined $val;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
                my %multiplier_of = (
                        'k' =>       1024,
                        'm' =>    1048576,
                        'g' => 1073741824,
                );
                # a bare unit ("k") counts as zero, as before, but without
                # the non-numeric warning
                $num = 0 if $num eq '';
                return $num * $multiplier_of{lc($unit)};
        }
        return $val;
}
2460
# Convert config value to array reference, if needed: a reference is
# returned as it is, a defined plain value is wrapped in a one-element
# array, and undef becomes an empty array.
sub config_to_multi {
        my ($val) = @_;

        return $val     if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2467
# Returns the value of the 'gitweb.<key>' variable from the configuration
# of the current repository ($git_dir).
# $key may be given with or without the 'gitweb.' prefix and may contain
# only word characters after it.  $type is optional: 'bool' (or '--bool')
# yields the strings 'true'/'false', 'int' (or '--int') yields a number as
# converted by config_to_int; any other type is ignored.
# Returns nothing if $git_dir is not set, the key is invalid, or the
# variable does not exist.
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check: only 'bool' and 'int' are recognized
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # (re)load the cached config when it belongs to another repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $name = "gitweb.$key";
        return unless exists $config{$name};

        # ensure given type
        return $config{$name} unless defined $type;
        if ($type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return (config_to_bool($config{$name}) ? 'true' : 'false');
        }
        if ($type eq 'int') {
                return config_to_int($config{$name});
        }
        return $config{$name};
}
2506
# Get hash of given path at given ref.
# $base is the tree-ish to look in, $path the path inside it (trailing
# slashes are ignored) and $type an optional object type the entry must
# have (compared with the type column of 'git ls-tree').
# Returns the object id, or undef if there is no path, closing the pipe
# reports failure, there is no such entry, the ls-tree line cannot be
# parsed, or the type does not match.  Dies via die_error(500) if git
# cannot be started.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Take the captures from the match itself: after a failed match $2
        # and $3 would still hold whatever an earlier match left behind.
        my ($entry_type, $entry_hash) =
                ($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/)
                or return undef;

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2533
# Get path of entry with given hash at given tree-ish (ref);
# used to get 'from' filename for combined diff (merge commit) for renames.
# Walks the recursive listing 'git ls-tree -r -t -z <base>' and returns the
# path of the first entry whose object id equals $hash.
# Returns nothing if an argument is missing (false), and undef if git
# cannot be started or no entry matches.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # entries are NUL-terminated because of '-z'
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # \Q..\E: the hash is data to compare with, not a pattern
                if ($line =~ m/(?:[0-9]+) (?:.+) \Q$hash\E\t(.+)$/) {
                        close $fd;
                        return $1;
                }
        }
        close $fd;
        return undef;
}
2557
2558## ......................................................................
2559## git utility functions, directly accessing git repository
2560
# Returns the description of the project at $path (relative to
# $projectroot): the first line of its 'description' file, chomped, or
# undef if that file is empty.  If the file cannot be opened, the
# 'gitweb.description' config variable is used instead.
# Side effect: points the global $git_dir at the project.
sub git_get_project_description {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/description") {
                return git_get_project_config('description');
        }
        my $first_line = <$fd>;
        close $fd;

        chomp $first_line if defined $first_line;
        return $first_line;
}
2574
# Reads the content tags of the project at $path (relative to
# $projectroot) from its 'ctags' directory: every plain file there is one
# tag, named after the file, whose value is the first line of the file.
# Returns a reference to a hash mapping tag name to value; the hash is
# empty if the directory cannot be opened.
# Side effect: points the global $git_dir at the project.
sub git_get_project_ctags {
        my ($path) = @_;
        my %ctags;

        $git_dir = "$projectroot/$path";
        my $ctags_dir = "$git_dir/ctags";
        opendir(my $dh, $ctags_dir)
                or return \%ctags;

        foreach my $entry (readdir($dh)) {
                my $file = "$ctags_dir/$entry";
                next unless -f $file;
                open(my $ct, '<', $file) or next;
                my $val = <$ct>;
                chomp $val;
                close $ct;

                # the tag name is the file name without its directory part
                (my $ctag = $file) =~ s#.*/##;
                $ctags{$ctag} = $val;
        }
        closedir $dh;

        return \%ctags;
}
2593
# Turns a hash reference of tag => count into a "cloud".
# Tags differing only in case are merged under their lowercased name; for
# each merged tag 'count' is the sum of the counts, and 'topname' is the
# spelling with the highest single count ('topcount').
# If HTML::TagCloud can be loaded, returns an HTML::TagCloud object filled
# with the merged tags (linking to $home_link?by_tag=<tag>); otherwise
# returns a reference to the merged hash itself.
sub git_populate_project_tagcloud {
        my ($ctags) = @_;

        # First, merge different-cased tags; tags vote on casing
        my %merged;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $entry = ($merged{lc $tag} ||= {});
                $entry->{count} += $weight;
                if (!$entry->{topcount} || $entry->{topcount} < $weight) {
                        $entry->{topcount} = $weight;
                        $entry->{topname} = $tag;
                }
        }

        # without the module the plain hash serves as the cloud
        my $have_tagcloud = eval { require HTML::TagCloud; 1; };
        return \%merged unless $have_tagcloud;

        my $cloud = HTML::TagCloud->new;
        foreach my $key (sort keys %merged) {
                # Pad the title with spaces so that the cloud looks
                # less crammed.
                my $title = $merged{$key}->{topname};
                $title =~ s/ /&nbsp;/g;
                $title =~ s/^/&nbsp;/g;
                $title =~ s/$/&nbsp;/g;
                $cloud->add($title, $home_link."?by_tag=".$key, $merged{$key}->{count});
        }
        return $cloud;
}
2625
# Renders a cloud produced by git_populate_project_tagcloud as HTML.
# $cloud is either an HTML::TagCloud object, rendered with its own
# html_and_css($count), or a hash reference of
# lowercased tag => { count, topname }, rendered as a centered paragraph
# of at most $count comma-separated links to $home_link?by_tag=<tag>.
# Produces no output of its own (the former debug line on STDERR, which
# ended up in the web server's error log on every call, is gone).
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                # NOTE(review): the sort is ascending, so the $count tags
                # with the LOWEST counts are shown -- confirm this is intended.
                my @tags = sort { $cloud->{$a}->{count} <=> $cloud->{$b}->{count} } keys %$cloud;
                return '<p align="center">' . join (', ', map {
                        $cgi->a({-href=>"$home_link?by_tag=$_"}, $cloud->{$_}->{topname})
                } splice(@tags, 0, $count)) . '</p>';
        }
}
2638
# Returns the clone URLs of the project at $path (relative to
# $projectroot): the lines of its 'cloneurl' file or, if that file cannot
# be opened, the value(s) of the 'gitweb.url' config variable.
# In list context the URLs are returned as a list, otherwise as an array
# reference.
# Side effect: points the global $git_dir at the project.
sub git_get_project_url_list {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $urls;
        if (open my $fd, '<', "$git_dir/cloneurl") {
                $urls = [ map { chomp; $_ } <$fd> ];
                close $fd;
        } else {
                $urls = config_to_multi(git_get_project_config('url'));
        }

        return wantarray ? @$urls : $urls;
}
2652
# Returns the list of projects as hash references.
#
# If $projects_list is a directory, it is scanned (following symlinks, at
# most $project_maxdepth levels deep) and every directory accepted by
# check_export_ok() yields { path => <path relative to $projects_list> }.
# If $projects_list is a plain file, each line holds a URL-encoded project
# path and owner separated by whitespace, and every accepted project
# yields { path => ..., owner => ... }.
#
# $filter is optional; a trailing '.git' is removed from it.  When given,
# only projects below "<filter>/" are returned (used when looking for
# forks).  Without a filter, and with the 'forks' feature enabled, entries
# of the file that look like forks of a project accepted earlier in the
# file are left out.
#
# Returns an empty list if $projects_list is neither a directory nor a
# plain file, and nothing if the file cannot be opened.
sub git_get_projects_list {
        my ($filter) = @_;
        my @list;

        $filter ||= '';
        $filter =~ s/\.git$//;

        my $check_forks = gitweb_check_feature('forks');

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list . ($filter ? "/$filter" : '');
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                # length and number of slashes of the starting directory,
                # used to derive relative paths and the search depth below
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                # path of the found directory relative to $dir
                                my $subdir = substr($File::Find::name, $pfxlen + 1);
                                # we check related file in $projectroot
                                my $path = ($filter ? "$filter/" : '') . $subdir;
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        # do not descend into an accepted project
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                # accepted project paths (without '.git') seen so far,
                # used for the fork detection below
                my %paths;
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next;
                        }
                        if ($filter ne '') {
                                # looking for forks;
                                # keep only "<filter>/<something>.git"
                                my $pfx = substr($path, 0, length($filter));
                                if ($pfx ne $filter) {
                                        next PROJECT;
                                }
                                my $sfx = substr($path, length($filter));
                                if ($sfx !~ /^\/.*\.git$/) {
                                        next PROJECT;
                                }
                        } elsif ($check_forks) {
                        PATH:
                                # this $filter shadows the parameter: it is
                                # one of the project paths accepted so far
                                foreach my $filter (keys %paths) {
                                        # looking for forks;
                                        my $pfx = substr($path, 0, length($filter));
                                        if ($pfx ne $filter) {
                                                next PATH;
                                        }
                                        my $sfx = substr($path, length($filter));
                                        if ($sfx !~ /^\/.*\.git$/) {
                                                next PATH;
                                        }
                                        # is a fork, don't include it in
                                        # the list
                                        next PROJECT;
                                }
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                                # remember the project (minus '.git') so that
                                # later entries below it count as its forks
                                (my $forks_path = $path) =~ s/\.git$//;
                                $paths{$forks_path}++;
                        }
                }
                close $fd;
        }
        return @list;
}
2755
# Cache of project path => owner (as UTF-8) read from the $projects_list
# file; undef until git_get_project_list_from_file has run once.
our $gitweb_project_owner = undef;

# Fills $gitweb_project_owner from $projects_list, if that is a plain
# file.  Does nothing when the cache has already been filled.  If the file
# cannot be opened the cache is left empty; lines without a project path
# (e.g. blank lines) are skipped.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # do not read from a handle that failed to open
                open(my $fd, '<', $projects_list)
                        or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # a blank line has no project path to use as key
                        next unless defined $pr;
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
}
2778
# Returns the owner of the given project, or undef if no project is given.
# Sources are tried in this order until one gives a defined value: the
# $projects_list file (through the $gitweb_project_owner cache), the
# 'gitweb.owner' config variable, and get_file_owner() on the repository
# directory.
# Side effect: points the global $git_dir at the project.
sub git_get_project_owner {
        my ($project) = @_;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # load the owners listed in the projects file on first use
        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if exists $gitweb_project_owner->{$project};
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
2802
# Returns (age in seconds, age as string) of the most recent commit on any
# branch of the project at $path (relative to $projectroot), taken from the
# committer line of the newest head reported by 'git for-each-ref'.
# Returns (undef, undef) if no timestamp can be found in the output, and
# nothing if git cannot be started or closing the pipe reports failure.
# Side effect: points the global $git_dir at the project.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        my $newest = <$fd>;
        return unless close $fd;

        return (undef, undef) unless defined $newest;

        # the line ends with "<epoch> <timezone>"
        if (my ($timestamp) = ($newest =~ / (\d+) [-+][01]\d\d\d$/)) {
                my $age = time - $timestamp;
                return ($age, age_string($age));
        }
        return (undef, undef);
}
2823
# Returns the remotes of the current repository as a hash (a hash reference
# in scalar context) of remote name => { heads => undef, <key> => <url> },
# where <key> is the word 'git remote -v' prints in parentheses after the
# URL.  If $wanted is given, only that remote is returned.
# Returns nothing if git cannot be started or closing the pipe reports
# failure.  Lines that do not look like "<name>\t<url> (<key>)" are
# skipped.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find if that
# particular remote is defined is to walk the list provided by
# 'git remote -v' and stop if and when we find what we want.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # test the result of open itself, not the handle afterwards
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # cut "\t<url> (<key>)" off, leaving the remote name; when the
                # line has another shape $1 and $2 would be stale, so skip it
                $remote =~ s!\t(.*?)\s+\((\w+)\)$!!
                        or next;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # 'heads' is filled in later (see fill_remote_heads); an
                # explicit undef avoids building an odd-length hash
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
2848
# Takes a hash of remotes (a reference, keyed by remote name) as first
# parameter and fills it by adding the available remote heads for each of
# the indicated remotes under the 'heads' key.
# The heads come from git_get_heads_list() called for "remotes/<name>";
# the "<name>/" prefix is stripped from the 'name' of every head that is
# assigned to a remote.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # The substitution both selects the heads of this remote and
                # strips the prefix from their names (grep aliases the
                # elements).  \Q..\E: the remote name is literal text, so
                # that e.g. "my.remote" does not also claim "myXremote/...".
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
2861
# Returns a reference to a hash mapping object id to an array reference of
# the names of the refs pointing at it (without the leading 'refs/'), as
# listed by 'git show-ref --dereference'.
# The optional $type (e.g. "heads" or "tags") limits the listing to
# 'refs/<type>'.
# Returns nothing if git cannot be started or closing the pipe reports
# failure.
sub git_get_references {
        my ($type) = @_;
        $type ||= "";

        my @cmd = (git_cmd(), "show-ref", "--dereference");
        # use -- <pattern> if $type
        push @cmd, "--", "refs/$type" if $type;
        open(my $fd, "-|", @cmd) or return;

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        my %refs;
        while (my $line = <$fd>) {
                chomp $line;
                my ($id, $name) =
                        ($line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!)
                        or next;
                push @{ $refs{$id} }, $name;
        }
        return unless close $fd;

        return \%refs;
}
2884
# Returns the name 'git name-rev --tags' gives to $hash relative to a tag
# (the part after "tags/" in its output), or undef if $hash is missing
# (false), git prints nothing, or the revision cannot be named after a tag.
# Returns nothing if git cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # $name_rev is undef when git printed nothing; \Q..\E because $hash
        # is literal text to find, not a pattern
        if (defined $name_rev && $name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
2900
2901## ----------------------------------------------------------------------
2902## parse to hash functions
2903
# Breaks the timestamp $epoch (seconds since the Unix epoch) into a hash of
# ready-to-use date fields.  $tz is the timezone as "+hhmm"/"-hhmm" and
# defaults to "-0000".
# In UTC: 'hour', 'minute', 'mday', 'day' and 'month' (English three-letter
# names), and the formatted 'rfc2822', 'mday-time' and 'iso-8601'.
# In the given timezone: 'hour_local', 'minute_local', 'iso-tz', and
# 'tz_local' (the timezone string itself).
sub parse_date {
        my ($epoch, $tz) = @_;
        $tz ||= "-0000";

        my @month_names = qw(Jan Feb Mar Apr May Jun Jul Aug Sep Oct Nov Dec);
        my @day_names   = qw(Sun Mon Tue Wed Thu Fri Sat);

        # fields in UTC
        my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
        my ($day, $month) = ($day_names[$wday], $month_names[$mon]);
        my %date = (
                'hour'      => $hour,
                'minute'    => $min,
                'mday'      => $mday,
                'day'       => $day,
                'month'     => $month,
                'rfc2822'   => sprintf("%s, %d %s %4d %02d:%02d:%02d +0000",
                                       $day, $mday, $month, 1900+$year, $hour, $min, $sec),
                'mday-time' => sprintf("%d %s %02d:%02d",
                                       $mday, $month, $hour, $min),
                'iso-8601'  => sprintf("%04d-%02d-%02dT%02d:%02d:%02dZ",
                                       1900+$year, 1+$mon, $mday, $hour, $min, $sec),
        );

        # fields in the given timezone: shift the epoch by the offset and
        # break it down as if it were UTC
        my ($tz_sign, $tz_hour, $tz_min) =
                ($tz =~ m/^([-+])(\d\d)(\d\d)$/);
        my $direction = ($tz_sign eq '-') ? -1 : +1;
        my $local = $epoch + $direction*((($tz_hour*60) + $tz_min)*60);
        ($sec, $min, $hour, $mday, $mon, $year) = gmtime($local);
        $date{'hour_local'}   = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'}     = $tz;
        $date{'iso-tz'}       = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                        1900+$year, $mon+1, $mday,
                                        $hour, $min, $sec, $tz);
        return %date;
}
2937
# Parses the tag object $tag_id, as printed by 'git cat-file tag', into a
# hash with the keys 'id', 'object', 'type', 'name', 'author' (the tagger),
# 'author_epoch', 'author_tz', 'author_name', 'author_email' (only when
# the tagger has the form "name <email>") and 'comment' (array reference
# of the message lines).
# Returns nothing if git cannot be started, closing the pipe reports
# failure, or the object has no 'tag' header.
sub parse_tag {
        my ($tag_id) = @_;

        my @cmd = (git_cmd(), "cat-file", "tag", $tag_id);
        open(my $fd, "-|", @cmd) or return;

        my %tag = ('id' => $tag_id);
        my @comment;

        # the header ends at the first empty line, or at a line containing
        # '--BEGIN', which is kept as the first line of the comment
        HEADER:
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next HEADER;
                }
                if (my ($who, $epoch, $tz) =
                    ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/)) {
                        @tag{'author', 'author_epoch', 'author_tz'} =
                                ($who, $epoch, $tz);
                        if (my ($name, $email) = ($who =~ m/^([^<]+) <([^>]*)>/)) {
                                $tag{'author_name'}  = $name;
                                $tag{'author_email'} = $email;
                        } else {
                                $tag{'author_name'} = $who;
                        }
                        next HEADER;
                }
                if ($line =~ m/--BEGIN/) {
                        push @comment, $line;
                        last HEADER;
                }
                last HEADER if ($line eq "");
        }

        # whatever is left is the message; these lines are stored as read
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
2978
# Parses the text of one commit into a hash.
#
# $commit_text is one record as read by parse_commit from
# 'git rev-list --header' with "\0" as record separator: a first line with
# the commit id (followed by the parent ids when rev-list was run with
# '--parents'), the header lines, and the commit message.
# $withparents says where the parents come from: when it is defined they
# are taken only from the first line; when it is not defined, the ids of
# the 'parent' header lines are collected as well.
#
# Returns a hash with the keys 'id', 'tree', 'parents' (array reference),
# 'parent' (first parent), 'author*' and 'committer*' (full string, _epoch,
# _tz, _name, _email), 'title', 'title_short', 'comment' (array reference
# of the message lines without their 4-space indent), 'age', 'age_string',
# 'age_string_date' and 'age_string_age'.
# Returns nothing if the text has no lines left, the first line does not
# start with a 40-digit hex id, or there is no 'tree' header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        # first line: commit id, then (optionally) the parent ids
        ($co{'id'}, my @parents) = split ' ', $header;
        # Header lines are consumed up to and including the first false
        # (i.e. empty) line.  NOTE(review): the lines come from a split on
        # newlines, so the comparison with "\n" looks like it can never
        # match -- confirm.
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # The title is the first non-empty line of the message.
        # NOTE(review): $title aliases the element of @commit_lines, so the
        # substitutions below also change that line of the stored comment --
        # confirm this is intended.
        foreach my $title (@commit_lines) {
                $title =~ s/^    //;
                if ($title ne "") {
                        $co{'title'} = chop_str($title, 80, 5);
                        # remove leading stuff of merges to make the interesting part visible
                        if (length($title) > 50) {
                                $title =~ s/^Automatic //;
                                $title =~ s/^merge (of|with) /Merge ... /i;
                                if (length($title) > 50) {
                                        $title =~ s/(http|rsync):\/\///;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/(master|www|rsync)\.//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/kernel.org:?//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/\/pub\/scm//;
                                }
                        }
                        $co{'title_short'} = chop_str($title, 50, 5);
                        last;
                }
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        # age is measured from the committer date
        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # commits older than two weeks get the date (YYYY-MM-DD, UTC) in
        # 'age_string_date' and the age string in 'age_string_age'; for
        # newer commits the two are swapped
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3076
# Parse a single commit and return its fields as a hash (list of pairs).
#
# Runs "git rev-list --parents --header --max-count=1 <commit_id> --" and
# passes the one NUL-terminated record it prints to parse_commit_text(),
# with a true second argument.  Returns what parse_commit_text() returns,
# or an empty list when git-rev-list printed nothing.
# Reports a 500 error through die_error() if the pipe cannot be opened.
sub parse_commit {
        my ($commit_id) = @_;
        my %co;

        # git-rev-list --header terminates every record with NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--",
                or die_error(500, "Open git-rev-list failed");
        # Read the record in scalar context.  In list context an empty output
        # would vanish from the argument list and the flag 1 would end up
        # being parsed as if it were the commit text.
        my $commit_text = <$fd>;
        %co = parse_commit_text($commit_text, 1)
                if defined $commit_text;
        close $fd;

        return %co;
}
3095
# Parse a series of commits into a list of hashes.
#
# Arguments: starting revision, maximum number of commits (a false value
# means 1), number of commits to skip (a false value means 0), an optional
# path limiter, and any further options for git-rev-list.  The global
# @extra_options are passed to git-rev-list as well.
# Every NUL-terminated record printed by "git rev-list --header" is parsed
# with parse_commit_text().
# Returns the list of hash references, or a reference to that list when
# called in scalar context.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount = 1 unless $maxcount;
        $skip     = 0 unless $skip;

        my @rev_list = (
                git_cmd(), "rev-list",
                "--header",
                @args,
                "--max-count=" . $maxcount,
                "--skip=" . $skip,
                @extra_options,
                $commit_id,
                "--",
        );
        # the path limiter goes after "--" and only when one was given
        push @rev_list, $filename if $filename;

        # records are terminated by NUL, not by newline
        local $/ = "\0";

        open my $fd, "-|", @rev_list
                or die_error(500, "Open git-rev-list failed");
        my @cos;
        while (defined(my $record = <$fd>)) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return \@cos unless wantarray;
        return @cos;
}
3123
# Parse one line of git-diff-tree "raw" output into a hash of fields.
#
# Three kinds of lines are recognized:
#  - ordinary diff:
#    ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
#  - combined diff (for merge commit):
#    '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
#  - a bare commit id:
#    'c512b523472485aef4fff9e57b229d9d243c967f'
# Any other line yields an empty hash.
# Returns the hash in list context, a reference to it in scalar context.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                # save the path part before anything else can run a regexp
                my $paths = $7;
                @res{qw(from_mode to_mode from_id to_id status similarity)} =
                        ($1, $2, $3, $4, $5, $6);
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') {
                        # renamed or copied: two tab-separated pathnames
                        ($res{'from_file'}, $res{'to_file'}) =
                                map { unquote($_) } split("\t", $paths);
                } else {
                        my $file = unquote($paths);
                        $res{$_} = $file for qw(from_file to_file file);
                }
        }
        # the substitution only changes the local copy of the line
        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
                my ($colons, $modes, $ids, $statuses, $file) = ($1, $2, $3, $4, $5);
                # the last mode and the last id describe the result,
                # the ones before them describe the parents
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $statuses) ];
                $res{'to_file'}   = unquote($file);
        }
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return %res if wantarray;
        return \%res;
}
3162
# wrapper: return parsed line of git-diff-tree "raw" output
# The argument is either a raw line, which is handed to
# parse_difftree_raw_line(), or a hash reference with already parsed
# (or hand-made) info, which is returned as is.
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # anything that is not a hash reference is treated as raw text
        return parse_difftree_raw_line($line_or_ref)
                unless ref($line_or_ref) eq "HASH";

        return $line_or_ref;
}
3175
# Parse one line of git-ls-tree output into a hash of fields.
#
# Arguments: the line, followed by options given as key/value pairs:
#   -l => true   the line comes from "git ls-tree -l" and has a size column
#   -z => true   the name is taken verbatim instead of going through unquote()
# The result has the keys 'mode', 'type', 'hash', 'name' and, with -l, 'size'.
# A line that does not look like ls-tree output yields an empty hash.
# Returns the hash in list context, a reference to it in scalar context.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        my @fields;
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                @fields = ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s);
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                @fields = ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);
        }

        # Use the list returned by the match rather than $1, $2, ...: after a
        # failed match those variables still hold the captures of some earlier
        # successful match and would leak unrelated data into the result.
        if (@fields) {
                my $name = pop @fields;
                @res{qw(mode type hash)} = @fields[0 .. 2];
                $res{'size'} = $fields[3] if $opts{'-l'};
                $res{'name'} = $opts{'-z'} ? $name : unquote($name);
        }

        return wantarray ? %res : \%res;
}
3211
# Fills _two_ hashes describing the preimage and postimage of a diff entry;
# references to them are passed as the 2nd and 3rd argument.
#
# Arguments: parsed diff info, reference to the "from" hash, reference to
# the "to" hash, and the list of parent commit ids (used for combined diff).
# In each hash 'file' is set to the file name and 'href' to a "blob" link.
# For a combined diff the "from" values are arrays with one entry per parent,
# and the 'href' entry is undef for a parent in which the file was added.
# For an ordinary diff 'href' is removed from "from" for an added file.
# 'href' is removed from "to" when is_deleted() says the file is gone.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                unless (exists $diffinfo->{'from_file'}) {
                        fill_from_file_info($diffinfo, @parents);
                }
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the resulting name if the name in
                        # this parent is not known
                        my $file = $diffinfo->{'from_file'}[$i];
                        $file = $diffinfo->{'to_file'} unless defined $file;
                        $from->{'file'}[$i] = $file;

                        my $link;
                        if ($diffinfo->{'status'}[$i] ne "A") { # not new (added) file
                                $link = href(action=>"blob",
                                             hash_base=>$parents[$i],
                                             hash=>$diffinfo->{'from_id'}[$i],
                                             file_name=>$file);
                        }
                        $from->{'href'}[$i] = $link;
                }
        } else {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) { # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3257
3258## ......................................................................
3259## parse to array of hashes functions
3260
# List branch heads, most recently committed first.
#
# Arguments: an optional limit, followed by the ref classes to list (the
# names under "refs/"; defaults to 'heads').  When a limit is given,
# git-for-each-ref is asked for limit+1 entries.
# Each entry of the result is a hash reference with the keys 'fullname',
# 'name' (with a leading "refs/heads/" or "refs/remotes/" removed), 'id',
# 'title', 'epoch' and 'age'.
# Returns the list in list context, a reference to it in scalar context,
# and nothing if git-for-each-ref could not be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $name, $title) = split(' ', $refinfo, 3);

                # split drops a trailing empty field, so the committer part is
                # undefined when git printed nothing after the NUL
                my $epoch;
                if (defined $committerinfo &&
                    $committerinfo =~ /^(.*) ([0-9]+) (.*)$/) {
                        $epoch = $2;
                }

                $ref_item{'fullname'}  = $name;
                $name =~ s!^refs/(?:head|remote)s/!!;

                $ref_item{'name'}  = $name;
                $ref_item{'id'}    = $hash;
                # test for emptiness, not truth: "0" is a valid subject line
                $ref_item{'title'} = (defined $title && $title ne '')
                        ? $title : '(no commit message)';
                $ref_item{'epoch'} = $epoch;
                if ($epoch) {
                        $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                } else {
                        $ref_item{'age'} = "unknown";
                }

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3299
# List tags, most recently created first.
#
# Argument: an optional limit; when given, git-for-each-ref is asked for
# limit+1 entries.
# Each entry of the result is a hash reference with the keys 'fullname',
# 'name' (with the leading "refs/tags/" removed), 'type', 'id', 'reftype'
# and 'refid'.  Tag objects also get 'subject'; tag objects and commits
# also get 'epoch' and 'age'.
# Returns the list in list context, a reference to it in scalar context,
# and nothing if git-for-each-ref could not be started.
sub git_get_tags_list {
        my $limit = shift;
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);

                # split drops a trailing empty field, so the creator part is
                # undefined when git printed nothing after the NUL
                my $epoch;
                if (defined $creatorinfo &&
                    $creatorinfo =~ /^(.*) ([0-9]+) (.*)$/) {
                        $epoch = $2;
                }

                $ref_item{'fullname'} = $name;
                $name =~ s!^refs/tags/!!;

                $ref_item{'type'} = $type;
                $ref_item{'id'} = $id;
                $ref_item{'name'} = $name;
                if ($type eq "tag") {
                        # tag object: describe what it points to
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # the ref points directly at the object
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        if ($epoch) {
                                $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                        } else {
                                $ref_item{'age'} = "unknown";
                        }
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3348
3349## ----------------------------------------------------------------------
3350## filesystem-related functions
3351
# Return the name of the owner of $path, taken from the GECOS field of the
# password database entry and cut at the first ',' or ';'.
# Returns undef when the path cannot be stat()ed or when there is no
# GECOS information for the owning uid.
sub get_file_owner {
        my $path = shift;

        # Stop here if stat() fails: an undefined uid would be looked up as
        # uid 0 and the file would be reported as owned by the superuser.
        my $st_uid = (stat($path))[4];
        return undef unless defined $st_uid;

        my $gcos = (getpwuid($st_uid))[6];
        return undef unless defined $gcos;

        (my $owner = $gcos) =~ s/[,;].*$//;
        return to_utf8($owner);
}
3364
# Print the contents of $filename to the currently selected output handle,
# passing every line through to_utf8().
# The file is expected to exist; if it cannot be opened nothing is printed
# and the sub returns quietly instead of reading from an unopened handle.
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3373
3374## ......................................................................
3375## mimetype related functions
3376
# Look up the MIME type for $filename in a mime.types style file.
#
# Arguments: the file name to classify and the path of the map file.
# Lines of the map file starting with '#' are skipped.  On the other lines
# the first tab-separated field is the MIME type and the second one is a
# whitespace-separated list of extensions.
# Returns the MIME type recorded for the part of $filename after its last
# dot, or undef when the map file is not readable, $filename has no dot,
# or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # read into a lexical so that the caller's $_ is left alone
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, $exts) = split(/\t+/, $line);
                if (defined $exts) {
                        my @exts = split(/\s+/, $exts);
                        foreach my $ext (@exts) {
                                $mimemap{$ext} = $mimetype;
                        }
                }
        }
        close($mh);

        # Only use $1 when the match succeeded; after a failed match it
        # still holds the capture of an earlier, unrelated match.
        if ($filename =~ /\.([^.]*)$/) {
                return $mimemap{$1};
        }
        return undef;
}
3399
# Guess the MIME type of $filename from its extension.
# The map named by $mimetypes_file is tried first, if one is configured;
# a path not starting with '/' is taken relative to the project directory.
# /etc/mime.types is consulted when that gives no result.
# Returns undef for a file name without a dot or when no map knows the
# extension.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime = mimetype_guess_file($filename, '/etc/mime.types')
                unless $mime;
        return $mime;
}
3416
# Determine the MIME type of a blob.
#
# Arguments: a filehandle open on the blob contents and, optionally, the
# file name.  A type guessed from the file name by mimetype_guess() wins.
# Without a filehandle $default_blob_plain_mimetype is returned.
# Otherwise content that passes the -T (text file) test is 'text/plain',
# a few image types are recognized by file name suffix, and everything
# else is 'application/octet-stream'.
sub blob_mimetype {
        my $fd = shift;
        my $filename = shift;

        if ($filename) {
                my $mime = mimetype_guess($filename);
                return $mime if $mime;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;

        # binary content: recognize a few image types by suffix
        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;

        return 'application/octet-stream';
}
3443
# Return the Content-Type value for a blob.
# $type is used if it is true, otherwise the type is determined by
# blob_mimetype($fd, $file_name).  For 'text/plain' the charset from
# $default_text_plain_charset is appended, provided it is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return $type . "; charset=$default_text_plain_charset";
}
3454
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Arguments: the highlight switch, the MIME type (not used here) and the
# file name.  A trailing '.in' is dropped from the base name, which is then
# looked up in %highlight_basename; failing that, the part after its last
# dot is looked up in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # Take the extension from the match result instead of $1: after a
        # failed match $1 still holds the capture of an earlier, unrelated
        # match, and a name without a dot would be looked up under it.
        my ($ext) = ($basename =~ /\.([^.]*)$/);
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3471
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# When highlighting is requested and a syntax is known, the given FD is
# closed and reopened on a pipeline that feeds "git cat-file blob $hash"
# into $highlight_bin.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        unless ($highlight && defined $syntax) {
                return $fd;
        }

        close $fd;
        # both halves of the pipeline are quoted for the shell separately
        my $cat_blob    = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $highlighter = quote_command($highlight_bin);
        my $pipeline    = $cat_blob . " | " . $highlighter .
                          " --replace-tabs=8 --fragment --syntax $syntax |";
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3485
3486## ======================================================================
3487## functions printing HTML: header, footer, error page
3488
# Build the page title from the site name and, as far as they are defined,
# the current project, action and file name.  Each part is only added when
# the one before it is defined.  For the "tree" action a '/' is appended
# to a file name that does not already end with one.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        }

        return $title;
}
3506
# Print the <link rel="alternate"> elements for the page head.
#
# With a project selected, two links are printed for each of the RSS and
# Atom formats: the feed described by get_feed_info() and the same feed
# with the '--no-merges' extra option.  Without a project, links to the
# project index and to the OPML list of feeds are printed instead.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # Work on a copy made for this format: setting the
                        # '--no-merges' option below in the shared hash would
                        # carry it over into the plain link of the next format.
                        my %params = (%href_params, 'action' => $type);
                        $link_attr{'-href'} = href(%params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        $params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3551
# Print the HTTP header (unless suppressed) and the opening part of the HTML
# page: XML prolog and <head> with title, stylesheets, feed links and
# favicon, then the optional site header file, the page header with logo
# and breadcrumb links and, when a project is selected and the 'search'
# feature is enabled, the search form.
#
# Arguments:
#   $status  - HTTP status; a false value means "200 OK"
#   $expires - passed to the CGI header() call as -expires
#   %opts    - '-no_http_header': if true, the HTTP header is not printed
#              '-action_extra': if defined, it is printed after the action
#                               and the action itself becomes a link
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type;
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        if (defined $cgi->http('HTTP_ACCEPT') &&
            $cgi->http('HTTP_ACCEPT') =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
            $cgi->Accept('application/xhtml+xml') != 0) {
                $content_type = 'application/xhtml+xml';
        } else {
                $content_type = 'text/html';
        }
        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                           -status=> $status, -expires => $expires)
                unless ($opts{'-no_http_header'});
        # the mod_perl version is added to the "generator" meta element
        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        if ($ENV{'PATH_INFO'}) {
                print "<base href=\"".esc_url($base_url)."\" />\n";
        }
        # print out each stylesheet that exists, providing backwards
        # compatibility for those people who defined $stylesheet in a config
        # file: if it is defined, it is used instead of the @stylesheets list
        if (defined $stylesheet) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($stylesheet).'"/>'."\n";
        } else {
                foreach my $stylesheet (@stylesheets) {
                        next unless $stylesheet;
                        print '<link rel="stylesheet" type="text/css" href="'.esc_url($stylesheet).'"/>'."\n";
                }
        }
        # feed links are only printed on pages sent with the "200 OK" status
        print_feed_meta()
                if ($status eq '200 OK');
        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
        }

        print "</head>\n" .
              "<body>\n";

        # optional site-wide header, included only if the file exists
        if (defined $site_header && -f $site_header) {
                insert_file($site_header);
        }

        # page header: logo followed by "home / project / action / extra"
        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $cgi->img({-src => esc_url($logo),
                                         -width => 72, -height => 27,
                                         -alt => "git",
                                         -class => "logo"}));
        }
        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        # the action is plain text unless something follows it
                        my $action_print = $action ;
                        if (defined $opts{-action_extra}) {
                                $action_print = $cgi->a({-href => href(action=>$action)},
                                        $action);
                        }
                        print " / $action_print";
                }
                if (defined $opts{-action_extra}) {
                        print " / $opts{-action_extra}";
                }
                print "\n";
        }
        print "</div>\n";

        # search form, only for a selected project with 'search' enabled
        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                if (!defined $searchtext) {
                        $searchtext = "";
                }
                # search from $hash_base if defined, else from $hash, else HEAD
                my $search_hash;
                if (defined $hash_base) {
                        $search_hash = $hash_base;
                } elsif (defined $hash) {
                        $search_hash = $hash;
                } else {
                        $search_hash = "HEAD";
                }
                # NOTE: this lexical $action is the form target URL; it hides
                # the global $action for the rest of this block
                my $action = $my_uri;
                my $use_pathinfo = gitweb_check_feature('pathinfo');
                if ($use_pathinfo) {
                        $action .= "/".esc_url($project);
                }
                # the hidden "p" (project) input is only printed when the
                # project is not already part of the form target URL
                print $cgi->startform(-method => "get", -action => $action) .
                      "<div class=\"search\">\n" .
                      (!$use_pathinfo &&
                      $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
                      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
                      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
                      $cgi->popup_menu(-name => 'st', -default => 'commit',
                                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
                      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
                      " search:\n",
                      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
                      "<span title=\"Extended regular expression\">" .
                      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                     -checked => $search_use_regexp) .
                      "</span>" .
                      "</div>" .
                      $cgi->end_form() . "\n";
        }
}
3678
# Print the closing part of the HTML page: the page footer with the project
# description and feed links (or, without a project, links to the OPML and
# text project lists), the timing information if the 'timed' feature is
# enabled, the optional site footer file, the JavaScript includes, and the
# closing </body> and </html> tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                # no project selected: links to the site-wide lists
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                # without feed info for this page the links get the
                # additional 'generic' class
                my %href_params = get_feed_info();
                $feed_class .= ' generic' unless %href_params;
                $href_params{'-title'} = 'log' unless $href_params{'-title'};

                for my $format ('RSS', 'Atom') {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                # time elapsed since $t0 was recorded
                my $elapsed = tv_interval($t0, [ gettimeofday() ]);
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      $elapsed.
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;

        # inline script: start incremental blame, or set up the onload handler
        my $script = qq!<script type="text/javascript">\n!;
        if (defined $action && $action eq 'blame_incremental') {
                $script .= qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                           qq!           "!. href() .qq!");\n!;
        } else {
                $script .= qq!window.onload = function () {\n!;
                $script .= qq!       fixLinks();\n!
                        if gitweb_check_feature('javascript-actions');
                # last parameter to onloadTZSetup must be CSS class used by format_timestamp_html
                $script .= qq!       onloadTZSetup('local', 'gitweb_tz', 'datetime');\n!.
                           qq!};\n!;
        }
        $script .= qq!</script>\n!;
        print $script;

        print "</body>\n" .
              "</html>";
}
3749
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
#
# Prints a complete error page (header, message, optional description,
# footer) and then jumps to DONE_GITWEB, unless the '-error_handler' option
# is true.  The error message is escaped with esc_html(); the detailed
# description is printed as is.  Options given after the description are
# passed on to git_header_html().
#
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
sub die_error {
        my ($status, $error, $extra, %opts) = @_;
        $status ||= 500;
        $error = esc_html($error) || "Internal Server Error";

        # status lines for the codes listed above
        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        git_header_html($http_responses{$status}, undef, %opts);

        print "<div class=\"page_body\">\n" .
              "<br /><br />\n" .
              "$status - $error\n" .
              "<br />\n";
        print "<hr />\n" .
              "$extra\n"
                if defined $extra;
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
3793
3794## ----------------------------------------------------------------------
3795## functions printing or outputting HTML: navigation
3796
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        # standard navigation entries, minus the suppressed one (if any)
        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters of each entry, keyed by entry name
        my %arg;
        $arg{$_} = {action=>$_} foreach @navs;

        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        push @with_head, qw(shortlog log);
                }
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # custom actions come as a flat list of (label, link, position) triplets
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (@actions) {
                my ($label, $link, $pos) = splice(@actions,0,3);

                # place the new label right after every entry named $pos
                my @with_label;
                foreach my $nav (@navs) {
                        push @with_label, $nav;
                        push @with_label, $label if $nav eq $pos;
                }
                @navs = @with_label;

                # expand %-placeholders in the link template
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        # current entry is plain text, all the others are links
        my @entries;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @entries, $nav;
                } else {
                        push @entries,
                             $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
                }
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
3846
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes) as a " | "-separated string; the current view is plain text
# rather than a link, and the remotes view is offered only if the
# 'remote_heads' feature is enabled
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                if ($view eq $current) {
                        push @entries, $view;
                } else {
                        push @entries, $cgi->a({-href => href(action=>$view)}, $view);
                }
        }

        return join " | ", @entries;
}
3859
# Returns the "first . prev . next" pager as an HTML string.  "first" and
# "prev" are links only when $page > 0, "next" only when $has_next_link
# is true; otherwise the words are plain text.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my $backward = "first &sdot; prev";
        if ($page > 0) {
                $backward =
                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
                        " &sdot; " .
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        my $forward = "next";
        if ($has_next_link) {
                $forward =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return $backward . " &sdot; " . $forward;
}
3885
3886## ......................................................................
3887## functions printing or outputting HTML: div
3888
# Prints a "header" div holding a single "title" link.  The link goes to
# $action (with $hash and $hash_base added when they are true) and is
# labelled with $title, or with $action if no title was given.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (action => $action);
        $args{'hash'} = $hash if $hash;
        $args{'hash_base'} = $hash_base if $hash_base;

        my $label = $title ? $title : $action;

        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
3902
# Returns one "metadata_url" table row with $name in the first cell and
# $url in the second; both values are inserted as given, without escaping.
sub format_repo_url {
        my ($name, $url) = @_;

        return join '',
                '<tr class="metadata_url">',
                "<td>$name</td>",
                "<td>$url</td>",
                "</tr>\n";
}
3907
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed as *handle, \*handle,
# *handle{IO} or as a lexical / object filehandle, or a function reference.
# In the latter case all following parameters will be taken as argument to
# the content function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        # Recognize filehandles by their underlying type instead of by class
        # name: since Perl 5.12 *handle{IO} is blessed into IO::File (not
        # IO::Handle), and filehandle objects are blessed GLOB references.
        require Scalar::Util;
        my $reftype = Scalar::Util::reftype($content) || '';
        my $is_handle = $reftype eq 'GLOB' || $reftype eq 'IO'
                || ref(\$content) eq 'GLOB'; # bare *handle is a glob, not a ref

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
3945
# Returns HTML for a timestamp: the 'rfc2822' value wrapped in a "datetime"
# span, followed by "(HH:MM tz)" built from the 'hour_local', 'minute_local'
# and 'tz_local' values of the given hash reference.  The HH:MM part is
# wrapped in an "atnight" span when the local hour is below 6.
sub format_timestamp_html {
        my $date = shift;
        my ($hour, $minute, $tz) = @{$date}{qw(hour_local minute_local tz_local)};

        my $clock = sprintf('%02d:%02d', $hour, $minute);
        if ($hour < 6) {
                $clock = '<span class="atnight">' . $clock . '</span>';
        }

        return '<span class="datetime">' . $date->{'rfc2822'} . '</span>' .
               ' (' . $clock . ' ' . $tz . ')';
}
3960
3961# Outputs the author name and date in long form
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';   # enclosing element, 'div' by default
        my $author = $co->{'author_name'};
        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        # pieces of the line: author search link, [timestamp], avatar
        my $author_html = format_search_author($author, "author", esc_html($author));
        my $date_html   = format_timestamp_html(\%ad);
        my $avatar_html = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_html .
              " [" . $date_html . "]" .
              $avatar_html .
              "</$tag>\n";
}
3975
3976# Outputs table rows containing the full author or committer information,
3977# in the format expected for 'commit' view (& similar).
3978# Parameters are a commit hash reference, followed by the list of people
3979# to output information for. If the list is empty it defaults to both
3980# author and committer.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        # no explicit list means both roles
        @people = qw(author committer) unless @people;

        foreach my $who (@people) {
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};

                # first row: role, name and <email> (both as search links),
                # and the avatar cell, which spans both rows
                print "<tr><td>$who</td><td>" .
                      format_search_author($name, $who, esc_html($name)) . " " .
                      format_search_author($email, $who, esc_html("<" . $email . ">")) .
                      "</td><td rowspan=\"2\">" .
                      git_get_avatar($email, -size => 'double') .
                      "</td></tr>\n";

                # second row: the timestamp, under the name
                print "<tr>" .
                      "<td></td><td>" .
                      format_timestamp_html(\%wd) .
                      "</td>" .
                      "</tr>\n";
        }
}
4003
# Prints the "page_path" div: a link to the tree root labelled with the
# project name, then one 'tree' link per leading directory of $name, and
# finally the basename.
#   $name - path to show (optional; only the root link is printed without it)
#   $type - 'blob': basename links to the 'blob_plain' view,
#           'tree': basename links to the 'tree' view,
#           anything else: basename is printed as plain text
#   $hb   - passed as hash_base to every generated link
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                # each leading directory links to its own, cumulative path
                foreach my $dir (@dirname) {
                        $fullname .= ($fullname ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # The basename links use the $name this function was given,
                # not the global $file_name, so that the link always points
                # at the path that is actually displayed.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4041
# Prints the lines of a commit message as HTML, each followed by "<br/>".
#   $log - array reference of message lines; NOTE that it is modified in
#          place (the title and leading empty lines are shifted off)
# Options:
#   -remove_title     => drop the first line of the log
#   -remove_signoff   => do not print signoff-like lines
#                        (Signed-off-by, Acked-by, Cc)
#   -final_empty_line => end the output with a single empty line
# Runs of empty lines are collapsed into one, and empty lines directly
# following a signoff-like line are not printed.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # true if only empty lines were seen since a signoff line
        my $empty = 0;   # true if the last printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        # signoff lines are either highlighted or removed
                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n"
                                unless $opts{'-remove_signoff'};
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                        # $signoff must survive the empty lines that follow a
                        # signoff line, so it is reset only by ordinary text
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4090
4091# return link target (what link points to)
sub git_get_link_target {
        my $hash = shift;

        # the content of the blob is the link target
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;
        # slurp the whole output at once
        my $link_target = do { local $/; <$fd> };
        # a failing close means the command failed: report no target
        close $fd
                or return;

        return $link_target;
}
4108
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links,
# links leading outside the top directory, and undefined link target).
# An undefined or empty basedir means the link is in the top directory.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        return unless defined $link_target;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # compare against '' explicitly, so that a directory named '0'
        # is not mistaken for the top directory
        my $path;
        if (defined $basedir && $basedir ne '') {
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' (but keep a path component named '0',
                # which a plain truth test would throw away)
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        if (@path_parts) {
                                pop @path_parts;
                        } else {
                                # link leads outside repository (outside top dir)
                                return;
                        }
                } else {
                        push @path_parts, $part;
                }
        }
        $path = join('/', @path_parts);

        return $path;
}
4148
4149# print tree entry (row of git_tree), but without encompassing <tr> element
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        # hash_base is passed on to href() only when it is known
        my %base_key = defined $hash_base ? (hash_base => $hash_base) : ();

        my $type = $t->{'type'};
        # name of the entry prefixed with the directory it is listed in
        my $full_name = "$basedir$t->{'name'}";

        # The format of a table row is: mode list link.  Where mode is
        # the mode of the entry, list is the name of the entry, an href,
        # and link is the action links of the entry.

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n" if exists $t->{'size'};

        if ($type eq "blob") {
                print "<td class=\"list\">" .
                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                               file_name=>$full_name, %base_key),
                                -class => "list"}, esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        # symbolic link: show where it points to, as a link
                        # when the target can be expressed relative to top tree
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                print " -> " .
                                      (defined $norm_target
                                       ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                file_name=>$norm_target),
                                                  -title => $norm_target}, esc_path($link_target))
                                       : esc_path($link_target));
                        }
                }
                print "</td>\n";

                # action links: blob [| blame] [| history] | raw
                my @links;
                push @links, $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                                    file_name=>$full_name, %base_key)},
                                     "blob");
                if ($have_blame) {
                        push @links, $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                            file_name=>$full_name, %base_key)},
                                             "blame");
                }
                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                            hash=>$t->{'hash'}, file_name=>$full_name)},
                                             "history");
                }
                push @links, $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                                    file_name=>$full_name)},
                                     "raw");
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } elsif ($type eq "tree") {
                print "<td class=\"list\">" .
                      $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                             file_name=>$full_name,
                                             %base_key)},
                              esc_path($t->{'name'})) .
                      "</td>\n";

                # action links: tree [| history]
                my @links;
                push @links, $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                                    file_name=>$full_name,
                                                    %base_key)},
                                     "tree");
                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                            file_name=>$full_name)},
                                             "history");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";

                my $history = '';
                if (defined $hash_base) {
                        $history = $cgi->a({-href => href(action=>"history",
                                                          hash_base=>$hash_base,
                                                          file_name=>$full_name)},
                                           "history");
                }
                print "<td class=\"link\">" . $history . "</td>\n";
        }
}
4241
4242## ......................................................................
4243## functions printing large fragments of HTML
4244
4245# get pre-image filenames for merge (combined) diff
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        # start with one (undefined) slot per parent
        my $from_file = $diff->{'from_file'} = [ ];
        $from_file->[$diff->{'nparents'} - 1] = undef;

        # only renames and copies get a pre-image filename looked up
        foreach my $i (0 .. $diff->{'nparents'} - 1) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4261
# is current raw difftree line of file deletion, i.e. is its 'to_id'
# the null object id; both the 40-digit (SHA-1) and the 64-digit
# (SHA-256) all-zero ids are recognized
sub is_deleted {
        my $diffinfo = shift;
        my $to_id = $diffinfo->{'to_id'};

        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4268
4269# does patch correspond to [previous] difftree raw line
4270# $diffinfo  - hashref of parsed raw diff format
4271# $patchinfo - hashref of parsed patch diff format
4272#              (the same keys as in $diffinfo)
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        # without both parsed lines there is nothing to compare
        my $have_both = defined $diffinfo && defined $patchinfo;

        # the patch continues the raw line if both name the same 'to_file'
        return $have_both
                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4279
4280
4281sub git_difftree_body {
4282        my ($difftree, $hash, @parents) = @_;
4283        my ($parent) = $parents[0];
4284        my $have_blame = gitweb_check_feature('blame');
4285        print "<div class=\"list_head\">\n";
4286        if ($#{$difftree} > 10) {
4287                print(($#{$difftree} + 1) . " files changed:\n");
4288        }
4289        print "</div>\n";
4290
4291        print "<table class=\"" .
4292              (@parents > 1 ? "combined " : "") .
4293              "diff_tree\">\n";
4294
4295        # header only for combined diff in 'commitdiff' view
4296        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
4297        if ($has_header) {
4298                # table header
4299                print "<thead><tr>\n" .
4300                       "<th></th><th></th>\n"; # filename, patchN link
4301                for (my $i = 0; $i < @parents; $i++) {
4302                        my $par = $parents[$i];
4303                        print "<th>" .
4304                              $cgi->a({-href => href(action=>"commitdiff",
4305                                                     hash=>$hash, hash_parent=>$par),
4306                                       -title => 'commitdiff to parent number ' .
4307                                                  ($i+1) . ': ' . substr($par,0,7)},
4308                                      $i+1) .
4309                              "&nbsp;</th>\n";
4310                }
4311                print "</tr></thead>\n<tbody>\n";
4312        }
4313
4314        my $alternate = 1;
4315        my $patchno = 0;
4316        foreach my $line (@{$difftree}) {
4317                my $diff = parsed_difftree_line($line);
4318
4319                if ($alternate) {
4320                        print "<tr class=\"dark\">\n";
4321                } else {
4322                        print "<tr class=\"light\">\n";
4323                }
4324                $alternate ^= 1;
4325
4326                if (exists $diff->{'nparents'}) { # combined diff
4327
4328                        fill_from_file_info($diff, @parents)
4329                                unless exists $diff->{'from_file'};
4330
4331                        if (!is_deleted($diff)) {
4332                                # file exists in the result (child) commit
4333                                print "<td>" .
4334                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4335                                                             file_name=>$diff->{'to_file'},
4336                                                             hash_base=>$hash),
4337                                              -class => "list"}, esc_path($diff->{'to_file'})) .
4338                                      "</td>\n";
4339                        } else {
4340                                print "<td>" .
4341                                      esc_path($diff->{'to_file'}) .
4342                                      "</td>\n";
4343                        }
4344
4345                        if ($action eq 'commitdiff') {
4346                                # link to patch
4347                                $patchno++;
4348                                print "<td class=\"link\">" .
4349                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
4350                                              "patch") .
4351                                      " | " .
4352                                      "</td>\n";
4353                        }
4354
4355                        my $has_history = 0;
4356                        my $not_deleted = 0;
4357                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
4358                                my $hash_parent = $parents[$i];
4359                                my $from_hash = $diff->{'from_id'}[$i];
4360                                my $from_path = $diff->{'from_file'}[$i];
4361                                my $status = $diff->{'status'}[$i];
4362
4363                                $has_history ||= ($status ne 'A');
4364                                $not_deleted ||= ($status ne 'D');
4365
4366                                if ($status eq 'A') {
4367                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
4368                                } elsif ($status eq 'D') {
4369                                        print "<td class=\"link\">" .
4370                                              $cgi->a({-href => href(action=>"blob",
4371                                                                     hash_base=>$hash,
4372                                                                     hash=>$from_hash,
4373                                                                     file_name=>$from_path)},
4374                                                      "blob" . ($i+1)) .
4375                                              " | </td>\n";
4376                                } else {
4377                                        if ($diff->{'to_id'} eq $from_hash) {
4378                                                print "<td class=\"link nochange\">";
4379                                        } else {
4380                                                print "<td class=\"link\">";
4381                                        }
4382                                        print $cgi->a({-href => href(action=>"blobdiff",
4383                                                                     hash=>$diff->{'to_id'},
4384                                                                     hash_parent=>$from_hash,
4385                                                                     hash_base=>$hash,
4386                                                                     hash_parent_base=>$hash_parent,
4387                                                                     file_name=>$diff->{'to_file'},
4388                                                                     file_parent=>$from_path)},
4389                                                      "diff" . ($i+1)) .
4390                                              " | </td>\n";
4391                                }
4392                        }
4393
4394                        print "<td class=\"link\">";
4395                        if ($not_deleted) {
4396                                print $cgi->a({-href => href(action=>"blob",
4397                                                             hash=>$diff->{'to_id'},
4398                                                             file_name=>$diff->{'to_file'},
4399                                                             hash_base=>$hash)},
4400                                              "blob");
4401                                print " | " if ($has_history);
4402                        }
4403                        if ($has_history) {
4404                                print $cgi->a({-href => href(action=>"history",
4405                                                             file_name=>$diff->{'to_file'},
4406                                                             hash_base=>$hash)},
4407                                              "history");
4408                        }
4409                        print "</td>\n";
4410
4411                        print "</tr>\n";
4412                        next; # instead of 'else' clause, to avoid extra indent
4413                }
4414                # else ordinary diff
4415
4416                my ($to_mode_oct, $to_mode_str, $to_file_type);
4417                my ($from_mode_oct, $from_mode_str, $from_file_type);
4418                if ($diff->{'to_mode'} ne ('0' x 6)) {
4419                        $to_mode_oct = oct $diff->{'to_mode'};
4420                        if (S_ISREG($to_mode_oct)) { # only for regular file
4421                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
4422                        }
4423                        $to_file_type = file_type($diff->{'to_mode'});
4424                }
4425                if ($diff->{'from_mode'} ne ('0' x 6)) {
4426                        $from_mode_oct = oct $diff->{'from_mode'};
4427                        if (S_ISREG($from_mode_oct)) { # only for regular file
4428                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
4429                        }
4430                        $from_file_type = file_type($diff->{'from_mode'});
4431                }
4432
4433                if ($diff->{'status'} eq "A") { # created
4434                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
4435                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
4436                        $mode_chng   .= "]</span>";
4437                        print "<td>";
4438                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4439                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
4440                                      -class => "list"}, esc_path($diff->{'file'}));
4441                        print "</td>\n";
4442                        print "<td>$mode_chng</td>\n";
4443                        print "<td class=\"link\">";
4444                        if ($action eq 'commitdiff') {
4445                                # link to patch
4446                                $patchno++;
4447                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4448                                              "patch") .
4449                                      " | ";
4450                        }
4451                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4452                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
4453                                      "blob");
4454                        print "</td>\n";
4455
4456                } elsif ($diff->{'status'} eq "D") { # deleted
4457                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
4458                        print "<td>";
4459                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4460                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
4461                                       -class => "list"}, esc_path($diff->{'file'}));
4462                        print "</td>\n";
4463                        print "<td>$mode_chng</td>\n";
4464                        print "<td class=\"link\">";
4465                        if ($action eq 'commitdiff') {
4466                                # link to patch
4467                                $patchno++;
4468                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4469                                              "patch") .
4470                                      " | ";
4471                        }
4472                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4473                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
4474                                      "blob") . " | ";
4475                        if ($have_blame) {
4476                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
4477                                                             file_name=>$diff->{'file'})},
4478                                              "blame") . " | ";
4479                        }
4480                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
4481                                                     file_name=>$diff->{'file'})},
4482                                      "history");
4483                        print "</td>\n";
4484
4485                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
4486                        my $mode_chnge = "";
4487                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4488                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
4489                                if ($from_file_type ne $to_file_type) {
4490                                        $mode_chnge .= " from $from_file_type to $to_file_type";
4491                                }
4492                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
4493                                        if ($from_mode_str && $to_mode_str) {
4494                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
4495                                        } elsif ($to_mode_str) {
4496                                                $mode_chnge .= " mode: $to_mode_str";
4497                                        }
4498                                }
4499                                $mode_chnge .= "]</span>\n";
4500                        }
4501                        print "<td>";
4502                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4503                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
4504                                      -class => "list"}, esc_path($diff->{'file'}));
4505                        print "</td>\n";
4506                        print "<td>$mode_chnge</td>\n";
4507                        print "<td class=\"link\">";
4508                        if ($action eq 'commitdiff') {
4509                                # link to patch
4510                                $patchno++;
4511                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4512                                              "patch") .
4513                                      " | ";
4514                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4515                                # "commit" view and modified file (not onlu mode changed)
4516                                print $cgi->a({-href => href(action=>"blobdiff",
4517                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4518                                                             hash_base=>$hash, hash_parent_base=>$parent,
4519                                                             file_name=>$diff->{'file'})},
4520                                              "diff") .
4521                                      " | ";
4522                        }
4523                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4524                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
4525                                       "blob") . " | ";
4526                        if ($have_blame) {
4527                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4528                                                             file_name=>$diff->{'file'})},
4529                                              "blame") . " | ";
4530                        }
4531                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4532                                                     file_name=>$diff->{'file'})},
4533                                      "history");
4534                        print "</td>\n";
4535
4536                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
4537                        my %status_name = ('R' => 'moved', 'C' => 'copied');
4538                        my $nstatus = $status_name{$diff->{'status'}};
4539                        my $mode_chng = "";
4540                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4541                                # mode also for directories, so we cannot use $to_mode_str
4542                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
4543                        }
4544                        print "<td>" .
4545                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
4546                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
4547                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
4548                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
4549                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
4550                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
4551                                      -class => "list"}, esc_path($diff->{'from_file'})) .
4552                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
4553                              "<td class=\"link\">";
4554                        if ($action eq 'commitdiff') {
4555                                # link to patch
4556                                $patchno++;
4557                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4558                                              "patch") .
4559                                      " | ";
4560                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4561                                # "commit" view and modified file (not only pure rename or copy)
4562                                print $cgi->a({-href => href(action=>"blobdiff",
4563                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4564                                                             hash_base=>$hash, hash_parent_base=>$parent,
4565                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
4566                                              "diff") .
4567                                      " | ";
4568                        }
4569                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4570                                                     hash_base=>$parent, file_name=>$diff->{'to_file'})},
4571                                      "blob") . " | ";
4572                        if ($have_blame) {
4573                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4574                                                             file_name=>$diff->{'to_file'})},
4575                                              "blame") . " | ";
4576                        }
4577                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4578                                                    file_name=>$diff->{'to_file'})},
4579                                      "history");
4580                        print "</td>\n";
4581
4582                } # we should not encounter Unmerged (U) or Unknown (X) status
4583                print "</tr>\n";
4584        }
4585        print "</tbody>" if $has_header;
4586        print "</table>\n";
4587}
4588
# Print the "patchset" part of a diff view as HTML.
#
# Reads patch text line by line from filehandle $fd and pairs every patch
# with its raw difftree entry from @$difftree, so that each patch is put in
# <div class="patch" id="patchN"> (N counted from 1), which is the anchor
# used by "patch" links in the difftree / whatchanged part.
#
# Parameters:
#   $fd           - filehandle with patch output; everything before the
#                   first line starting with "diff " is skipped
#   $difftree     - reference to array of raw difftree entries; each entry
#                   is passed to parsed_difftree_line()
#   $hash         - accepted to keep the call interface, not used here
#   @hash_parents - parents of the commit; more than one parent turns on
#                   combined diff handling
#
# All output is written with print.
sub git_patchset_body {
        my ($fd, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;      # index into @$difftree of current raw line
        my $patch_number = 0;   # number of patches emitted so far
        my $patch_line;
        my $diffinfo;
        my $to_name;
        my (%from, %to);

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belongs to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # end of input: "last" skips the continue block,
                        # so the patch div has to be closed here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                if (!defined $patch_line) {
                        # input ended right after the "---" line (truncated
                        # patch): there is no "+++" line to format, so close
                        # the patch and stop instead of chomp-ing undef
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        print format_diff_line($patch_line, \%from, \%to);
                }

        } continue {
                # runs on "next PATCH" and on normal end of the loop body
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
4739
4740# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4741
# Collects display information for every project in @$projlist: last
# activity ('age', 'age_string'), description ('descr', 'descr_long'),
# 'owner', and, depending on features, 'forks' and 'ctags'.
# Projects for which git_get_last_activity() returns nothing are left
# out of the returned list.
# NOTE: the hashes referenced from @$projlist are updated in place,
# but @$projlist itself keeps all of its entries
sub fill_project_list_info {
        my ($projlist, $check_forks) = @_;
        my $show_ctags = gitweb_check_feature('ctags');
        my @filled;

        foreach my $pr (@$projlist) {
                # no activity information: project is not listed
                my @activity = git_get_last_activity($pr->{'path'});
                next unless @activity;
                @{$pr}{'age', 'age_string'} = @activity;

                # description and owner are looked up only if not yet known
                unless (defined $pr->{'descr'}) {
                        my $descr = to_utf8(git_get_project_description($pr->{'path'}) || "");
                        $pr->{'descr_long'} = $descr;
                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || ""
                        unless defined $pr->{'owner'};

                if ($check_forks) {
                        # "name.git" is marked as having forks when directory
                        # "name" exists under $projectroot
                        my $pname = $pr->{'path'};
                        my $has_forks = ($pname =~ s/\.git$//)
                                     && ($pname !~ /\/$/)
                                     && (-d "$projectroot/$pname");
                        $pr->{'forks'} = $has_forks ? "-d $projectroot/$pname" : 0;
                }

                $pr->{'ctags'} = git_get_project_ctags($pr->{'path'}) if $show_ctags;
                push @filled, $pr;
        }

        return @filled;
}
4782
# print 'sort by' <th> element as generated by format_sort_th();
# all arguments are handed over unchanged
sub print_sort_th {
        my @th = format_sort_th(@_);
        print @th;
}
4788
# Returns 'sort by' <th> element for column $name.
#   $name   - sort order this column stands for
#   $order  - sort order currently in use
#   $header - column title; defaults to ucfirst($name)
# If $order is already $name the title is plain text, otherwise it is
# a replay link which selects order $name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header = ucfirst($name) unless $header;

        # currently selected order: no link needed
        return "<th>$header</th>\n" if $order eq $name;

        my $link = $cgi->a({-href => href(-replay=>1, order=>$name),
                            -class => "header"}, $header);
        return "<th>" . $link . "</th>\n";
}
4805
# Print HTML table with list of projects.
#   $projlist  - reference to array of project hashes, handed over to
#                fill_project_list_info()
#   $order     - sort order: 'project', 'descr', 'owner' or 'age';
#                $default_projects_order is used when it is false
#   $from, $to - range of entries (after sorting) to show; by default
#                from the first to the last one
#   $extra     - if defined, HTML put in an additional row at the bottom
#   $no_header - if true, row with column headers is left out
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;

        my $check_forks = gitweb_check_feature('forks');
        my @projects = fill_project_list_info($projlist, $check_forks);

        $order = $default_projects_order unless $order;
        $from = 0 if !defined $from;
        if (!defined $to || $to > $#projects) {
                $to = $#projects;
        }

        # for each sort order: hash key to sort by, and kind of comparison
        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );
        my $oi = $order_info{$order};
        my $sort_key = $oi->{'key'};
        @projects = ($oi->{'type'} eq 'str')
                ? (sort { $a->{$sort_key} cmp $b->{$sort_key} } @projects)
                : (sort { $a->{$sort_key} <=> $b->{$sort_key} } @projects);

        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                # add up tag values of all projects for the tag cloud
                my %ctags;
                foreach my $p (@projects) {
                        $ctags{$_} += $p->{'ctags'}->{$_}
                                foreach keys %{$p->{'ctags'}};
                }
                my $cloud = git_populate_project_tagcloud(\%ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        if (!$no_header) {
                my @columns = (
                        ['project', 'Project'],
                        ['descr',   'Description'],
                        ['owner',   'Owner'],
                        ['age',     'Last Change'],
                );
                print "<tr>\n";
                print "<th></th>\n" if $check_forks;
                print_sort_th($_->[0], $order, $_->[1]) foreach @columns;
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        my $alternate = 1;
        my $tagfilter = $cgi->param('by_tag');
        foreach my $i ($from .. $to) {
                my $pr = $projects[$i];

                # filter by tag: project must carry the tag (case insensitive)
                if ($tagfilter && $show_ctags) {
                        my $matching = grep { lc $_ eq lc $tagfilter } keys %{$pr->{'ctags'}};
                        next unless $matching;
                }
                # filter by search text: path or long description must match
                if ($searchtext) {
                        next unless $pr->{'path'} =~ /$searchtext/
                                 || $pr->{'descr_long'} =~ /$searchtext/;
                }
                # Weed out forks or non-matching entries of search
                if ($check_forks) {
                        my $forkbase = $project || '';
                        $forkbase =~ s#\.git$#/#;
                        $forkbase = "^$forkbase" if $forkbase;
                        next if !$searchtext && !$tagfilter && $show_ctags
                             && $pr->{'path'} =~ m#$forkbase.*/.*#; # regexp-safe
                }

                # rows alternate between "dark" and "light"
                my $row_start = $alternate ? "<tr class=\"dark\">\n" : "<tr class=\"light\">\n";
                print $row_start;
                $alternate ^= 1;

                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                print "<!-- $pr->{'forks'} -->\n";
                                print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "+");
                        }
                        print "</td>\n";
                }

                # project name, description and owner
                my $name_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                         -class => "list"}, esc_html($pr->{'path'}));
                my $descr_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                          -class => "list", -title => $pr->{'descr_long'}},
                                         esc_html($pr->{'descr'}));
                my $owner = chop_and_escape_str($pr->{'owner'}, 15);
                print "<td>" . $name_link . "</td>\n" .
                      "<td>" . $descr_link . "</td>\n" .
                      "<td><i>" . $owner . "</i></td>\n";

                # age and links to other views of the project
                my $age_css = age_class($pr->{'age'});
                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                my @links;
                foreach my $view (qw(summary shortlog log tree)) {
                        my $link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>$view)}, $view);
                        push @links, $link;
                }
                if ($pr->{'forks'}) {
                        my $link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks");
                        push @links, $link;
                }
                print "<td class=\"". $age_css . "\">" .
                      $age_text . "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links) .
                      "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n";
                print "<td></td>\n" if $check_forks;
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4912
# Print commits from @$commitlist in "log" format: for each commit a header
# div, links to commit / commitdiff / tree views, authorship and the full
# commit message.
#   $commitlist - reference to array of commit hashes (hash references)
#   $from, $to  - range of entries to print; by default from the first
#                 entry to the last one ($to is clamped to the last index)
#   $refs       - passed to format_ref_marker() together with commit id
#   $extra      - if true, HTML printed in a "page_nav" div after the list
sub git_log_body {
        # uses global variable $cgi; the original note here names $project,
        # presumably reached through href() -- it is not read in this sub
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from (and not at 0), so that the $from argument is
        # honoured in the same way as in the other *_body subroutines
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                next if !%co; # skip empty entries
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n"; # class="title_text"

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
4951
# Print commits from @$commitlist as rows of "shortlog" table: date,
# author, subject and links to commit / commitdiff / tree views
# (plus snapshot links, if format_snapshot_links() returns any).
#   $commitlist - reference to array of commit hashes (hash references)
#   $from, $to  - range of entries to print; by default from the first
#                 entry to the last one ($to is clamped to the last index)
#   $refs       - passed to format_ref_marker() together with commit id
#   $extra      - if defined, HTML put in an additional row at the bottom
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        my $last_idx = $#{$commitlist};
        $from = 0 if !defined $from;
        $to = $last_idx if (!defined $to || $to > $last_idx);

        print "<table class=\"shortlog\">\n";
        my $alternate = 1;
        foreach my $i ($from .. $to) {
                my %co = %{$commitlist->[$i]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between "dark" and "light"
                my $row_start = $alternate ? "<tr class=\"dark\">\n" : "<tr class=\"light\">\n";
                print $row_start;
                $alternate ^= 1;

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                # links to other views of this commit, separated by " | "
                my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
                my @links = ($commit_link, $diff_link, $tree_link);
                my $snapshot_links = format_snapshot_links($commit);
                push @links, $snapshot_links if defined $snapshot_links;

                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links) .
                      "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4995
# Print commits from @$commitlist as rows of "history" table for a file
# or directory: date, author, subject and links.
#   $commitlist - reference to array of commit hashes (hash references)
#   $from, $to  - range of entries to print; by default from the first
#                 entry to the last one ($to is clamped to the last index)
#   $refs       - passed to format_ref_marker() together with commit id
#   $extra      - if defined, HTML put in an additional row at the bottom
#   $file_name  - path whose history is shown
#   $file_hash  - hash of current version, compared with the version in
#                 each commit to decide about "diff to current" link
#   $ftype      - used as action and as text of the first link; the
#                 "diff to current" link is considered only for 'blob'
# Also reads global variable $hash_base (for the blobdiff link).
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        $from = 0 if !defined $from;
        if (!defined $to || $to > $#{$commitlist}) {
                $to = $#{$commitlist};
        }

        print "<table class=\"history\">\n";
        my $alternate = 1;
        foreach my $i ($from .. $to) {
                my %co = %{$commitlist->[$i]};
                next unless %co; # skip empty entries
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between "dark" and "light"
                my $row_start = $alternate ? "<tr class=\"dark\">\n" : "<tr class=\"light\">\n";
                print $row_start;
                $alternate ^= 1;

                # shortlog uses format_author_html('td', \%co, 10)
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                # links, separated by " | "
                my $view_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                my @links = ($view_link, $diff_link);

                if ($ftype eq 'blob') {
                        # offer diff only if file in this commit differs
                        # from the current version
                        my $blob_parent = git_get_hash_by_path($commit, $file_name);
                        if (defined $file_hash && defined $blob_parent &&
                            $file_hash ne $blob_parent) {
                                my $current_link =
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$file_hash, hash_parent=>$blob_parent,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                                push @links, $current_link;
                        }
                }

                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links) .
                      "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5055
# Print tags from @$taglist as rows of "tags" table: age, name, subject
# (if there is one), link to the tag object itself (only for entries of
# type "tag") and links to views of the tagged object.
#   $taglist   - reference to array of tag hashes (hash references)
#   $from, $to - range of entries to print; by default from the first
#                entry to the last one ($to is clamped to the last index)
#   $extra     - if defined, HTML put in an additional row at the bottom
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;
        $from = 0 if !defined $from;
        $to = $#{$taglist} if (!defined $to || $to > $#{$taglist});

        print "<table class=\"tags\">\n";
        my $alternate = 1;
        foreach my $i ($from .. $to) {
                my %tag = %{$taglist->[$i]};
                my $comment = $tag{'subject'};
                my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

                # rows alternate between "dark" and "light"
                my $row_start = $alternate ? "<tr class=\"dark\">\n" : "<tr class=\"light\">\n";
                print $row_start;
                $alternate ^= 1;

                # age; cell is left empty when age is not known
                my $age_cell = defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n" : "<td></td>\n";
                print $age_cell;

                # tag name, linking to view of tagged object
                my $name_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                                         -class => "list name"}, esc_html($tag{'name'}));
                print "<td>" .
                      $name_link .
                      "</td>\n" .
                      "<td>";
                print format_subject_html($comment, $comment_short,
                                          href(action=>"tag", hash=>$tag{'id'}))
                        if defined $comment;

                # link to tag object itself
                print "</td>\n" .
                      "<td class=\"selflink\">";
                if ($tag{'type'} ne "tag") {
                        print "&nbsp;";
                } else {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                }

                # links to views of tagged object, depending on its type
                my $ref_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
                my @links = ($ref_link);
                if ($tag{'reftype'} eq "commit") {
                        my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
                        my $log_link = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                        push @links, $shortlog_link, $log_link;
                } elsif ($tag{'reftype'} eq "blob") {
                        my $raw_link = $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                        push @links, $raw_link;
                }
                print "</td>\n" .
                      "<td class=\"link\">" . " | " .
                      join(" | ", @links) .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5118
# Print the heads table: one row for every entry of @$headlist whose index
# lies between $from and $to (inclusive), followed by an optional
# full-width row containing $extra.
#
# $head is the id of the current head; the row whose 'id' equals it gets
# the "current_head" class.  $head may be undefined, in which case no row
# is marked.  $from defaults to 0; $to defaults to, and is capped at, the
# last index of @$headlist.
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

        print "<table class=\"heads\">\n";
        my $alternate = 1;
        for (my $i = $from; $i <= $to; $i++) {
                my $entry = $headlist->[$i];
                my %ref = %$entry;
                # guard against undefined $head so that the comparison does
                # not raise an "uninitialized value" warning
                my $curr = defined $head && $ref{'id'} eq $head;
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td><i>$ref{'age'}</i></td>\n" .
                      ($curr ? "<td class=\"current_head\">" : "<td>") .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                               -class => "list name"},esc_html($ref{'name'})) .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
                      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5156
# Display a single remote block: a table with the remote's URL(s),
# followed by the table of its heads.
#
# $remote is the remote name, $rdata its data hash (keys 'heads', 'fetch'
# and 'push' are read here), $limit an optional cap passed on to
# git_heads_body(), and $head the id of the current head.
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # $push may be undefined here; only collapse the two rows
                # into a single "URL" row when both exist and are identical
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        # when the heads list is cut short, add a "..." link to the full
        # view of this remote
        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5190
# Display a list of remote names with the respective fetch and push URLs.
#
# $remotedata is a hash reference keyed by remote name; each value is a
# hash whose 'fetch' and 'push' entries are read here.  Remotes are listed
# in sorted order.  When $limit is true and smaller than the number of
# remotes, only the first $limit remotes are shown, followed by a "..."
# link to the full remotes view.
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        # truncate the list to the first $limit names
        $#remotes = $limit - 1 if $limited;

        # Iterate with foreach rather than "while (shift)": the latter tests
        # the name for truth and would stop at a remote called "0".
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # a missing URL is shown as plain text instead of a link
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
5234
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names.
#
# $remotedata is a hash reference keyed by remote name, $limit an optional
# cap (on the number of remotes, and passed on as the per-remote heads
# limit), and $head the id of the current head.
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # Walk the remotes in sorted order, as git_remotes_list()
                # does, so that sections appear in a stable order instead
                # of hash order.
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
5251
# Print the commit search results table: one row for every non-empty
# entry of @$commitlist whose index lies between $from and $to
# (inclusive), followed by an optional row containing $extra.
#
# Each row lists the commit's age, author and title, then every comment
# line matching the global $search_regexp (case-insensitively) with the
# match highlighted, then links to the commit, commitdiff and tree views.
# $from defaults to 0; $to defaults to, and is capped at, the last index.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        my $last_idx = $#{$commitlist};
        $from = 0 if !defined $from;
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"commit_search\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                # skip empty entries without consuming a row colour
                next unless %co;

                print "<tr class=\"" . ($dark_row ? "dark" : "light") . "\">\n";
                $dark_row = !$dark_row;

                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                my $message_lines = $co{'comment'};
                foreach my $text (@$message_lines) {
                        next unless $text =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($before, $hit, $after) = ($1, $2, $3);

                        # shorten the match first, then share what is left
                        # of an 80-character budget between both sides of
                        # the context (at most 30 characters each)
                        $hit = chop_str($hit, 70, 5, 'center');
                        my $context_len = int((80 - length($hit))/2);
                        $context_len = 30 if $context_len > 30;
                        $before = chop_str($before, $context_len, 10, 'left');
                        $after  = chop_str($after,  $context_len, 10, 'right');

                        $before = esc_html($before);
                        $hit    = esc_html($hit);
                        $after  = esc_html($after);

                        print "$before<span class=\"match\">$hit</span>$after<br />";
                }

                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                print "</td>\n" .
                      "</tr>\n";
        }

        print "<tr>\n" .
              "<td colspan=\"3\">$extra</td>\n" .
              "</tr>\n"
                if defined $extra;
        print "</table>\n";
}
5311
5312## ======================================================================
5313## ======================================================================
5314## actions
5315
# Action: show the list of all projects, preceded by the optional
# $home_text include file and a project search form.
#
# Reads the 'order' input parameter; it must be exactly one of
# none, project, descr, owner or age, otherwise a 400 error is raised.
# A 404 error is raised when no projects are found.
sub git_project_list {
        my $order = $input_params{'order'};
        # anchored match: the whole value has to be one of the known
        # orderings, not merely contain one of them as a substring
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        # start_form() is the supported spelling in CGI.pm (it pairs with
        # end_form() below); startform() is the deprecated alias
        print $cgi->start_form(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
5341
# Action: show the list of forks of the current project ($project).
#
# Reads the 'order' input parameter; it must be exactly one of
# none, project, descr, owner or age, otherwise a 400 error is raised.
# A 404 error is raised when the project has no forks.
sub git_forks {
        my $order = $input_params{'order'};
        # anchored match: the whole value has to be one of the known
        # orderings, not merely contain one of them as a substring
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
5359
# Action: emit a plain-text project index, one "<path> <owner>" line per
# project returned by git_get_projects_list($project).
#
# Both fields are percent-encoded, except that letters, digits, '_', '.',
# '-' and '/' are kept and a space is written as '+'.  A project's owner
# is looked up with git_get_project_owner() when the entry has no 'owner'
# key yet.
sub git_project_index {
        my @projects = git_get_projects_list($project);

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        for my $pr (@projects) {
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                # work on copies so the project entry itself is not altered
                my @fields = ($pr->{'path'}, $pr->{'owner'});
                for my $field (@fields) {
                        # quote as in CGI::Util::encode, but keep the slash,
                        # and use '+' for ' '
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$fields[0] $fields[1]\n";
        }
}
5383
# Action: show the summary page of the current project ($project).
#
# The page consists of a metadata table (description, owner, last change,
# repository URLs and, if the 'ctags' feature is on, content tags), the
# optional README.html, and shortened shortlog / tags / heads / remotes /
# forks sections.  Each shortened section shows entries 0..15 and ends in
# a "..." link when more entries exist.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
        # undefined when HEAD could not be parsed
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata = $remote_heads ? git_get_remotes_list() : ();
        my @forklist;
        my $check_forks = gitweb_check_feature('forks');

        if ($check_forks) {
                @forklist = git_get_projects_list($project);
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my $url_tag = "URL";
        my @url_list = git_get_project_url_list($project);
        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
        foreach my $git_url (@url_list) {
                next unless $git_url;
                print format_repo_url($url_tag, $git_url);
                # only the first URL row carries the "URL" label
                $url_tag = "";
        }

        # Tag cloud
        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my $ctags = git_get_project_ctags($project);
                my $cloud = git_populate_project_tagcloud($ctags);
                print "<tr id=\"metadata_ctags\"><td>Content tags:<br />";
                print "</td>\n<td>" unless %$ctags;
                # the project name goes into an HTML attribute, so it is
                # escaped rather than interpolated verbatim
                print "<form action=\"$show_ctags\" method=\"post\"><input type=\"hidden\" name=\"p\" value=\"" .
                      esc_html($project) .
                      "\" />Add: <input type=\"text\" name=\"t\" size=\"8\" /></form>";
                print "</td>\n<td>" if %$ctags;
                print git_show_project_tagcloud($cloud, 48);
                print "</td></tr>";
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file("$projectroot/$project/README.html");
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist = $head ? parse_commits($head, 17) : ();
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $#commitlist <=  15 ? undef :
                                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $#taglist <=  15 ? undef :
                              $cgi->a({-href => href(action=>"tags")}, "..."));
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $#headlist <= 15 ? undef :
                               $cgi->a({-href => href(action=>"heads")}, "..."));
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $#forklist <= 15 ? undef :
                                      $cgi->a({-href => href(action=>"forks")}, "..."),
                                      'no_header');
        }

        git_footer_html();
}
5492
# Action: show a single tag object, identified by the global $hash.
#
# Prints a header table linking to the tagged object, the authorship rows
# when the tag has an 'author', and the tag message line by line.
# Raises a 404 error when parse_tag() yields nothing for $hash.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # first row: the tagged object (linked by id) and its type
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                               $tag{'object'}) . "</td>\n" .
              "<td class=\"link\">" . $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                                              $tag{'type'}) . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n" .
              "<div class=\"page_body\">";

        # tag message, one line per <br/>
        my $message = $tag{'comment'};
        foreach my $text (@$message) {
                chomp $text;
                print esc_html($text, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
5527
# Shared implementation of the blame views.
#
# The optional argument selects the output format:
#   'porcelain'   (default) - complete HTML page built from the output of
#                 "git blame -p"
#   'incremental' - HTML page holding only the file contents (from
#                 "git cat-file blob"); also selected when the format is
#                 'porcelain' and the 'js' CGI parameter is true
#   'data'        - text/plain stream of "git blame --incremental" output,
#                 terminated by an "END" line
#
# Uses the globals $file_name, $hash_base and $hash; $hash_base defaults
# to the project's head, and $hash is looked up from the path when unset.
# Raises 403 when the 'blame' feature is off, and 400/404/500 errors for
# missing input, unknown objects and failed git invocations respectively.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact string comparison: a pattern match would accept any
                # type that merely contains "blob", and would warn when the
                # type could not be determined
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                print while <$fd>;
                close $fd
                        or print "ERROR $!\n";

                # trailer line: "END", optionally followed by the elapsed
                # time and the number of git commands run
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit and line links are left empty in this view
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        # read the per-commit header lines up to the
                        # TAB-prefixed line that carries the file contents
                        my $data;
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        # keep the first value seen per key
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a group size is only present on the first line of
                        # a group, so the row colour flips once per group
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # the commit cell spans all rows of the group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent
                        # commit when one is known, else of this commit
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
5757
# Action: blame view in the default format of git_blame_common().
sub git_blame {
        return git_blame_common();
}
5761
# Action: blame view in the 'incremental' format of git_blame_common().
sub git_blame_incremental {
        return git_blame_common('incremental');
}
5765
# Action: blame output in the 'data' format of git_blame_common().
sub git_blame_data {
        return git_blame_common('data');
}
5769
# Action: show the full list of tags of the current project ($project).
# The tags table is omitted when git_get_tags_list() returns nothing.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
        git_print_header_div('summary', $project);

        my @tagslist = git_get_tags_list();
        git_tags_body(\@tagslist) if @tagslist;

        git_footer_html();
}
5782
# Action: show the full list of heads of the current project ($project).
# The heads table is omitted when git_get_heads_list() returns nothing.
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
        git_print_header_div('summary', $project);

        my @headslist = git_get_heads_list();
        git_heads_body(\@headslist, $head) if @headslist;

        git_footer_html();
}
5795
# 'remotes' action.  Serves two views: a single remote (when the 'hash'
# input parameter names one) and the list of all remotes (otherwise).
# Answers 403 when the 'remote_heads' feature is off, 500 when the remote
# information cannot be read, and 404 when nothing matches.
sub git_remotes {
        unless (gitweb_check_feature('remote_heads')) {
                die_error(403, "Remote heads view is disabled");
        }

        my $head_hash   = git_get_head_hash($project);
        my $remote      = $input_params{'hash'};
        my $remote_info = git_get_remotes_list($remote);

        if (!defined $remote_info) {
                die_error(500, "Unable to get remote information");
        }
        if (!%$remote_info) {
                my $message = defined $remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $message);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        # in the all-remotes view, 'remotes' is the current (unlinked) entry
        my $current_view = $remote ? '' : 'remotes';
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                format_ref_views($current_view));

        fill_remote_heads($remote_info);
        if (defined $remote) {
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remote_info->{$remote}, undef, $head_hash);
        } else {
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remote_info, undef, $head_hash);
        }

        git_footer_html();
}
5828
# 'blob_plain' (raw) action: send the contents of a blob verbatim.
#
# Parameters:
#   $type - optional content type to use; passed on to blob_contenttype(),
#           which produces the final Content-Type value.
#
# The blob is taken from the global $hash, or looked up from $file_name
# relative to $hash_base (or the project HEAD) when $hash is not set.
# Answers 400 without a file name or hash, 404 when the path cannot be
# resolved, and 500 when git-cat-file cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name ends up inside a quoted-string in an HTTP header: replace
        # control characters (as snapshot_name does) and backslash-escape
        # quotes and backslashes (as git_snapshot does).
        $save_as =~ s/[[:cntrl:]]/?/g;
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        # The content type may carry parameters such as "; charset=...", so
        # the safe types are matched up to a separator rather than to the end
        # of the string.
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and emit it as bytes, bypassing the :utf8 layer
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
5881
# 'blob' action: show a blob as an HTML page.
#
# The blob is taken from the global $hash, or looked up from $file_name
# relative to $hash_base (or the project HEAD) when $hash is not set.
# Content that is neither text nor one of a few image types and that tests
# as binary is handed over to git_blob_plain().  Images are embedded with an
# <img> tag pointing at the blob_plain view; everything else is printed line
# by line with line-number anchors, optionally through the highlighter.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        # $file_name is not set when the blob is addressed by hash alone,
        # so leave it out of the error message in that case
        my $blob_desc = defined $file_name ? "$file_name, $hash" : $hash;
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $blob_desc");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable commit context: print a bare title with the blob id
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                print qq! src="! .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        } else {
                # the link back to this page is the same for every line,
                # so build it once instead of once per line
                my $self_href = esc_attr(href(-replay => 1));
                my $nr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # highlighter output is printed as-is; raw lines are escaped here
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, $self_href, $nr, $nr, $syntax ? $line : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
5973
# 'tree' action: list the entries of a tree object as an HTML table.
#
# The tree is taken from the global $hash; when that is not set it is looked
# up from $file_name relative to $hash_base, or falls back to $hash_base
# itself ($hash_base defaults to "HEAD").  Answers 404 when no tree can be
# determined or git-ls-tree reports failure, 500 when it cannot be started.
sub git_tree {
        $hash_base = "HEAD" unless defined $hash_base;
        unless (defined $hash) {
                $hash = defined $file_name
                        ? git_get_hash_by_path($hash_base, $file_name, "tree")
                        : $hash_base;
        }
        defined($hash)
                or die_error(404, "No such tree");

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        # read NUL-terminated ls-tree records
        my @entries;
        {
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                while (my $record = <$fd>) {
                        chomp $record;
                        push @entries, $record;
                }
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav;
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history");
                        push @views_nav,
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                # FIXME: Should be available when we have no hash base as well.
                push @views_nav, $snapshot_links
                        if defined $snapshot_links;
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base is not a commit: drop it and show only the tree id
                undef $hash_base;
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                $basedir .= '/'
                        if ($basedir ne '' && substr($basedir, -1) ne '/');
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n" .
              "<table class=\"tree\">\n";

        # rows alternate between the "dark" and "light" classes
        my $alternate = 1;

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                # strip the last path component; the top level is undef
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                undef $up unless $up;

                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">',
                      $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              ".."),
                      "</td>\n",
                      "<td class=\"link\"></td>\n",
                      "</tr>\n";
        }

        for my $entry (@entries) {
                my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
6083
# Build the base name used for a snapshot of $hash in $project, in the form
# "<project>-<version>".
#
# Parameters:
#   $project - project path, e.g. "path/to/project.git"
#   $hash    - object name: hexadecimal id, refs/... name, or anything else
#
# Returns the name in scalar context, and the pair ($name, $name) in list
# context (the caller uses the second element as the archive prefix).
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s{([^/])/*\.git$}{$1};
        $name = basename($name);
        # control characters have no place in a file name
        $name =~ s{[[:cntrl:]]}{?}g;

        my $ver = $hash;
        if ($hash =~ m{^[0-9a-fA-F]+$}) {
                # hexadecimal id: shorten it when it is a long prefix of the full id
                my $full_hash = git_get_full_hash($project, $hash);
                $ver = git_get_short_hash($project, $hash)
                        if ($full_hash =~ m{^$hash} && length($hash) > 7);
        } elsif ($hash =~ m{^refs/tags/(.*)$}) {
                # tag name is descriptive enough on its own
                $ver = $1;
        } else {
                # branch (or anything else): name plus shortened id
                $ver = $1
                        if ($hash =~ m{^refs/(?:heads|remotes)/(.*)$});
                $ver .= '-' . git_get_short_hash($project, $hash);
        }
        # hierarchical names: turn path separators into dots
        $ver =~ s{/}{.}g;

        my $snapshot = "$name-$ver";
        return wantarray ? ($snapshot, $snapshot) : $snapshot;
}
6120
# 'snapshot' action: stream a git-archive of the object named by the global
# $hash, in the format selected by the 'snapshot_format' input parameter
# (defaulting to the first enabled format).
#
# Answers 403 when snapshots or the chosen format are not allowed, 400 for a
# malformed/unknown format or a blob, 404 for a missing object, and 500 when
# the archive command cannot be started.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # peel tags ("^{}") so that the type of the underlying object is checked
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the archive pipeline before any header is sent, so that a
        # failure here can still be reported with a proper error status.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # the name goes into a quoted-string: escape quotes and backslashes
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        # Copy the archive through in fixed-size chunks instead of reading
        # it all into memory first.
        binmode STDOUT, ':raw';
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6168
# Shared implementation of the paged commit-list views.
#
# Parameters:
#   $fmt_name  - view name, used for the page navigation and paging links
#   $body_subr - code reference that prints the list; called as
#                $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                             $file_name, $file_hash, $ftype)
#   $base      - commit to start from (defaults to the project HEAD)
#   $parent    - optional lower bound; the range becomes "$parent..$base"
#   $file_name - optional path to limit the history to
#   $file_hash - optional id of the object at that path
#
# Reads and may initialise the global $page.  Up to 101 commits are fetched
# for a page of 100, the extra one only signalling that a next page exists.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # Take the feature value in list context, as git_commitdiff does;
        # a plain scalar assignment would not reliably yield the configured
        # limit.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # a negative limit means "no limit"
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project);
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6242
# 'log' action: run the generic commit-list view with the 'log' body
# printer, starting at the global $hash and bounded by $hash_parent.
sub git_log {
        return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
6247
# 'commit' action: show one commit -- authorship, ids of the commit, its
# tree and its parents, the log message, and the list of changed files.
#
# The commit is taken from the global $hash, falling back to $hash_base and
# then "HEAD".  Answers 404 when it cannot be parsed or git-diff-tree reports
# failure, and 500 when git-diff-tree cannot be started.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
                or die_error(404, "Unknown commit object");

        my $parents = $co{'parents'}; # array reference
        my $parent  = $co{'parent'};

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav =
                        '(parent: ' .
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$parent)},
                                esc_html(substr($parent, 0, 7))) .
                        ')';
        } else {
                # merge commit
                my @parent_links = map {
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$_)},
                                esc_html(substr($_, 0, 7)));
                } @$parents;
                $formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # a root commit is diffed against nothing
        $parent = "--root" unless defined $parent;

        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        chomp(my @difftree = <$fd>);
        close $fd
                or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        # object header table: authorship, commit id, tree, parents
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";
        print "<tr><td>tree</td><td class=\"sha1\">" .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                       class => "list"}, $co{'tree'}) .
              "</td><td class=\"link\">" .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td></tr>\n";

        for my $par (@$parents) {
                print "<tr><td>parent</td><td class=\"sha1\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$par),
                               class => "list"}, $par) .
                      "</td><td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
                      "</td></tr>\n";
        }
        print "</table></div>\n";

        # log message
        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        # changed files
        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
6361
# 'object' action: work out the type of an object and redirect (302) to the
# view named after that type.
#
# The object is given either by the global $hash (or $hash_base alone), or
# by $hash_base together with $file_name.  Answers 404 when the object, the
# base, or the path does not exist, 400 when neither form is supplied, and
# 500 when git-ls-tree cannot be started.
sub git_object {
        # object is defined by:
        # - hash or hash_base alone
        # - hash_base and file_name
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                # goes through the shell so that git's complaint about an
                # unknown object can be discarded
                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                close $fd
                        or die_error(404, "Object does not exist");
                # nothing was printed: there is no type to redirect to
                defined $type
                        or die_error(404, "Object does not exist");
                chomp $type;

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
6408
# 'blobdiff' action: show the difference between two versions of one file.
#
# Parameters:
#   $format - 'html' (default) or 'plain'; anything else answers 400
#
# The versions are given by the globals $hash_parent_base and $hash_base
# together with either $file_name (optionally $file_parent) or the blob id
# in $hash.  Answers 404 when no matching change is found or the required
# parameters are missing, 400 when the specification is incomplete or
# matches more than one change, and 500 when git-diff-tree cannot be started.
sub git_blobdiff {
        my $format = shift || 'html';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status code, like every other die_error() call here
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # the name goes into a quoted-string: escape quotes and
                # backslashes, as git_snapshot does for its file name
                my $save_as = "$file_name.patch";
                $save_as =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $save_as . '"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # rewrite object ids in the diff header (everything up to and
                # including the "+++" line) into file names
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
6540
# 'blobdiff_plain' action: hand the request to git_blobdiff(), asking for
# its 'plain' output format.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
6544
# Show the changes introduced by a commit, or the diff between
# $hash_parent and $hash.
#
# Named arguments:
#   -format => 'html' (default), 'plain' or 'patch'
#   -single => when true and no parent is given, 'patch' output is limited
#              to a single patch ('-1')
#
# Works on the request globals $hash, $hash_base and $hash_parent ($hash and
# $hash_parent may be assigned defaults here).  Problems are reported through
# die_error(): 403 when the patch view is disabled, 404 for an unknown
# commit, 400 for an unknown format, 500 when the git command cannot be
# opened.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                # the "patch" link is offered only for non-merge commits
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of the commit's parents
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$hash_parent)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$co{'parent'})},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit: offer a link to the other combined-diff style
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$_)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                # consume only the raw part here; the patch part stays in $fd
                # and is read later when the patchset is printed
                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                #
                # NOTE(review): $hash_parent may be '--cc' (set above for merge
                # commits) or '-c' here, which would yield a "--cc..$hash"
                # range -- confirm whether merges should take the else branch.
                my @commit_spec = ();
                if ($hash_parent) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # (the list of tag refs used to be fetched here but was never
                # used; only the tag-based revision name is needed)
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                # mail-like preamble in front of the diff
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                # git-format-patch output carries its own headers and message,
                # so only the HTTP header is written here
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit parent commit (or for combined diffs)
                # the commit's own parents are passed on
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # slurp the remaining output in one go
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
6769
# 'commitdiff_plain' action: git_commitdiff() with -format set to 'plain'.
sub git_commitdiff_plain {
        my @args = (-format => 'plain');
        return git_commitdiff(@args);
}
6773
# format-patch-style patches

# 'patch' action: git_commitdiff() in 'patch' format with -single set.
sub git_patch {
        my @args = (-format => 'patch', -single => 1);
        return git_commitdiff(@args);
}
6778
# 'patches' action: git_commitdiff() in 'patch' format, without -single.
sub git_patches {
        my @args = (-format => 'patch');
        return git_commitdiff(@args);
}
6782
# 'history' action: delegate to git_log_generic() under the format name
# 'history', with git_history_body() as the body callback and the request
# globals $hash_base, $hash_parent_base, $file_name and $hash as arguments.
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
}
6788
# 'search' action: search the project and print the results as HTML.
#
# Driven by the request globals $searchtext, $searchtype (defaults to
# 'commit'), $search_use_regexp, $hash (defaults to the project's head hash)
# and $page (defaults to 0).  Search types:
#   commit / author / committer -- paged commit list filtered with
#                                  --grep= / --author= / --committer=
#   pickaxe                     -- "git log -S<text>", listing the files
#                                  reported for each commit
#   grep                        -- "git grep" over the tree of the commit
#
# Reports through die_error(): 403 when search (or the pickaxe / grep
# feature) is disabled, 400 when no search text was given, 404 when $hash
# does not name a commit.
sub git_search {
        gitweb_check_feature('search') or die_error(403, "Search is disabled");
        if (!defined $searchtext) {
                die_error(400, "Text field is empty");
        }
        if (!defined $hash) {
                $hash = git_get_head_hash($project);
        }
        my %co = parse_commit($hash);
        if (!%co) {
                die_error(404, "Unknown commit object");
        }
        if (!defined $page) {
                $page = 0;
        }

        $searchtype ||= 'commit';
        if ($searchtype eq 'pickaxe') {
                # pickaxe may take all resources of your box and run for several minutes
                # with every query - so decide by yourself how public you make this feature
                gitweb_check_feature('pickaxe')
                    or die_error(403, "Pickaxe is disabled");
        }
        if ($searchtype eq 'grep') {
                gitweb_check_feature('grep')
                    or die_error(403, "Grep is disabled");
        }

        git_header_html();

        if ($searchtype eq 'commit' or $searchtype eq 'author' or $searchtype eq 'committer') {
                # option prefix used for each of the commit-log search types
                my %grep_option_for = (
                        'commit'    => "--grep=",
                        'author'    => "--author=",
                        'committer' => "--committer=",
                );
                my $greptype = $grep_option_for{$searchtype} . $searchtext;
                # ask for one commit more than a page holds (101 vs 100), so
                # that we can tell whether there is a next page
                my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                               $greptype, '--regexp-ignore-case',
                                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

                my $paging_nav = '';
                if ($page > 0) {
                        $paging_nav .=
                                $cgi->a({-href => href(action=>"search", hash=>$hash,
                                                       searchtext=>$searchtext,
                                                       searchtype=>$searchtype)},
                                        "first");
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                } else {
                        $paging_nav .= "first";
                        $paging_nav .= " &sdot; prev";
                }
                my $next_link = '';
                if ($#commitlist >= 100) {
                        $next_link =
                                $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                         -accesskey => "n", -title => "Alt-n"}, "next");
                        $paging_nav .= " &sdot; $next_link";
                } else {
                        $paging_nav .= " &sdot; next";
                }

                git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);
                if ($page == 0 && !@commitlist) {
                        print "<p>No match.</p>\n";
                } else {
                        git_search_grep_body(\@commitlist, 0, 99, $next_link);
                }
        }

        if ($searchtype eq 'pickaxe') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"pickaxe search\">\n";
                my $alternate = 1;
                local $/ = "\n";
                # NOTE(review): the result of this open is not checked
                open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                        '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                        ($search_use_regexp ? '--pickaxe-regex' : ());
                # from here on %co holds the commit whose row is being printed
                undef %co;

                # close the file-list cell and the row of the commit in %co,
                # adding its "commit | tree" links; no-op while %co is empty
                my $finish_commit = sub {
                        return unless %co;
                        print "</td>\n" .
                              "<td class=\"link\">" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                              " | " .
                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                        print "</td>\n" .
                              "</tr>\n";
                };

                while (my $line = <$fd>) {
                        chomp $line;
                        next unless $line;

                        my %set = parse_difftree_raw_line($line);
                        if (defined $set{'commit'}) {
                                # a commit id line starts a new row
                                $finish_commit->();

                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                %co = parse_commit($set{'commit'});
                                my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                                      "<td><i>$author</i></td>\n" .
                                      "<td>" .
                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                              -class => "list subject"},
                                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        } elsif (defined $set{'to_id'}) {
                                # skip entries whose resulting blob id is all zeros
                                next if ($set{'to_id'} =~ m/^0{40}$/);

                                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                              -class => "list"},
                                              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                                      "<br/>\n";
                        }
                }
                close $fd;

                # finish last commit
                $finish_commit->();

                print "</table>\n";
        }

        if ($searchtype eq 'grep') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"grep_search\">\n";
                my $alternate = 1;
                my $matches = 0;
                local $/ = "\n";
                # NOTE(review): the result of this open is not checked
                open my $fd, "-|", git_cmd(), 'grep', '-n',
                        $search_use_regexp ? ('-E', '-i') : '-F',
                        $searchtext, $co{'tree'};
                my $lastfile = '';
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($file, $lno, $ltext, $binary);
                        last if ($matches++ > 1000);
                        if ($line =~ /^Binary file (.+) matches$/) {
                                $file = $1;
                                # the text branch below discards a leading
                                # "<tree>:" field; drop the same prefix here
                                # (if present) so the name is a plain path
                                $file =~ s/^\Q$co{'tree'}\E://;
                                $binary = 1;
                        } else {
                                # <tree>:<file>:<line number>:<matching line>
                                (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
                        }
                        # blob link: the file is addressed by its path within
                        # the searched commit
                        my $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                             file_name=>"$file");
                        if ($file ne $lastfile) {
                                # new file: close the previous row, open the next one
                                $lastfile and print "</td></tr>\n";
                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                print "<td class=\"list\">".
                                        $cgi->a({-href => $file_href,
                                                -class => "list"}, esc_path($file));
                                print "</td><td>\n";
                                $lastfile = $file;
                        }
                        if ($binary) {
                                print "<div class=\"binary\">Binary file</div>\n";
                        } else {
                                $ltext = untabify($ltext);
                                # highlight the matched part of the line, if it
                                # can be located with $search_regexp
                                if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                        $ltext = esc_html($1, -nbsp=>1);
                                        $ltext .= '<span class="match">';
                                        $ltext .= esc_html($2, -nbsp=>1);
                                        $ltext .= '</span>';
                                        $ltext .= esc_html($3, -nbsp=>1);
                                } else {
                                        $ltext = esc_html($ltext, -nbsp=>1);
                                }
                                print "<div class=\"pre\">" .
                                        $cgi->a({-href => $file_href.'#l'.$lno,
                                                -class => "linenr"}, sprintf('%4i', $lno))
                                        . ' ' .  $ltext . "</div>\n";
                        }
                }
                if ($lastfile) {
                        print "</td></tr>\n";
                        if ($matches > 1000) {
                                print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                        }
                } else {
                        print "<div class=\"diff nodifferences\">No matches found</div>\n";
                }
                close $fd;

                print "</table>\n";
        }
        git_footer_html();
}
7005
# 'search_help' action: print an HTML page describing the search types.
# The "commit", "author" and "committer" entries are always printed; the
# "grep" and "pickaxe" entries only when gitweb_check_feature() reports the
# respective feature as enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general notes on patterns, followed by the "commit" entry
        print <<HELP;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP

        if (gitweb_check_feature('grep')) {
                print <<HELP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP
        }

        print <<HELP;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP

        if (gitweb_check_feature('pickaxe')) {
                print <<HELP;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP
        }

        print "</dl>\n";
        git_footer_html();
}
7049
# 'shortlog' action: delegate to git_log_generic() under the format name
# 'shortlog', with git_shortlog_body() as the body callback and the request
# globals $hash and $hash_parent as arguments.
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
7054
7055## ......................................................................
7056## feeds (RSS, Atom; OPML)
7057
7058sub git_feed {
7059        my $format = shift || 'atom';
7060        my $have_blame = gitweb_check_feature('blame');
7061
7062        # Atom: http://www.atomenabled.org/developers/syndication/
7063        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
7064        if ($format ne 'rss' && $format ne 'atom') {
7065                die_error(400, "Unknown web feed format");
7066        }
7067
7068        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
7069        my $head = $hash || 'HEAD';
7070        my @commitlist = parse_commits($head, 150, 0, $file_name);
7071
7072        my %latest_commit;
7073        my %latest_date;
7074        my $content_type = "application/$format+xml";
7075        if (defined $cgi->http('HTTP_ACCEPT') &&
7076                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
7077                # browser (feed reader) prefers text/xml
7078                $content_type = 'text/xml';
7079        }
7080        if (defined($commitlist[0])) {
7081                %latest_commit = %{$commitlist[0]};
7082                my $latest_epoch = $latest_commit{'committer_epoch'};
7083                %latest_date   = parse_date($latest_epoch, $latest_commit{'comitter_tz'});
7084                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
7085                if (defined $if_modified) {
7086                        my $since;
7087                        if (eval { require HTTP::Date; 1; }) {
7088                                $since = HTTP::Date::str2time($if_modified);
7089                        } elsif (eval { require Time::ParseDate; 1; }) {
7090                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
7091                        }
7092                        if (defined $since && $latest_epoch <= $since) {
7093                                print $cgi->header(
7094                                        -type => $content_type,
7095                                        -charset => 'utf-8',
7096                                        -last_modified => $latest_date{'rfc2822'},
7097                                        -status => '304 Not Modified');
7098                                return;
7099                        }
7100                }
7101                print $cgi->header(
7102                        -type => $content_type,
7103                        -charset => 'utf-8',
7104                        -last_modified => $latest_date{'rfc2822'});
7105        } else {
7106                print $cgi->header(
7107                        -type => $content_type,
7108                        -charset => 'utf-8');
7109        }
7110
7111        # Optimization: skip generating the body if client asks only
7112        # for Last-Modified date.
7113        return if ($cgi->request_method() eq 'HEAD');
7114
7115        # header variables
7116        my $title = "$site_name - $project/$action";
7117        my $feed_type = 'log';
7118        if (defined $hash) {
7119                $title .= " - '$hash'";
7120                $feed_type = 'branch log';
7121                if (defined $file_name) {
7122                        $title .= " :: $file_name";
7123                        $feed_type = 'history';
7124                }
7125        } elsif (defined $file_name) {
7126                $title .= " - $file_name";
7127                $feed_type = 'history';
7128        }
7129        $title .= " $feed_type";
7130        my $descr = git_get_project_description($project);
7131        if (defined $descr) {
7132                $descr = esc_html($descr);
7133        } else {
7134                $descr = "$project " .
7135                         ($format eq 'rss' ? 'RSS' : 'Atom') .
7136                         " feed";
7137        }
7138        my $owner = git_get_project_owner($project);
7139        $owner = esc_html($owner);
7140
7141        #header
7142        my $alt_url;
7143        if (defined $file_name) {
7144                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
7145        } elsif (defined $hash) {
7146                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
7147        } else {
7148                $alt_url = href(-full=>1, action=>"summary");
7149        }
7150        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
7151        if ($format eq 'rss') {
7152                print <<XML;
7153<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
7154<channel>
7155XML
7156                print "<title>$title</title>\n" .
7157                      "<link>$alt_url</link>\n" .
7158                      "<description>$descr</description>\n" .
7159                      "<language>en</language>\n" .
7160                      # project owner is responsible for 'editorial' content
7161                      "<managingEditor>$owner</managingEditor>\n";
7162                if (defined $logo || defined $favicon) {
7163                        # prefer the logo to the favicon, since RSS
7164                        # doesn't allow both
7165                        my $img = esc_url($logo || $favicon);
7166                        print "<image>\n" .
7167                              "<url>$img</url>\n" .
7168                              "<title>$title</title>\n" .
7169                              "<link>$alt_url</link>\n" .
7170                              "</image>\n";
7171                }
7172                if (%latest_date) {
7173                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
7174                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
7175                }
7176                print "<generator>gitweb v.$version/$git_version</generator>\n";
7177        } elsif ($format eq 'atom') {
7178                print <<XML;
7179<feed xmlns="http://www.w3.org/2005/Atom">
7180XML
7181                print "<title>$title</title>\n" .
7182                      "<subtitle>$descr</subtitle>\n" .
7183                      '<link rel="alternate" type="text/html" href="' .
7184                      $alt_url . '" />' . "\n" .
7185                      '<link rel="self" type="' . $content_type . '" href="' .
7186                      $cgi->self_url() . '" />' . "\n" .
7187                      "<id>" . href(-full=>1) . "</id>\n" .
7188                      # use project owner for feed author
7189                      "<author><name>$owner</name></author>\n";
7190                if (defined $favicon) {
7191                        print "<icon>" . esc_url($favicon) . "</icon>\n";
7192                }
7193                if (defined $logo) {
7194                        # not twice as wide as tall: 72 x 27 pixels
7195                        print "<logo>" . esc_url($logo) . "</logo>\n";
7196                }
7197                if (! %latest_date) {
7198                        # dummy date to keep the feed valid until commits trickle in:
7199                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
7200                } else {
7201                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
7202                }
7203                print "<generator version='$version/$git_version'>gitweb</generator>\n";
7204        }
7205
7206        # contents
7207        for (my $i = 0; $i <= $#commitlist; $i++) {
7208                my %co = %{$commitlist[$i]};
7209                my $commit = $co{'id'};
7210                # we read 150, we always show 30 and the ones more recent than 48 hours
7211                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
7212                        last;
7213                }
7214                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});
7215
7216                # get list of changed files
7217                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7218                        $co{'parent'} || "--root",
7219                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
7220                        or next;
7221                my @difftree = map { chomp; $_ } <$fd>;
7222                close $fd
7223                        or next;
7224
7225                # print element (entry, item)
7226                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
7227                if ($format eq 'rss') {
7228                        print "<item>\n" .
7229                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
7230                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
7231                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
7232                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
7233                              "<link>$co_url</link>\n" .
7234                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
7235                              "<content:encoded>" .
7236                              "<![CDATA[\n";
7237                } elsif ($format eq 'atom') {
7238                        print "<entry>\n" .
7239                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
7240                              "<updated>$cd{'iso-8601'}</updated>\n" .
7241                              "<author>\n" .
7242                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
7243                        if ($co{'author_email'}) {
7244                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
7245                        }
7246                        print "</author>\n" .
7247                              # use committer for contributor
7248                              "<contributor>\n" .
7249                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
7250                        if ($co{'committer_email'}) {
7251                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
7252                        }
7253                        print "</contributor>\n" .
7254                              "<published>$cd{'iso-8601'}</published>\n" .
7255                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
7256                              "<id>$co_url</id>\n" .
7257                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
7258                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
7259                }
7260                my $comment = $co{'comment'};
7261                print "<pre>\n";
7262                foreach my $line (@$comment) {
7263                        $line = esc_html($line);
7264                        print "$line\n";
7265                }
7266                print "</pre><ul>\n";
7267                foreach my $difftree_line (@difftree) {
7268                        my %difftree = parse_difftree_raw_line($difftree_line);
7269                        next if !$difftree{'from_id'};
7270
7271                        my $file = $difftree{'file'} || $difftree{'to_file'};
7272
7273                        print "<li>" .
7274                              "[" .
7275                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
7276                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
7277                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
7278                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
7279                                      -title => "diff"}, 'D');
7280                        if ($have_blame) {
7281                                print $cgi->a({-href => href(-full=>1, action=>"blame",
7282                                                             file_name=>$file, hash_base=>$commit),
7283                                              -title => "blame"}, 'B');
7284                        }
7285                        # if this is not a feed of a file history
7286                        if (!defined $file_name || $file_name ne $file) {
7287                                print $cgi->a({-href => href(-full=>1, action=>"history",
7288                                                             file_name=>$file, hash=>$commit),
7289                                              -title => "history"}, 'H');
7290                        }
7291                        $file = esc_path($file);
7292                        print "] ".
7293                              "$file</li>\n";
7294                }
7295                if ($format eq 'rss') {
7296                        print "</ul>]]>\n" .
7297                              "</content:encoded>\n" .
7298                              "</item>\n";
7299                } elsif ($format eq 'atom') {
7300                        print "</ul>\n</div>\n" .
7301                              "</content>\n" .
7302                              "</entry>\n";
7303                }
7304        }
7305
7306        # end of feed
7307        if ($format eq 'rss') {
7308                print "</channel>\n</rss>\n";
7309        } elsif ($format eq 'atom') {
7310                print "</feed>\n";
7311        }
7312}
7313
# Thin wrapper: produce the feed in RSS 2.0 form by delegating to
# git_feed() with the 'rss' format selector.
sub git_rss {
        my $feed_format = 'rss';
        return git_feed($feed_format);
}
7317
# Thin wrapper: produce the feed in Atom form by delegating to
# git_feed() with the 'atom' format selector.
sub git_atom {
        my $feed_format = 'atom';
        return git_feed($feed_format);
}
7321
# Print an OPML 1.0 document (HTTP header included) that contains one
# RSS <outline> entry for each project returned by git_get_projects_list().
#
# A project is left out when git_get_head_hash() yields no HEAD for it,
# or when parse_commit() returns nothing for that HEAD.
#
# Side effect: $git_dir (declared outside this sub) is assigned for every
# project whose HEAD was found, and is not restored afterwards.
sub git_opml {
        my @list = git_get_projects_list();

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        # The site name is free-form text: escape it so that characters such
        # as '&' or '<' cannot make the generated XML ill-formed (the project
        # path below is escaped the same way).
        my $title = esc_html($site_name);

        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;
                my $head = git_get_head_hash($proj{'path'});
                if (!defined $head) {
                        next;
                }
                # parse_commit() is called right after this assignment;
                # presumably it reads $git_dir to locate the repository
                # (its body is not visible here -- verify before reordering).
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                if (!%co) {
                        next;
                }

                # shortened, escaped project path used as the outline label
                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}