ecd4a39d22768c5ac7a577ae43928d3aea28867f
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
  23our $t0 = [ gettimeofday() ];
  24our $number_of_git_cmds = 0;
  25
  26BEGIN {
  27        CGI->compile() if $ENV{'MOD_PERL'};
  28}
  29
  30our $version = "++GIT_VERSION++";
  31
  32our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  33sub evaluate_uri {
  34        our $cgi;
  35
  36        our $my_url = $cgi->url();
  37        our $my_uri = $cgi->url(-absolute => 1);
  38
  39        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  40        # needed and used only for URLs with nonempty PATH_INFO
  41        our $base_url = $my_url;
  42
  43        # When the script is used as DirectoryIndex, the URL does not contain the name
  44        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  45        # have to do it ourselves. We make $path_info global because it's also used
  46        # later on.
  47        #
  48        # Another issue with the script being the DirectoryIndex is that the resulting
  49        # $my_url data is not the full script URL: this is good, because we want
  50        # generated links to keep implying the script name if it wasn't explicitly
  51        # indicated in the URL we're handling, but it means that $my_url cannot be used
  52        # as base URL.
  53        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  54        # to build the base URL ourselves:
  55        our $path_info = $ENV{"PATH_INFO"};
  56        if ($path_info) {
  57                if ($my_url =~ s,\Q$path_info\E$,, &&
  58                    $my_uri =~ s,\Q$path_info\E$,, &&
  59                    defined $ENV{'SCRIPT_NAME'}) {
  60                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  61                }
  62        }
  63
  64        # target of the home link on top of all pages
  65        our $home_link = $my_uri || "/";
  66}
  67
  68# core git executable to use
  69# this can just be "git" if your webserver has a sensible PATH
  70our $GIT = "++GIT_BINDIR++/git";
  71
  72# absolute fs-path which will be prepended to the project path
  73#our $projectroot = "/pub/scm";
  74our $projectroot = "++GITWEB_PROJECTROOT++";
  75
  76# fs traversing limit for getting project list
  77# the number is relative to the projectroot
  78our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  79
  80# string of the home link on top of all pages
  81our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  82
  83# name of your site or organization to appear in page titles
  84# replace this with something more descriptive for clearer bookmarks
  85our $site_name = "++GITWEB_SITENAME++"
  86                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  87
  88# html snippet to include in the <head> section of each page
  89our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
  90# filename of html text to include at top of each page
  91our $site_header = "++GITWEB_SITE_HEADER++";
  92# html text to include at home page
  93our $home_text = "++GITWEB_HOMETEXT++";
  94# filename of html text to include at bottom of each page
  95our $site_footer = "++GITWEB_SITE_FOOTER++";
  96
  97# URI of stylesheets
  98our @stylesheets = ("++GITWEB_CSS++");
  99# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 100our $stylesheet = undef;
 101# URI of GIT logo (72x27 size)
 102our $logo = "++GITWEB_LOGO++";
 103# URI of GIT favicon, assumed to be image/png type
 104our $favicon = "++GITWEB_FAVICON++";
 105# URI of gitweb.js (JavaScript code for gitweb)
 106our $javascript = "++GITWEB_JS++";
 107
 108# URI and label (title) of GIT logo link
 109#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 110#our $logo_label = "git documentation";
 111our $logo_url = "http://git-scm.com/";
 112our $logo_label = "git homepage";
 113
 114# source of projects list
 115our $projects_list = "++GITWEB_LIST++";
 116
 117# the width (in characters) of the projects list "Description" column
 118our $projects_list_description_width = 25;
 119
 120# group projects by category on the projects list
 121# (enabled if this variable evaluates to true)
 122our $projects_list_group_categories = 0;
 123
 124# default category if none specified
 125# (leave the empty string for no category)
 126our $project_list_default_category = "";
 127
 128# default order of projects list
 129# valid values are none, project, descr, owner, and age
 130our $default_projects_order = "project";
 131
 132# show repository only if this file exists
 133# (only effective if this variable evaluates to true)
 134our $export_ok = "++GITWEB_EXPORT_OK++";
 135
 136# show repository only if this subroutine returns true
 137# when given the path to the project, for example:
 138#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 139our $export_auth_hook = undef;
 140
 141# only allow viewing of repositories also shown on the overview page
 142our $strict_export = "++GITWEB_STRICT_EXPORT++";
 143
 144# list of git base URLs used for URL to where fetch project from,
 145# i.e. full URL is "$git_base_url/$project"
 146our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 147
 148# default blob_plain mimetype and default charset for text/plain blob
 149our $default_blob_plain_mimetype = 'text/plain';
 150our $default_text_plain_charset  = undef;
 151
 152# file to use for guessing MIME types before trying /etc/mime.types
 153# (relative to the current git repository)
 154our $mimetypes_file = undef;
 155
 156# assume this charset if line contains non-UTF-8 characters;
 157# it should be valid encoding (see Encoding::Supported(3pm) for list),
 158# for which encoding all byte sequences are valid, for example
 159# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 160# could be even 'utf-8' for the old behavior)
 161our $fallback_encoding = 'latin1';
 162
 163# rename detection options for git-diff and git-diff-tree
 164# - default is '-M', with the cost proportional to
 165#   (number of removed files) * (number of new files).
 166# - more costly is '-C' (which implies '-M'), with the cost proportional to
 167#   (number of changed files + number of removed files) * (number of new files)
 168# - even more costly is '-C', '--find-copies-harder' with cost
 169#   (number of files in the original tree) * (number of new files)
 170# - one might want to include '-B' option, e.g. '-B', '-M'
 171our @diff_opts = ('-M'); # taken from git_commit
 172
 173# Disables features that would allow repository owners to inject script into
 174# the gitweb domain.
 175our $prevent_xss = 0;
 176
 177# Path to the highlight executable to use (must be the one from
 178# http://www.andre-simon.de due to assumptions about parameters and output).
 179# Useful if highlight is not installed on your webserver's PATH.
 180# [Default: highlight]
 181our $highlight_bin = "++HIGHLIGHT_BIN++";
 182
 183# information about snapshot formats that gitweb is capable of serving
 184our %known_snapshot_formats = (
 185        # name => {
 186        #       'display' => display name,
 187        #       'type' => mime type,
 188        #       'suffix' => filename suffix,
 189        #       'format' => --format for git-archive,
 190        #       'compressor' => [compressor command and arguments]
 191        #                       (array reference, optional)
 192        #       'disabled' => boolean (optional)}
 193        #
 194        'tgz' => {
 195                'display' => 'tar.gz',
 196                'type' => 'application/x-gzip',
 197                'suffix' => '.tar.gz',
 198                'format' => 'tar',
 199                'compressor' => ['gzip', '-n']},
 200
 201        'tbz2' => {
 202                'display' => 'tar.bz2',
 203                'type' => 'application/x-bzip2',
 204                'suffix' => '.tar.bz2',
 205                'format' => 'tar',
 206                'compressor' => ['bzip2']},
 207
 208        'txz' => {
 209                'display' => 'tar.xz',
 210                'type' => 'application/x-xz',
 211                'suffix' => '.tar.xz',
 212                'format' => 'tar',
 213                'compressor' => ['xz'],
 214                'disabled' => 1},
 215
 216        'zip' => {
 217                'display' => 'zip',
 218                'type' => 'application/x-zip',
 219                'suffix' => '.zip',
 220                'format' => 'zip'},
 221);
 222
 223# Aliases so we understand old gitweb.snapshot values in repository
 224# configuration.
 225our %known_snapshot_format_aliases = (
 226        'gzip'  => 'tgz',
 227        'bzip2' => 'tbz2',
 228        'xz'    => 'txz',
 229
 230        # backward compatibility: legacy gitweb config support
 231        'x-gzip' => undef, 'gz' => undef,
 232        'x-bzip2' => undef, 'bz2' => undef,
 233        'x-zip' => undef, '' => undef,
 234);
 235
 236# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 237# are changed, it may be appropriate to change these values too via
 238# $GITWEB_CONFIG.
 239our %avatar_size = (
 240        'default' => 16,
 241        'double'  => 32
 242);
 243
 244# Used to set the maximum load that we will still respond to gitweb queries.
 245# If server load exceed this value then return "503 server busy" error.
 246# If gitweb cannot determined server load, it is taken to be 0.
 247# Leave it undefined (or set to 'undef') to turn off load checking.
 248our $maxload = 300;
 249
 250# configuration for 'highlight' (http://www.andre-simon.de/)
 251# match by basename
 252our %highlight_basename = (
 253        #'Program' => 'py',
 254        #'Library' => 'py',
 255        'SConstruct' => 'py', # SCons equivalent of Makefile
 256        'Makefile' => 'make',
 257);
 258# match by extension
 259our %highlight_ext = (
 260        # main extensions, defining name of syntax;
 261        # see files in /usr/share/highlight/langDefs/ directory
 262        map { $_ => $_ }
 263                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
 264        # alternate extensions, see /etc/highlight/filetypes.conf
 265        'h' => 'c',
 266        map { $_ => 'sh'  } qw(bash zsh ksh),
 267        map { $_ => 'cpp' } qw(cxx c++ cc),
 268        map { $_ => 'php' } qw(php3 php4 php5 phps),
 269        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
 270        map { $_ => 'make'} qw(mak mk),
 271        map { $_ => 'xml' } qw(xhtml html htm),
 272);
 273
 274# You define site-wide feature defaults here; override them with
 275# $GITWEB_CONFIG as necessary.
 276our %feature = (
 277        # feature => {
 278        #       'sub' => feature-sub (subroutine),
 279        #       'override' => allow-override (boolean),
 280        #       'default' => [ default options...] (array reference)}
 281        #
 282        # if feature is overridable (it means that allow-override has true value),
 283        # then feature-sub will be called with default options as parameters;
 284        # return value of feature-sub indicates if to enable specified feature
 285        #
 286        # if there is no 'sub' key (no feature-sub), then feature cannot be
 287        # overridden
 288        #
 289        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 290        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 291        # is enabled
 292
 293        # Enable the 'blame' blob view, showing the last commit that modified
 294        # each line in the file. This can be very CPU-intensive.
 295
 296        # To enable system wide have in $GITWEB_CONFIG
 297        # $feature{'blame'}{'default'} = [1];
 298        # To have project specific config enable override in $GITWEB_CONFIG
 299        # $feature{'blame'}{'override'} = 1;
 300        # and in project config gitweb.blame = 0|1;
 301        'blame' => {
 302                'sub' => sub { feature_bool('blame', @_) },
 303                'override' => 0,
 304                'default' => [0]},
 305
 306        # Enable the 'snapshot' link, providing a compressed archive of any
 307        # tree. This can potentially generate high traffic if you have large
 308        # project.
 309
 310        # Value is a list of formats defined in %known_snapshot_formats that
 311        # you wish to offer.
 312        # To disable system wide have in $GITWEB_CONFIG
 313        # $feature{'snapshot'}{'default'} = [];
 314        # To have project specific config enable override in $GITWEB_CONFIG
 315        # $feature{'snapshot'}{'override'} = 1;
 316        # and in project config, a comma-separated list of formats or "none"
 317        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 318        'snapshot' => {
 319                'sub' => \&feature_snapshot,
 320                'override' => 0,
 321                'default' => ['tgz']},
 322
 323        # Enable text search, which will list the commits which match author,
 324        # committer or commit text to a given string.  Enabled by default.
 325        # Project specific override is not supported.
 326        #
 327        # Note that this controls all search features, which means that if
 328        # it is disabled, then 'grep' and 'pickaxe' search would also be
 329        # disabled.
 330        'search' => {
 331                'override' => 0,
 332                'default' => [1]},
 333
 334        # Enable grep search, which will list the files in currently selected
 335        # tree containing the given string. Enabled by default. This can be
 336        # potentially CPU-intensive, of course.
 337        # Note that you need to have 'search' feature enabled too.
 338
 339        # To enable system wide have in $GITWEB_CONFIG
 340        # $feature{'grep'}{'default'} = [1];
 341        # To have project specific config enable override in $GITWEB_CONFIG
 342        # $feature{'grep'}{'override'} = 1;
 343        # and in project config gitweb.grep = 0|1;
 344        'grep' => {
 345                'sub' => sub { feature_bool('grep', @_) },
 346                'override' => 0,
 347                'default' => [1]},
 348
 349        # Enable the pickaxe search, which will list the commits that modified
 350        # a given string in a file. This can be practical and quite faster
 351        # alternative to 'blame', but still potentially CPU-intensive.
 352        # Note that you need to have 'search' feature enabled too.
 353
 354        # To enable system wide have in $GITWEB_CONFIG
 355        # $feature{'pickaxe'}{'default'} = [1];
 356        # To have project specific config enable override in $GITWEB_CONFIG
 357        # $feature{'pickaxe'}{'override'} = 1;
 358        # and in project config gitweb.pickaxe = 0|1;
 359        'pickaxe' => {
 360                'sub' => sub { feature_bool('pickaxe', @_) },
 361                'override' => 0,
 362                'default' => [1]},
 363
 364        # Enable showing size of blobs in a 'tree' view, in a separate
 365        # column, similar to what 'ls -l' does.  This cost a bit of IO.
 366
 367        # To disable system wide have in $GITWEB_CONFIG
 368        # $feature{'show-sizes'}{'default'} = [0];
 369        # To have project specific config enable override in $GITWEB_CONFIG
 370        # $feature{'show-sizes'}{'override'} = 1;
 371        # and in project config gitweb.showsizes = 0|1;
 372        'show-sizes' => {
 373                'sub' => sub { feature_bool('showsizes', @_) },
 374                'override' => 0,
 375                'default' => [1]},
 376
 377        # Make gitweb use an alternative format of the URLs which can be
 378        # more readable and natural-looking: project name is embedded
 379        # directly in the path and the query string contains other
 380        # auxiliary information. All gitweb installations recognize
 381        # URL in either format; this configures in which formats gitweb
 382        # generates links.
 383
 384        # To enable system wide have in $GITWEB_CONFIG
 385        # $feature{'pathinfo'}{'default'} = [1];
 386        # Project specific override is not supported.
 387
 388        # Note that you will need to change the default location of CSS,
 389        # favicon, logo and possibly other files to an absolute URL. Also,
 390        # if gitweb.cgi serves as your indexfile, you will need to force
 391        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 392        'pathinfo' => {
 393                'override' => 0,
 394                'default' => [0]},
 395
 396        # Make gitweb consider projects in project root subdirectories
 397        # to be forks of existing projects. Given project $projname.git,
 398        # projects matching $projname/*.git will not be shown in the main
 399        # projects list, instead a '+' mark will be added to $projname
 400        # there and a 'forks' view will be enabled for the project, listing
 401        # all the forks. If project list is taken from a file, forks have
 402        # to be listed after the main project.
 403
 404        # To enable system wide have in $GITWEB_CONFIG
 405        # $feature{'forks'}{'default'} = [1];
 406        # Project specific override is not supported.
 407        'forks' => {
 408                'override' => 0,
 409                'default' => [0]},
 410
 411        # Insert custom links to the action bar of all project pages.
 412        # This enables you mainly to link to third-party scripts integrating
 413        # into gitweb; e.g. git-browser for graphical history representation
 414        # or custom web-based repository administration interface.
 415
 416        # The 'default' value consists of a list of triplets in the form
 417        # (label, link, position) where position is the label after which
 418        # to insert the link and link is a format string where %n expands
 419        # to the project name, %f to the project path within the filesystem,
 420        # %h to the current hash (h gitweb parameter) and %b to the current
 421        # hash base (hb gitweb parameter); %% expands to %.
 422
 423        # To enable system wide have in $GITWEB_CONFIG e.g.
 424        # $feature{'actions'}{'default'} = [('graphiclog',
 425        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 426        # Project specific override is not supported.
 427        'actions' => {
 428                'override' => 0,
 429                'default' => []},
 430
 431        # Allow gitweb scan project content tags of project repository,
 432        # and display the popular Web 2.0-ish "tag cloud" near the projects
 433        # list.  Note that this is something COMPLETELY different from the
 434        # normal Git tags.
 435
 436        # gitweb by itself can show existing tags, but it does not handle
 437        # tagging itself; you need to do it externally, outside gitweb.
 438        # The format is described in git_get_project_ctags() subroutine.
 439        # You may want to install the HTML::TagCloud Perl module to get
 440        # a pretty tag cloud instead of just a list of tags.
 441
 442        # To enable system wide have in $GITWEB_CONFIG
 443        # $feature{'ctags'}{'default'} = [1];
 444        # Project specific override is not supported.
 445
 446        # In the future whether ctags editing is enabled might depend
 447        # on the value, but using 1 should always mean no editing of ctags.
 448        'ctags' => {
 449                'override' => 0,
 450                'default' => [0]},
 451
 452        # The maximum number of patches in a patchset generated in patch
 453        # view. Set this to 0 or undef to disable patch view, or to a
 454        # negative number to remove any limit.
 455
 456        # To disable system wide have in $GITWEB_CONFIG
 457        # $feature{'patches'}{'default'} = [0];
 458        # To have project specific config enable override in $GITWEB_CONFIG
 459        # $feature{'patches'}{'override'} = 1;
 460        # and in project config gitweb.patches = 0|n;
 461        # where n is the maximum number of patches allowed in a patchset.
 462        'patches' => {
 463                'sub' => \&feature_patches,
 464                'override' => 0,
 465                'default' => [16]},
 466
 467        # Avatar support. When this feature is enabled, views such as
 468        # shortlog or commit will display an avatar associated with
 469        # the email of the committer(s) and/or author(s).
 470
 471        # Currently available providers are gravatar and picon.
 472        # If an unknown provider is specified, the feature is disabled.
 473
 474        # Gravatar depends on Digest::MD5.
 475        # Picon currently relies on the indiana.edu database.
 476
 477        # To enable system wide have in $GITWEB_CONFIG
 478        # $feature{'avatar'}{'default'} = ['<provider>'];
 479        # where <provider> is either gravatar or picon.
 480        # To have project specific config enable override in $GITWEB_CONFIG
 481        # $feature{'avatar'}{'override'} = 1;
 482        # and in project config gitweb.avatar = <provider>;
 483        'avatar' => {
 484                'sub' => \&feature_avatar,
 485                'override' => 0,
 486                'default' => ['']},
 487
 488        # Enable displaying how much time and how many git commands
 489        # it took to generate and display page.  Disabled by default.
 490        # Project specific override is not supported.
 491        'timed' => {
 492                'override' => 0,
 493                'default' => [0]},
 494
 495        # Enable turning some links into links to actions which require
 496        # JavaScript to run (like 'blame_incremental').  Not enabled by
 497        # default.  Project specific override is currently not supported.
 498        'javascript-actions' => {
 499                'override' => 0,
 500                'default' => [0]},
 501
 502        # Enable and configure ability to change common timezone for dates
 503        # in gitweb output via JavaScript.  Enabled by default.
 504        # Project specific override is not supported.
 505        'javascript-timezone' => {
 506                'override' => 0,
 507                'default' => [
 508                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 509                                     # or undef to turn off this feature
 510                        'gitweb_tz', # name of cookie where to store selected timezone
 511                        'datetime',  # CSS class used to mark up dates for manipulation
 512                ]},
 513
 514        # Syntax highlighting support. This is based on Daniel Svensson's
 515        # and Sham Chukoury's work in gitweb-xmms2.git.
 516        # It requires the 'highlight' program present in $PATH,
 517        # and therefore is disabled by default.
 518
 519        # To enable system wide have in $GITWEB_CONFIG
 520        # $feature{'highlight'}{'default'} = [1];
 521
 522        'highlight' => {
 523                'sub' => sub { feature_bool('highlight', @_) },
 524                'override' => 0,
 525                'default' => [0]},
 526
 527        # Enable displaying of remote heads in the heads list
 528
 529        # To enable system wide have in $GITWEB_CONFIG
 530        # $feature{'remote_heads'}{'default'} = [1];
 531        # To have project specific config enable override in $GITWEB_CONFIG
 532        # $feature{'remote_heads'}{'override'} = 1;
 533        # and in project config gitweb.remote_heads = 0|1;
 534        'remote_heads' => {
 535                'sub' => sub { feature_bool('remote_heads', @_) },
 536                'override' => 0,
 537                'default' => [0]},
 538);
 539
 540sub gitweb_get_feature {
 541        my ($name) = @_;
 542        return unless exists $feature{$name};
 543        my ($sub, $override, @defaults) = (
 544                $feature{$name}{'sub'},
 545                $feature{$name}{'override'},
 546                @{$feature{$name}{'default'}});
 547        # project specific override is possible only if we have project
 548        our $git_dir; # global variable, declared later
 549        if (!$override || !defined $git_dir) {
 550                return @defaults;
 551        }
 552        if (!defined $sub) {
 553                warn "feature $name is not overridable";
 554                return @defaults;
 555        }
 556        return $sub->(@defaults);
 557}
 558
 559# A wrapper to check if a given feature is enabled.
 560# With this, you can say
 561#
 562#   my $bool_feat = gitweb_check_feature('bool_feat');
 563#   gitweb_check_feature('bool_feat') or somecode;
 564#
 565# instead of
 566#
 567#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 568#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 569#
 570sub gitweb_check_feature {
 571        return (gitweb_get_feature(@_))[0];
 572}
 573
 574
 575sub feature_bool {
 576        my $key = shift;
 577        my ($val) = git_get_project_config($key, '--bool');
 578
 579        if (!defined $val) {
 580                return ($_[0]);
 581        } elsif ($val eq 'true') {
 582                return (1);
 583        } elsif ($val eq 'false') {
 584                return (0);
 585        }
 586}
 587
 588sub feature_snapshot {
 589        my (@fmts) = @_;
 590
 591        my ($val) = git_get_project_config('snapshot');
 592
 593        if ($val) {
 594                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 595        }
 596
 597        return @fmts;
 598}
 599
 600sub feature_patches {
 601        my @val = (git_get_project_config('patches', '--int'));
 602
 603        if (@val) {
 604                return @val;
 605        }
 606
 607        return ($_[0]);
 608}
 609
 610sub feature_avatar {
 611        my @val = (git_get_project_config('avatar'));
 612
 613        return @val ? @val : @_;
 614}
 615
 616# checking HEAD file with -e is fragile if the repository was
 617# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 618# and then pruned.
 619sub check_head_link {
 620        my ($dir) = @_;
 621        my $headfile = "$dir/HEAD";
 622        return ((-e $headfile) ||
 623                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 624}
 625
 626sub check_export_ok {
 627        my ($dir) = @_;
 628        return (check_head_link($dir) &&
 629                (!$export_ok || -e "$dir/$export_ok") &&
 630                (!$export_auth_hook || $export_auth_hook->($dir)));
 631}
 632
 633# process alternate names for backward compatibility
 634# filter out unsupported (unknown) snapshot formats
 635sub filter_snapshot_fmts {
 636        my @fmts = @_;
 637
 638        @fmts = map {
 639                exists $known_snapshot_format_aliases{$_} ?
 640                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 641        @fmts = grep {
 642                exists $known_snapshot_formats{$_} &&
 643                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 644}
 645
 646# If it is set to code reference, it is code that it is to be run once per
 647# request, allowing updating configurations that change with each request,
 648# while running other code in config file only once.
 649#
 650# Otherwise, if it is false then gitweb would process config file only once;
 651# if it is true then gitweb config would be run for each request.
 652our $per_request_config = 1;
 653
 654# read and parse gitweb config file given by its parameter.
 655# returns true on success, false on recoverable error, allowing
 656# to chain this subroutine, using first file that exists.
 657# dies on errors during parsing config file, as it is unrecoverable.
 658sub read_config_file {
 659        my $filename = shift;
 660        return unless defined $filename;
 661        # die if there are errors parsing config file
 662        if (-e $filename) {
 663                do $filename;
 664                die $@ if $@;
 665                return 1;
 666        }
 667        return;
 668}
 669
 670our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
 671sub evaluate_gitweb_config {
 672        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 673        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 674        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
 675
 676        # Protect agains duplications of file names, to not read config twice.
 677        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
 678        # there possibility of duplication of filename there doesn't matter.
 679        $GITWEB_CONFIG = ""        if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
 680        $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
 681
 682        # Common system-wide settings for convenience.
 683        # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
 684        read_config_file($GITWEB_CONFIG_COMMON);
 685
 686        # Use first config file that exists.  This means use the per-instance
 687        # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
 688        read_config_file($GITWEB_CONFIG) and return;
 689        read_config_file($GITWEB_CONFIG_SYSTEM);
 690}
 691
 692# Get loadavg of system, to compare against $maxload.
 693# Currently it requires '/proc/loadavg' present to get loadavg;
 694# if it is not present it returns 0, which means no load checking.
 695sub get_loadavg {
 696        if( -e '/proc/loadavg' ){
 697                open my $fd, '<', '/proc/loadavg'
 698                        or return 0;
 699                my @load = split(/\s+/, scalar <$fd>);
 700                close $fd;
 701
 702                # The first three columns measure CPU and IO utilization of the last one,
 703                # five, and 10 minute periods.  The fourth column shows the number of
 704                # currently running processes and the total number of processes in the m/n
 705                # format.  The last column displays the last process ID used.
 706                return $load[0] || 0;
 707        }
 708        # additional checks for load average should go here for things that don't export
 709        # /proc/loadavg
 710
 711        return 0;
 712}
 713
 714# version of the core git binary
 715our $git_version;
 716sub evaluate_git_version {
 717        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 718        $number_of_git_cmds++;
 719}
 720
 721sub check_loadavg {
 722        if (defined $maxload && get_loadavg() > $maxload) {
 723                die_error(503, "The load average on the server is too high");
 724        }
 725}
 726
 727# ======================================================================
 728# input validation and dispatch
 729
 730# Input parameters can come from several sources (at present the CGI query
 731# string and PATH_INFO).  They are all gathered in %input_params while being
 732# validated, so that later users such as href() need not care where a
 733# parameter came from.
 734
 735our %input_params = ();
 736
 737# %input_params is keyed by the long parameter name.  href() converts long
 738# names to their CGI equivalents, and as that is by far the most frequent
 739# use, the mapping is kept in the direction name -> CGI key rather than the
 740# reverse.
 741#
 742# XXX: Warning: If you touch this, check the search form for updating,
 743# too.
 744
 745our @cgi_param_mapping = (
 746        project           => 'p',
 747        action            => 'a',
 748        file_name         => 'f',
 749        file_parent       => 'fp',
 750        hash              => 'h',
 751        hash_parent       => 'hp',
 752        hash_base         => 'hb',
 753        hash_parent_base  => 'hpb',
 754        page              => 'pg',
 755        order             => 'o',
 756        searchtext        => 's',
 757        searchtype        => 'st',
 758        snapshot_format   => 'sf',
 759        extra_options     => 'opt',
 760        search_use_regexp => 'sr',
 761        ctag              => 'by_tag',
 762        diff_style        => 'ds',
 763        project_filter    => 'pf',
 764        # this must be last entry (for manipulation from JavaScript)
 765        javascript        => 'js'
 766);
 767our %cgi_param_mapping = @cgi_param_mapping;
 768
 769# every known action and the subroutine handling it; also used for validation
 770our %actions = (
 771        blame             => \&git_blame,
 772        blame_incremental => \&git_blame_incremental,
 773        blame_data        => \&git_blame_data,
 774        blobdiff          => \&git_blobdiff,
 775        blobdiff_plain    => \&git_blobdiff_plain,
 776        blob              => \&git_blob,
 777        blob_plain        => \&git_blob_plain,
 778        commitdiff        => \&git_commitdiff,
 779        commitdiff_plain  => \&git_commitdiff_plain,
 780        commit            => \&git_commit,
 781        forks             => \&git_forks,
 782        heads             => \&git_heads,
 783        history           => \&git_history,
 784        log               => \&git_log,
 785        patch             => \&git_patch,
 786        patches           => \&git_patches,
 787        remotes           => \&git_remotes,
 788        rss               => \&git_rss,
 789        atom              => \&git_atom,
 790        search            => \&git_search,
 791        search_help       => \&git_search_help,
 792        shortlog          => \&git_shortlog,
 793        summary           => \&git_summary,
 794        tag               => \&git_tag,
 795        tags              => \&git_tags,
 796        tree              => \&git_tree,
 797        snapshot          => \&git_snapshot,
 798        object            => \&git_object,
 799        # those below don't need $project
 800        opml              => \&git_opml,
 801        project_list      => \&git_project_list,
 802        project_index     => \&git_project_index,
 803);
 804
 805# each permitted extra_options value is mapped to the list of actions that
 806# accept it
 807our %allowed_options = (
 808        '--no-merges' => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
 809);
 810
 811# Copy every known CGI parameter into %input_params, keyed by its long name.
 812# 'opt' is the only parameter that may be given several times, so it is
 813# stored as an array reference; all the others are stored as single values.
 814# Should more multi-valued parameters appear, a list of them ought to
 815# replace this special case.
 816sub evaluate_query_params {
 817        our $cgi;
 818
 819        foreach my $long_name (keys %cgi_param_mapping) {
 820                my $short_name = $cgi_param_mapping{$long_name};
 821                $input_params{$long_name} = ($short_name eq 'opt')
 822                        ? [ $cgi->param($short_name) ]
 823                        : scalar $cgi->param($short_name);
 824        }
 825}
 826
 827# Read PATH_INFO and fill in the parameters that the query string left unset:
 828# the project, optionally followed by an action and by a revision/path
 829# specification.  Nothing is done if the project was already given as a CGI
 830# parameter, and only the project is set if an action was given that way.
 831sub evaluate_path_info {
 832        return if defined $input_params{'project'};
 833        return if !$path_info;
 834        $path_info =~ s,^/+,,;
 835        return if !$path_info;
 836
 837        # find which part of PATH_INFO is project
 838        my $project = $path_info;
 839        $project =~ s,/+$,,;
 840        while ($project && !check_head_link("$projectroot/$project")) {
 841                $project =~ s,/*[^/]*$,,;
 842        }
 843        return unless $project;
 844        $input_params{'project'} = $project;
 845
 846        # do not change any parameters if an action is given using the query string
 847        return if $input_params{'action'};
 848        $path_info =~ s,^\Q$project\E/*,,;
 849
 850        # next, check if we have an action
 851        my $action = $path_info;
 852        $action =~ s,/.*$,,;
 853        if (exists $actions{$action}) {
 854                $path_info =~ s,^\Q$action\E/*,,;
 855                $input_params{'action'} = $action;
 856        }
 857
 858        # list of actions that want hash_base instead of hash, but can have no
 859        # pathname (f) parameter
 860        my @wants_base = ('tree', 'history');
 861
 862        # we want to catch, among others
 863        # [$hash_parent_base[:$file_parent]..]$hash_base[:$file_name]
 864        my ($parentrefname, $parentpathname, $refname, $pathname) =
 865                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 866
 867        # first, analyze the 'current' part
 868        if (defined $pathname) {
 869                # we got "branch:filename" or "branch:dir/"
 870                # we could use git_get_type(branch:pathname), but:
 871                # - it needs $git_dir
 872                # - it does a git() call
 873                # - the convention of terminating directories with a slash
 874                #   makes it superfluous
 875                # - embedding the action in the PATH_INFO would make it even
 876                #   more superfluous
 877                $pathname =~ s,^/+,,;
 878                if (!$pathname || substr($pathname, -1) eq "/") {
 879                        $input_params{'action'} ||= "tree";
 880                        $pathname =~ s,/$,,;
 881                } else {
 882                        # the default action depends on whether we had parent info
 883                        # or not
 884                        if ($parentrefname) {
 885                                $input_params{'action'} ||= "blobdiff_plain";
 886                        } else {
 887                                $input_params{'action'} ||= "blob_plain";
 888                        }
 889                }
 890                $input_params{'hash_base'} ||= $refname;
 891                $input_params{'file_name'} ||= $pathname;
 892        } elsif (defined $refname) {
 893                # we got "branch". In this case we have to choose if we have to
 894                # set hash or hash_base.
 895                #
 896                # Most of the actions without a pathname only want hash to be
 897                # set, except for the ones specified in @wants_base that want
 898                # hash_base instead. It should also be noted that hand-crafted
 899                # links having 'history' as an action and no pathname or hash
 900                # set will fail, but that happens regardless of PATH_INFO.
 901                if (defined $parentrefname) {
 902                        # if there is parent let the default be 'shortlog' action
 903                        # (for http://git.example.com/repo.git/A..B links); if there
 904                        # is no parent, dispatch will detect type of object and set
 905                        # action appropriately if required (if action is not set)
 906                        $input_params{'action'} ||= "shortlog";
 907                }
 908                if ($input_params{'action'} &&
 909                    grep { $_ eq $input_params{'action'} } @wants_base) {
 910                        $input_params{'hash_base'} ||= $refname;
 911                } else {
 912                        $input_params{'hash'} ||= $refname;
 913                }
 914        }
 915
 916        # next, handle the 'parent' part, if present
 917        if (defined $parentrefname) {
 918                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 919                # someproject/blobdiff/oldrev..newrev:/filename
 920                if ($parentpathname) {
 921                        $parentpathname =~ s,^/+,,;
 922                        $parentpathname =~ s,/$,,;
 923                        $input_params{'file_parent'} ||= $parentpathname;
 924                } else {
 925                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 926                }
 927                # we assume that hash_parent_base is wanted if a path was specified,
 928                # or if the action (which may still be unset here) wants hash_base
 929                if (defined $input_params{'file_parent'} || (defined $input_params{'action'} &&
 930                        grep { $_ eq $input_params{'action'} } @wants_base)) {
 931                        $input_params{'hash_parent_base'} ||= $parentrefname;
 932                } else {
 933                        $input_params{'hash_parent'} ||= $parentrefname;
 934                }
 935        }
 936
 937        # for the snapshot action, we allow URLs in the form
 938        # $project/snapshot/$hash.ext
 939        # where .ext determines the snapshot and gets removed from the
 940        # passed $refname to provide the $hash.
 941        #
 942        # To be able to tell that $refname includes the format extension, we
 943        # require the following two conditions to be satisfied:
 944        # - the hash input parameter MUST have been set from the $refname part
 945        #   of the URL (i.e. they must be equal)
 946        # - the snapshot format MUST NOT have been defined already (e.g. from
 947        #   CGI parameter sf)
 948        # It's also useless to try any matching unless $refname has a dot,
 949        # so we check for that too
 950        if (defined $input_params{'action'} &&
 951                $input_params{'action'} eq 'snapshot' &&
 952                defined $refname && index($refname, '.') != -1 &&
 953                defined $input_params{'hash'} && $refname eq $input_params{'hash'} &&
 954                !defined $input_params{'snapshot_format'}) {
 955                # We loop over the known snapshot formats, checking for
 956                # extensions. Allowed extensions are both the defined suffix
 957                # (which includes the initial dot already) and the snapshot
 958                # format key itself, with a prepended dot
 959                # (keys, not each: leaving an each loop via last would not reset its iterator)
 960                foreach my $fmt (keys %known_snapshot_formats) {
 961                        my $opt = $known_snapshot_formats{$fmt};
 962                        my $hash = $refname;
 963                        next unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//);
 964                        my $sfx = $1;
 965                        # a valid suffix was found, so set the snapshot format
 966                        # and reset the hash parameter
 967                        $input_params{'snapshot_format'} = $fmt;
 968                        $input_params{'hash'} = $hash;
 969                        # we also set the format suffix to the one requested
 970                        # in the URL: this way a request for e.g. .tgz returns
 971                        # a .tgz instead of a .tar.gz
 972                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 973                        last;
 974                }
 975        }
 976}
 977
 978# Copy the collected %input_params into the request-wide variables declared
 979# here, checking each value on the way.  die_error() is called for the first
 980# value that is rejected, in the order in which the checks appear below.
 981# $search_regexp is $searchtext, quoted unless $search_use_regexp is set.
 982our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 983     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 984     $searchtext, $search_regexp, $project_filter);
 985sub evaluate_and_validate_params {
 986        our $action = $input_params{'action'};
 987        if (defined $action) {
 988                if (!validate_action($action)) {
 989                        die_error(400, "Invalid action parameter");
 990                }
 991        }
 992
 993        # parameters which are pathnames
 994        our $project = $input_params{'project'};
 995        if (defined $project) {
 996                if (!validate_project($project)) {
 997                        undef $project;
 998                        die_error(404, "No such project");
 999                }
1000        }
1001
1002        our $project_filter = $input_params{'project_filter'};
1003        if (defined $project_filter) {
1004                if (!validate_pathname($project_filter)) {
1005                        die_error(404, "Invalid project_filter parameter");
1006                }
1007        }
1008
1009        our $file_name = $input_params{'file_name'};
1010        if (defined $file_name) {
1011                if (!validate_pathname($file_name)) {
1012                        die_error(400, "Invalid file parameter");
1013                }
1014        }
1015
1016        our $file_parent = $input_params{'file_parent'};
1017        if (defined $file_parent) {
1018                if (!validate_pathname($file_parent)) {
1019                        die_error(400, "Invalid file parent parameter");
1020                }
1021        }
1022
1023        # parameters which are refnames
1024        our $hash = $input_params{'hash'};
1025        if (defined $hash) {
1026                if (!validate_refname($hash)) {
1027                        die_error(400, "Invalid hash parameter");
1028                }
1029        }
1030
1031        our $hash_parent = $input_params{'hash_parent'};
1032        if (defined $hash_parent) {
1033                if (!validate_refname($hash_parent)) {
1034                        die_error(400, "Invalid hash parent parameter");
1035                }
1036        }
1037
1038        our $hash_base = $input_params{'hash_base'};
1039        if (defined $hash_base) {
1040                if (!validate_refname($hash_base)) {
1041                        die_error(400, "Invalid hash base parameter");
1042                }
1043        }
1044
1045        # extra_options is stored as an array reference by evaluate_query_params();
1046        # the fallback to an empty list guards against an undefined value
1047        our @extra_options = @{$input_params{'extra_options'} || []};
1048        foreach my $opt (@extra_options) {
1049                if (not exists $allowed_options{$opt}) {
1050                        die_error(400, "Invalid option parameter");
1051                }
1052                # $action may be undefined here, so it is tested before being compared
1053                if (not (defined $action && grep { $_ eq $action } @{$allowed_options{$opt}})) {
1054                        die_error(400, "Invalid option parameter for this action");
1055                }
1056        }
1057
1058        our $hash_parent_base = $input_params{'hash_parent_base'};
1059        if (defined $hash_parent_base) {
1060                if (!validate_refname($hash_parent_base)) {
1061                        die_error(400, "Invalid hash parent base parameter");
1062                }
1063        }
1064
1065        # other parameters
1066        our $page = $input_params{'page'};
1067        if (defined $page && $page =~ m/[^0-9]/) {
1068                die_error(400, "Invalid page parameter");
1069        }
1070
1071        our $searchtype = $input_params{'searchtype'};
1072        if (defined $searchtype && $searchtype =~ m/[^a-z]/) {
1073                die_error(400, "Invalid searchtype parameter");
1074        }
1075
1076        our $search_use_regexp = $input_params{'search_use_regexp'};
1077
1078        our $searchtext = $input_params{'searchtext'};
1079        our $search_regexp;
1080        if (defined $searchtext) {
1081                if (length($searchtext) < 2) {
1082                        die_error(403, "At least two characters are required for search parameter");
1083                }
1084                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
1085        }
1086}
1087
1088our $git_dir;   # path to the current git repository; only updated when $project is set
1089sub evaluate_git_dir {
1090        return unless $project;
1091        our $git_dir = join('/', $projectroot, $project);
1092}
1093
1094our (@snapshot_fmts, $git_avatar);
1095sub configure_gitweb_features {
1096        # list of supported snapshot formats: what the 'snapshot' feature
1097        # yields, passed through filter_snapshot_fmts()
1098        my @configured_fmts = gitweb_get_feature('snapshot');
1099        our @snapshot_fmts = filter_snapshot_fmts(@configured_fmts);
1100
1101        # known avatar providers, each mapped to a test telling whether its
1102        # dependencies are satisfied
1103        my %provider_ready = (
1104                'gravatar' => sub { eval { require Digest::MD5; 1; } },
1105                'picon'    => sub { 1 }, # no dependencies
1106        );
1107        # an unknown provider name, or one whose dependencies are not met,
1108        # resets $git_avatar to the empty string
1109        our ($git_avatar) = gitweb_get_feature('avatar');
1110        my $is_ready = $provider_ready{$git_avatar};
1111        $git_avatar = '' unless ($is_ready && $is_ready->());
1112}
1113
1114# custom error handler: 'die <message>' is Internal Server Error
1115sub handle_errors_html {
1116        my ($escaped_msg) = @_; # it is already HTML escaped
1117        # an error raised inside die_error would lead back here over and over,
1118        # so switch to a plain message handler, disabling handle_errors_html
1119        set_message("Error occured when inside die_error:\n$escaped_msg");
1120
1121        # handlers installed via CGI::Carp::set_message run _after_ the HTTP
1122        # headers are already written, so die_error must not write them itself;
1123        # it also cannot jump out when it is called as error handler
1124        die_error(undef, undef, $escaped_msg,
1125                  -error_handler => 1, -no_http_header => 1);
1126}
1127set_message(\&handle_errors_html);
1128
1129# dispatch: choose a default action if none was given, then run its handler
1130sub dispatch {
1131        # NOTE(review): git_get_type() is assumed to return a false value when the object cannot be resolved
1132        if (!defined $action) {
1133                if (defined $hash) {
1134                        $action = git_get_type($hash)
1135                                or die_error(404, "Object does not exist");
1136                } elsif (defined $hash_base && defined $file_name) {
1137                        $action = git_get_type("$hash_base:$file_name")
1138                                or die_error(404, "File or directory does not exist");
1139                } elsif (defined $project) {
1140                        $action = 'summary';
1141                } else {
1142                        $action = 'project_list';
1143                }
1144        }
1145        die_error(400, "Unknown action") unless defined $actions{$action};
1146        if ($action !~ m/^(?:opml|project_list|project_index)$/ && !$project) {
1147                die_error(400, "Project needed");
1148        }
1149        $actions{$action}->();
1150}
1151
1152sub reset_timer {
1153        our ($t0, $number_of_git_cmds);
1154        $t0 = [ gettimeofday() ] if defined $t0; # left alone while $t0 is undefined
1155        $number_of_git_cmds = 0;
1156}
1157
1158our $first_request = 1;
1159# Serve one request: load the configuration as needed, collect and validate
1160# the input parameters, then hand over to dispatch().
1161sub run_request {
1162        reset_timer();
1163        evaluate_uri();
1164        # the config file and the git version are read on the first request
1165        if ($first_request) {
1166                evaluate_gitweb_config();
1167                evaluate_git_version();
1168        }
1169        # $per_request_config is either a code reference, called on every
1170        # request, or a true value asking to re-read the config every time
1171        if (ref($per_request_config) eq 'CODE') {
1172                $per_request_config->();
1173        } elsif ($per_request_config && !$first_request) {
1174                evaluate_gitweb_config();
1175        }
1176        check_loadavg();
1177
1178        # $projectroot and $projects_list might be set in gitweb config file
1179        $projects_list ||= $projectroot;
1180
1181        evaluate_query_params();
1182        evaluate_path_info();
1183        evaluate_and_validate_params();
1184        evaluate_git_dir();
1185        configure_gitweb_features();
1186        dispatch();
1187}
1188
1189our $is_last_request = sub { 1 };
1190our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
1191our $CGI = 'CGI';
1192our $cgi;
1193# switch to FastCGI: request objects are then created through CGI::Fast, and
1194# $is_last_request turns true once 100 requests have been counted
1195sub configure_as_fcgi {
1196        require CGI::Fast;
1197        our $CGI = 'CGI::Fast';
1198        my $request_number = 0;
1199        our $is_last_request = sub { ++$request_number >= 100 };
1200}
1201# Decide from the script name and the command line whether to run as FastCGI.
1202sub evaluate_argv {
1203        my $invoked_as = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
1204        configure_as_fcgi() if $invoked_as =~ /\.fcgi$/;
1205        return if !@ARGV;
1206
1207        # --nproc: hand process management to FCGI::ProcManager, if it can be loaded
1208        my $setup_proc_manager = sub {
1209                my ($opt_name, $nproc) = @_;
1210                eval { require FCGI::ProcManager; 1; } or return;
1211                my $manager = FCGI::ProcManager->new({ n_processes => $nproc });
1212                our $pre_listen_hook    = sub { $manager->pm_manage()        };
1213                our $pre_dispatch_hook  = sub { $manager->pm_pre_dispatch()  };
1214                our $post_dispatch_hook = sub { $manager->pm_post_dispatch() };
1215        };
1216
1217        require Getopt::Long;
1218        Getopt::Long::GetOptions(
1219                'fastcgi|fcgi|f' => \&configure_as_fcgi,
1220                'nproc|n=i'      => $setup_proc_manager,
1221        );
1222}
1223
1224# Main loop: create request objects through $CGI and serve them one at a time,
1225# calling the optional hooks around each request, until $is_last_request says stop.
1226sub run {
1227        evaluate_argv();
1228
1229        $first_request = 1;
1230        $pre_listen_hook->() if $pre_listen_hook;
1231
1232 REQUEST:
1233        while ($cgi = $CGI->new()) {
1234                $pre_dispatch_hook->() if $pre_dispatch_hook;
1235                run_request();
1236                $post_dispatch_hook->() if $post_dispatch_hook;
1237                $first_request = 0;
1238                if ($is_last_request->()) {
1239                        last REQUEST;
1240                }
1241        }
1242
1243        # NOTE(review): nothing in this sub jumps to the label below, so it is
1244        # presumably a target for code elsewhere in the file; keep it
1245 DONE_GITWEB:
1246        1;
1247}
1248
1249run();
1250
1251# Having a caller means that we are wrapped in a subroutine processing
1252# requests, e.g. mod_perl with ModPerl::Registry, or PSGI with
1253# Plack::App::WrapCGI, so control goes back to that wrapper; otherwise
1254# this is a pure CGI script, serving single request, which simply exits.
1255return if defined caller;
1256
1257# pure CGI script
1258exit;
1259
1260## ======================================================================
1261## action links
1262
1263# build a gitweb URL (returned as a string) from named parameters, i.e. keys of %cgi_param_mapping;
1264# possible values of extra options
1265# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
1266# -replay => 1      - start from a current view (replay with modifications)
1267# -path_info => 0|1 - don't use/use path_info URL (if possible)
1268# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
1269sub href {
1270        my %params = @_;
1271        # default is to use -absolute url() i.e. $my_uri
1272        my $href = $params{-full} ? $my_url : $my_uri;
1273        # implicit -replay, must be first of implicit params
1274        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});
1275
1276        $params{'project'} = $project unless exists $params{'project'};
1277
1278        if ($params{-replay}) {
1279                while (my ($name, $symbol) = each %cgi_param_mapping) {
1280                        if (!exists $params{$name}) {
1281                                $params{$name} = $input_params{$name};
1282                        }
1283                }
1284        }
1285
1286        my $use_pathinfo = gitweb_check_feature('pathinfo');
1287        if (defined $params{'project'} &&
1288            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
1289                # try to put as many parameters as possible in PATH_INFO:
1290                #   - project name
1291                #   - action
1292                #   - hash_parent or hash_parent_base:/file_parent
1293                #   - hash or hash_base:/filename
1294                #   - the snapshot_format as an appropriate suffix
1295
1296                # When the script is the root DirectoryIndex for the domain,
1297                # $href here would be something like http://gitweb.example.com/
1298                # Thus, we strip any trailing / from $href, to spare us double
1299                # slashes in the final URL
1300                $href =~ s,/$,,;
1301
1302                # Then add the project name, if present
1303                $href .= "/".esc_path_info($params{'project'});
1304                delete $params{'project'};
1305
1306                # since we destructively absorb parameters, we keep this boolean that
1307                # remembers if we're handling a snapshot (the action may be undefined)
1308                my $is_snapshot = defined $params{'action'} && $params{'action'} eq 'snapshot';
1309
1310                # Summary just uses the project path URL, any other action is
1311                # added to the URL
1312                if (defined $params{'action'}) {
1313                        $href .= "/".esc_path_info($params{'action'})
1314                                unless $params{'action'} eq 'summary';
1315                        delete $params{'action'};
1316                }
1317
1318                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
1319                # stripping nonexistent or useless pieces
1320                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
1321                        || $params{'hash_parent'} || $params{'hash'});
1322                if (defined $params{'hash_base'}) {
1323                        if (defined $params{'hash_parent_base'}) {
1324                                $href .= esc_path_info($params{'hash_parent_base'});
1325                                # skip the file_parent if it's the same as the file_name
1326                                if (defined $params{'file_parent'}) {
1327                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
1328                                                delete $params{'file_parent'};
1329                                        } elsif ($params{'file_parent'} !~ /\.\./) {
1330                                                $href .= ":/".esc_path_info($params{'file_parent'});
1331                                                delete $params{'file_parent'};
1332                                        }
1333                                }
1334                                $href .= "..";
1335                                delete $params{'hash_parent'};
1336                                delete $params{'hash_parent_base'};
1337                        } elsif (defined $params{'hash_parent'}) {
1338                                $href .= esc_path_info($params{'hash_parent'}). "..";
1339                                delete $params{'hash_parent'};
1340                        }
1341
1342                        $href .= esc_path_info($params{'hash_base'});
1343                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
1344                                $href .= ":/".esc_path_info($params{'file_name'});
1345                                delete $params{'file_name'};
1346                        }
1347                        delete $params{'hash'};
1348                        delete $params{'hash_base'};
1349                } elsif (defined $params{'hash'}) {
1350                        $href .= esc_path_info($params{'hash'});
1351                        delete $params{'hash'};
1352                }
1353
1354                # If the action was a snapshot, we can absorb the
1355                # snapshot_format parameter too
1356                if ($is_snapshot) {
1357                        my $fmt = $params{'snapshot_format'};
1358                        # snapshot_format should always be defined when href()
1359                        # is called, but just in case some code forgets, we
1360                        # fall back to the default
1361                        $fmt ||= $snapshot_fmts[0];
1362                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
1363                        delete $params{'snapshot_format'};
1364                }
1365        }
1366
1367        # now encode the parameters explicitly
1368        my @result = ();
1369        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
1370                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
1371                if (defined $params{$name}) {
1372                        if (ref($params{$name}) eq "ARRAY") {
1373                                foreach my $par (@{$params{$name}}) {
1374                                        push @result, $symbol . "=" . esc_param($par);
1375                                }
1376                        } else {
1377                                push @result, $symbol . "=" . esc_param($params{$name});
1378                        }
1379                }
1380        }
1381        $href .= "?" . join(';', @result) if scalar @result;
1382
1383        # final transformation: trailing spaces must be escaped (URI-encoded)
1384        $href =~ s/(\s+)$/CGI::escape($1)/e;
1385
1386        if ($params{-anchor}) {
1387                $href .= "#".esc_param($params{-anchor});
1388        }
1389
1390        return $href;
1391}
1392
1393
1394## ======================================================================
1395## validation, quoting/unquoting and escaping
1396
1397sub validate_action {
1398        my ($candidate) = @_;
1399        # false or unknown action names are rejected with undef
1400        return ($candidate && exists $actions{$candidate}) ? $candidate : undef;
1401}
1402
1403sub validate_project {
1404        my ($name) = @_;
1405        return undef unless $name;
1406        # the name must be a valid pathname, be a directory below $projectroot that
1407        # passes check_export_ok() and, under $strict_export, be in the projects list
1408        my $path = "$projectroot/$name";
1409        return undef unless validate_pathname($name) && -d $path;
1410        return undef unless check_export_ok($path);
1411        return undef if $strict_export && !project_in_list($name);
1412        return $name;
1413}
1414
1415# returns its argument if it is an acceptable pathname, and undef otherwise
1416sub validate_pathname {
1417        my ($path) = @_;
1418        return undef unless $path;
1419
1420        # A path element may not be empty, '.' or '..', be it at the
1421        # beginning, at the end, or between slashes.  Rejecting empty
1422        # elements also catches leading, trailing and doubled slashes.
1423        my $has_bad_element = ($path =~ m!(^|/)(|\.|\.\.)(/|$)!);
1424
1425        # null characters are not allowed either
1426        my $has_null = ($path =~ m!\0!);
1427
1428        return ($has_bad_element || $has_null) ? undef : $path;
1429}
1430
1431# returns its argument if it is a textual hash or an acceptable ref name,
1432# and undef otherwise
1433sub validate_refname {
1434        my $input = shift || return undef;
1435
1436        # textual hashes are O.K.; \z is used instead of $ so that a hash
1437        # followed by a newline is not accepted
1438        return $input if $input =~ m/^[0-9a-fA-F]{40}\z/;
1439
1440        # it must be correct pathname
1441        $input = validate_pathname($input)
1442                or return undef;
1443        # restrictions on ref name according to git-check-ref-format
1444        return undef if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;
1445        return $input;
1446}
1447
1448# Decode a sequence of octets into Perl's internal form.  A string already
1449# flagged as utf8 is returned unchanged and one that is valid utf-8 is
1450# returned decoded; anything else is decoded using $fallback_encoding.
1451# gitweb writes out in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
1452sub to_utf8 {
1453        my ($octets) = @_;
1454        return undef unless defined $octets;
1455
1456        # utf8::decode() works in place and tells whether it succeeded
1457        return $octets if utf8::is_utf8($octets) || utf8::decode($octets);
1458
1459        return decode($fallback_encoding, $octets, Encode::FB_DEFAULT);
1460}
1461
1462# quote unsafe characters of a parameter value and turn spaces into '+'; the
1463# slash is kept although that is not correct: quoted slashes look too horrible in bookmarks
1464sub esc_param {
1465        my ($value) = @_;
1466        return undef unless defined $value;
1467        $value =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
1468        $value =~ s/ /\+/g;
1469        return $value;
1470}
1471
1472# quote a string for use inside PATH_INFO; the rules are slightly different
1473# from those for parameters: '+' is not treated as space (specially) there,
1474# but '?' must be escaped
1475sub esc_path_info {
1476        my ($fragment) = @_;
1477        return undef unless defined $fragment;
1478
1479        $fragment =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
1480        return $fragment;
1481}
1482
# Escape unsafe characters in a whole URL.  Because the argument is a
# complete URL, characters with structural meaning (such as '?', '&',
# '=', ';', ':' and '/') cannot be quoted; spaces become '+'.
# Returns undef for undefined input.
sub esc_url {
        my ($str) = @_;
        defined $str or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $str =~ s/ /\+/g;

        return $str;
}
1491
# Quote unsafe characters for use inside an HTML attribute value.
# All arguments are handed on to esc_html unchanged, because for XHTML
# conformance escaping '"' to '&quot;' is not enough.
sub esc_attr {
        my @args = @_;

        return esc_html(@args);
}
1498
# Escape a string for inclusion in HTML.
# The string is decoded with to_utf8, passed through $cgi->escapeHTML and
# then every control character except TAB is replaced by the output of
# quot_cec.  With the option -nbsp => 1 spaces are turned into "&nbsp;".
# Returns undef for undefined input.
sub esc_html {
        my ($str, %opts) = @_;
        defined $str or return undef;

        my $html = $cgi->escapeHTML(to_utf8($str));
        $html =~ s/ /&nbsp;/g if $opts{'-nbsp'};

        # tabs are left alone here; all other control characters get quoted
        $html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;

        return $html;
}
1514
# Escape a filename for inclusion in HTML.
# Works like esc_html, except that every control character, TAB included,
# is replaced by the output of quot_cec.  With the option -nbsp => 1 spaces
# are turned into "&nbsp;".  Returns undef for undefined input.
sub esc_path {
        my ($str, %opts) = @_;
        defined $str or return undef;

        my $html = $cgi->escapeHTML(to_utf8($str));
        $html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $html =~ s|([[:cntrl:]])|quot_cec($1)|eg;

        return $html;
}
1530
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0).
# The string is decoded with to_utf8; TAB, LF and CR are kept, every other
# control character is replaced by the output of quot_cec.  No HTML
# escaping is done here.  Returns undef for undefined input.
sub sanitize {
        my ($str) = @_;
        defined $str or return undef;

        my $text = to_utf8($str);
        $text =~ s|([[:cntrl:]])|($1 =~ /[\t\n\r]/ ? $1 : quot_cec($1))|eg;

        return $text;
}
1541
# Make control characters "printable", using character escape codes (CEC).
#
# $cntrl is the (single) control character to represent.  Characters with
# a well known escape sequence use it (e.g. "\n" becomes the two characters
# '\n'); any other character is shown as a backslash followed by its code
# as two zero-padded lowercase hex digits (e.g. chr(1) becomes '\01').
#
# By default the result is wrapped in <span class="cntrl">...</span>;
# pass -nohtml => 1 to get the bare escape sequence instead.
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # zero-pad the hex code: a plain '%2x' would pad with a space and
        # produce e.g. '\ 1' for chr(1)
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1566
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR)
#
# $cntrl is the (single) control character to represent.  The result is a
# decimal numeric character reference into the Unicode "Control Pictures"
# block: U+2400 + code for the C0 controls, and U+2421 (SYMBOL FOR DELETE)
# for DEL (0x7f).
#
# By default the result is wrapped in <span class="cntrl">...</span>;
# pass -nohtml => 1 to get the bare character reference instead.
sub quot_upr {
        my $cntrl = shift;
        my %opts = @_;

        my $code = ord($cntrl);
        # DEL does not follow the "0x2400 + code" layout of the C0 controls
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1580
# git may return quoted and escaped filenames; undo that quoting.
# A string enclosed in double quotes has the quotes removed and every
# backslash sequence inside replaced: one to three octal digits become the
# character with that code, known C escapes become the matching control
# character, and any other escaped character stands for itself.
# A string not enclosed in double quotes is returned unchanged.
sub unquote {
        my ($str) = @_;

        # translate the part of one escape sequence that follows the backslash
        sub unq {
                my ($seq) = @_;
                my %es = ( # character escape codes, aka escape sequences
                        't' => "\t",   # tab            (HT, TAB)
                        'n' => "\n",   # newline        (NL)
                        'r' => "\r",   # return         (CR)
                        'f' => "\f",   # form feed      (FF)
                        'b' => "\b",   # backspace      (BS)
                        'a' => "\a",   # alarm (bell)   (BEL)
                        'e' => "\e",   # escape         (ESC)
                        'v' => "\013", # vertical tab   (VT)
                );

                # octal char sequence
                return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

                # C escape sequence if known, otherwise quoted ordinary character
                return exists $es{$seq} ? $es{$seq} : $seq;
        }

        # nothing to do unless the whole string is quoted
        return $str unless $str =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}
1616
# escape tabs (convert tabs to spaces)
# Each tab is replaced, left to right, by as many spaces as are needed to
# reach the next column that is a multiple of 8.
sub untabify {
        my ($line) = @_;

        my $pos;
        while (($pos = index($line, "\t")) != -1) {
                # always between 1 and 8 spaces
                substr($line, $pos, 1) = ' ' x (8 - ($pos % 8));
        }

        return $line;
}
1630
# Tell whether $project is among the projects returned by
# git_get_projects_list().  Returns 0 when that list is empty, otherwise
# the number of entries whose 'path' equals $project.
sub project_in_list {
        my ($project) = @_;

        my @projects = git_get_projects_list();
        return 0 unless @projects;

        return scalar(grep { $_->{'path'} eq $project } @projects);
}
1636
1637## ----------------------------------------------------------------------
1638## HTML aware string manipulation
1639
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# $add_len defaults to 10.  $where selects which part is dropped and
# replaced by an ellipsis: 'left', 'center' or 'right' (the default).
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        my $in_center = ($where eq 'center');

        # return early if chopping wouldn't make string shorter;
        # the filler is 5 characters long for 'center' and 4 otherwise
        my $filler_len = $in_center ? 5 : 4;
        return $str if ($len + $filler_len >= length($str));

        # when chopping in the middle, distribute $len into left and right part
        $len = int($len/2) if $in_center;

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                $str =~ m/^(.*?)($begre)$/;
                my ($dropped, $kept) = ($1, $2);
                # only put in the ellipsis if it is shorter than what it replaces
                $dropped = " ..." if (length($dropped) > 4);
                return $dropped . $kept;
        }

        if ($in_center) {
                $str =~ m/^($endre)(.*)$/;
                my ($head, $rest) = ($1, $2);
                $rest =~ m/^(.*?)($begre)$/;
                my ($gap, $tail) = ($1, $2);
                $gap = " ... " if (length($gap) > 5);
                return $head . $gap . $tail;
        }

        # default: keep the beginning, drop the end
        $str =~ m/^($endre)(.*)$/;
        my ($kept, $dropped) = ($1, $2);
        $dropped = "... " if (length($dropped) > 4);
        return $kept . $dropped;
}
1699
# Takes the same arguments as chop_str and returns the chopped string,
# HTML-escaped with esc_html.  If chopping changed the string, the result
# is wrapped in a <span> whose title attribute holds the full string, with
# control characters replaced by '?'.
sub chop_and_escape_str {
        my ($full) = @_;

        my $chopped = chop_str(@_);
        $full = to_utf8($full);

        # not shortened: no need for the title
        return esc_html($chopped) if ($chopped eq $full);

        $full =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$full}, esc_html($chopped));
}
1715
1716## ----------------------------------------------------------------------
1717## functions returning short strings
1718
# CSS class for given age value (in seconds):
# "noage" when the age is undefined, "age0" for less than two hours,
# "age1" for less than two days, and "age2" for anything older.
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1733
# convert age in seconds to "nn units ago" string
# The coarsest unit of which the age is more than two is used, and the
# count is truncated to an integer; an age of two seconds or less gives
# " right now" (with the leading space).
sub age_string {
        my ($age) = @_;

        # Each entry lists the divisors that, applied one after another,
        # convert seconds into the unit, followed by the text to append.
        # Entries run from the coarsest unit to the finest.
        my @scales = (
                [ [60, 60, 24, 365],      " years ago"  ],
                [ [60, 60, 24, (365/12)], " months ago" ],
                [ [60, 60, 24, 7],        " weeks ago"  ],
                [ [60, 60, 24],           " days ago"   ],
                [ [60, 60],               " hours ago"  ],
                [ [60],                   " min ago"    ],
                [ [],                     " sec ago"    ],
        );

        foreach my $scale (@scales) {
                my ($divisors, $suffix) = @$scale;

                # length of one unit, in seconds
                my $unit_secs = 1;
                $unit_secs *= $_ foreach @$divisors;
                next unless ($age > $unit_secs * 2);

                my $count = $age;
                $count /= $_ foreach @$divisors;
                return int($count) . $suffix;
        }

        return " right now";
}
1765
# File type bit patterns (octal) used next to the S_IF* constants from
# Fcntl: S_IFGITLINK is the type tested for by S_ISGITLINK.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1770
# submodule/subproject, a commit object reference
# True when the file type bits of the (numeric) $mode equal S_IFGITLINK.
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = ($mode & S_IFMT);
        return ($type_bits == S_IFGITLINK);
}
1777
# convert file mode in octal to symbolic file mode string
# The argument is a string of octal digits.  The result is one of a fixed
# set of "ls -l" style strings; an unrecognized type gives '----------'.
sub mode_str {
        my ($octal) = @_;
        my $mode = oct $octal;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # regular file: git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1799
# convert file mode in octal to file type string
# An argument that does not consist solely of octal digits is returned
# unchanged.  Otherwise the result is "submodule", "directory", "symlink",
# "file" or "unknown".
sub file_type {
        my ($mode) = @_;

        # not a mode at all: hand it back as is
        return $mode if ($mode !~ m/^[0-7]+$/);

        my $bits = oct $mode;

        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "file"      if S_ISREG($bits);
        return "unknown";
}
1822
# convert file mode in octal to file type description string
# An argument that does not consist solely of octal digits is returned
# unchanged.  Otherwise the result is "submodule", "directory", "symlink",
# "executable" (regular file with the user execute bit set), "file" or
# "unknown".
sub file_type_long {
        my ($mode) = @_;

        # not a mode at all: hand it back as is
        return $mode if ($mode !~ m/^[0-7]+$/);

        my $bits = oct $mode;

        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "unknown"   unless S_ISREG($bits);

        return ($bits & S_IXUSR) ? "executable" : "file";
}
1849
1850
1851## ----------------------------------------------------------------------
1852## functions returning short HTML fragments, or transforming HTML fragments
1853## which don't belong to other sections
1854
# format line of commit message.
# The line is escaped with esc_html (spaces become "&nbsp;"), then every
# standalone run of 8 to 40 hexadecimal digits is turned into a link to
# the "object" action for that hash.
sub format_log_line_html {
        my ($line) = @_;

        my $html = esc_html($line, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                $cgi->a({-href => href(action=>"object", hash=>$1),
                                        -class => "text"}, $1);
        }eg;

        return $html;
}
1867
# format marker of refs pointing to given object
#
# $refs is a hash reference mapping object ids to array references of ref
# names (e.g. "tags/v2.6.11" or "heads/next"; a trailing "^{}" marks an
# indirect ref), and $id is the object to look up.  Returns an HTML
# fragment with one <span> per ref, or "" if no ref points to $id.
# $refs itself is left unmodified.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $ref_entry (@{$refs->{$id}}) {
                        # work on a copy: foreach aliases the array elements, so
                        # stripping "^{}" in place would alter the caller's data
                        # and a later call for the same id would no longer see
                        # the ref as indirect
                        my $ref = $ref_entry;

                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name) = qw();
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, $name);

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1927
# format, perhaps shortened and with markers, title line
# Returns a link to $href with class "list subject", followed by $extra
# (empty if not given).  When $short is shorter than $long the link shows
# $short and carries $long, with control characters replaced by '?', as
# its title; otherwise the link shows $long and has no title.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my %attr = (-href => $href, -class => "list subject");
        my $shown = $long;

        if (length($short) < length($long)) {
                $long =~ s/[[:cntrl:]]/?/g;
                $attr{-title} = to_utf8($long);
                $shown = $short;
        }

        return $cgi->a(\%attr, esc_html($shown)) . $extra;
}
1943
1944# Rather than recomputing the url for an email multiple times, we cache it
1945# after the first hit. This gives a visible benefit in views where the avatar
1946# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines (currently gravatar and picon),
# which are free to use it as preferred. Since only one avatar engine is used
# for any given page, there's no risk for cache conflicts.
1950our %avatar_cache = ();
1951
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased and split at '@' into user and domain; the
# resulting url is kept in %avatar_cache under the lowercased email.
sub picon_url {
        my ($address) = @_;
        my $email = lc $address;

        return $avatar_cache{$email} if $avatar_cache{$email};

        my ($user, $domain) = split('@', $email);
        $avatar_cache{$email} =
                "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                "$domain/$user/" .
                "users+domains+unknown/up/single";

        return $avatar_cache{$email};
}
1965
# Compute the gravatar url for a given email, if it's not in the cache already.
# Only the part of the URL before the size is stored in %avatar_cache, since
# that's the one computationally more expensive. This also allows reuse of
# the cache for different sizes (for this particular engine).
# The email is lowercased before hashing; $size is appended to the result.
sub gravatar_url {
        my ($address, $size) = @_;
        my $email = lc $address;

        unless ($avatar_cache{$email}) {
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" .
                                Digest::MD5::md5_hex($email) . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1978
# Return the <img> element for the avatar of the given $email, or "" if no
# avatar url could be determined (which we take to mean avatars are
# completely disabled/unavailable).
# Options: -size selects an entry of %avatar_size (falling back to
# 'default'); -pad_before and -pad_after add a "&nbsp;" before/after the
# image.
sub git_get_avatar {
        my ($email, %opts) = @_;

        my $size_name = $opts{-size} || 'default';
        my $size = $avatar_size{$size_name} || $avatar_size{'default'};

        # Other providers can be added by extending this chain, defining the
        # url as needed.
        my $url = ($git_avatar eq 'gravatar') ? gravatar_url($email, $size)
                : ($git_avatar eq 'picon')    ? picon_url($email)
                :                               "";
        return "" unless $url;

        my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
        my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");

        return $pre_white .
               qq{<img width="$size" class="avatar" src="} .
               esc_url($url) .
               qq{" alt="" />} .
               $post_white;
}
2007
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype ('author' or 'committer') is passed on to the search action
# and selects the wording of the link title.  When the 'search' feature is
# not enabled, $displaytext is returned as is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        return $displaytext unless gitweb_check_feature('search');

        # verb used in the title; empty for any other search type
        my %verb_for = (
                'author'    => "authored",
                'committer' => "committed",
        );
        my $performed = exists $verb_for{$searchtype}
                      ? $verb_for{$searchtype}
                      : "";

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                        searchtext=>$author,
                        searchtype=>$searchtype), class=>"list",
                        title=>"Search for commits $performed by $author"},
                        $displaytext);
}
2030
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str).
# The avatar for the author's email, if any, is placed before the name,
# and both are wrapped by format_search_author.
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name   = $co->{'author_name'};
        my $author = chop_and_escape_str($name, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $inner  = format_search_author($name, "author", $avatar . $author);

        return "<$tag class=\"author\">" . $inner . "</$tag>";
}
2044
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
# The filenames in $line are cut off and replaced by the escaped names
# from $from and $to, each linked when the respective 'href' is set.
# A true $diffinfo->{'nparents'} marks a combined diff, which shows only
# the "to" name.  Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $line =~ s!^(diff (.*?) )"?.*$!$1!;

                my $to_path = esc_path($to->{'file'});
                # file was deleted if there is no href
                $line .= $to->{'href'}
                       ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                 $to_path)
                       : $to_path;
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;

                my $from_path = 'a/' . esc_path($from->{'file'});
                my $to_path   = 'b/' . esc_path($to->{'file'});

                # file was added if there is no href
                $line .= $from->{'href'}
                       ? $cgi->a({-href => $from->{'href'}, -class => "path"},
                                 $from_path)
                       : $from_path;
                $line .= ' ';
                # file was deleted if there is no href
                $line .= $to->{'href'}
                       ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                 $to_path)
                       : $to_path;
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2080
# format extended diff header line, before patch itself
#
# $line is one extended header line; $diffinfo, $from and $to describe the
# diff it belongs to.  Depending on what the line looks like:
# - "copy from"/"rename from"/"copy to"/"rename to": the path is replaced
#   by a link to the respective file
# - a line ending in a six digit mode: the file type is appended
# - "index ..." lines: the object ids are replaced by abbreviated (7
#   character) ids, linked when the respective 'href' is set, and by seven
#   zeros otherwise
# Returns the formatted line followed by "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                       esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                $line = 'index ';
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff
                # (the dots are escaped so that only a literal ".." matches)
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                # the ids are matched as literal text, not as patterns
                $line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2146
# format from-file/to-file diff header
# Returns one <div class="diff from_file"> per "from" side (a single one
# for an ordinary diff, one per parent for a combined diff), followed by
# one <div class="diff to_file">.  File names are replaced by escaped
# names, linked when the respective 'href' is set.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my @rows;

        if ($diffinfo->{'nparents'}) {
                # combined diff (merge commit)
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $text = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                # "<n>" links to the diff against parent n,
                                # the name links to the file in that parent
                                $text = '--- ' .
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1) .
                                        '/' .
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                        }
                        push @rows, qq!<div class="diff from_file">$text</div>\n!;
                }
        } else {
                # ordinary (single parent) diff
                my $text = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($text =~ m!^--- "?a/!) {
                        my $path = esc_path($from->{'file'});
                        $text = '--- a/' .
                                ($from->{'href'}
                                 ? $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                           $path)
                                 : $path);
                }
                push @rows, qq!<div class="diff from_file">$text</div>\n!;
        }

        my $to_text = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($to_text =~ m!^\+\+\+ "?b/!) {
                my $path = esc_path($to->{'file'});
                $to_text = '+++ b/' .
                           ($to->{'href'}
                            ? $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                      $path)
                            : $path);
        }
        push @rows, qq!<div class="diff to_file">$to_text</div>\n!;

        return join('', @rows);
}
2212
# create note for patch simplified by combined diff
# Returns a "diff --cc <file>" header div followed by a "Simple merge"
# div.  The file name links to its blob unless is_deleted($diffinfo) says
# the file is gone.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $path = esc_path($diffinfo->{'to_file'});
        unless (is_deleted($diffinfo)) {
                $path = $cgi->a({-href => href(action=>"blob",
                                               hash_base=>$hash,
                                               hash=>$diffinfo->{'to_id'},
                                               file_name=>$diffinfo->{'to_file'}),
                                 -class => "path"},
                                $path);
        }

        return "<div class=\"diff header\">" .
               "diff --cc " .
               $path .
               "</div>\n" . # class="diff header"
               "<div class=\"diff nodifferences\">" .
               "Simple merge" .
               "</div>\n"; # class="diff nodifferences"
}
2237
# Classify one line of diff output and return the matching CSS class:
# "chunk_header", "incomplete", "ctx", "add" or "rem", or "" if the line
# is none of these.  For a combined diff ($from->{'href'} is an array
# reference) the number of leading sign columns equals the number of
# elements in that array; for an ordinary diff it is 1.
sub diff_line_class {
        my ($line, $from, $to) = @_;

        # number of sign columns: 1 for ordinary diff
        my $num_sign = 1;
        # combined diff
        if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
                $num_sign = scalar @{$from->{'href'}};
        }

        return "chunk_header" if ($line =~ m/^\@\@{$num_sign} /);
        return "incomplete"   if ($line =~ m/^\\/);
        # the test for context must come before the tests for add/rem,
        # because their patterns also accept a line made of spaces only
        return "ctx"          if ($line =~ m/^ {$num_sign}/);
        return "add"          if ($line =~ m/^[+ ]{$num_sign}/);
        return "rem"          if ($line =~ m/^[- ]{$num_sign}/);

        # fallback
        return "";
}
2266
# assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for unified diff
#
# Returns the chunk header as HTML: the "-start,count" and "+start,count"
# ranges, each linked to line "start" of the respective file when its
# 'href' is set, in a "chunk_info" span, followed by the escaped rest of
# the line in a "section" span.
sub format_unidiff_chunk_header {
        my ($line, $from, $to) = @_;

        # the line counts are matched but not needed for the output
        my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
                $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

        my $from_html = $from->{'href'}
                      ? $cgi->a({-href=>"$from->{'href'}#l$from_start",
                                 -class=>"list"}, $from_text)
                      : $from_text;
        my $to_html   = $to->{'href'}
                      ? $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                 -class=>"list"}, $to_text)
                      : $to_text;

        return "<span class=\"chunk_info\">@@ $from_html $to_html @@</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2290
# Format the chunk header of a combined diff ("@@@ -a,b -c,d +e,f @@@ section")
# as HTML.
# Assumes that $from and $to are defined and correctly filled, and that $line
# holds a chunk header line of a combined diff.
# The last range belongs to the 'to' side, all earlier ones to the 'from'
# sides; a range becomes a link to its first line when the matching
# $from->{'href'}[$i] / $to->{'href'} is set.
sub format_cc_diff_chunk_header {
	my ($line, $from, $to) = @_;

	my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

	# each range is "<sign><start>[,<nlines>]"; a missing count is taken as 0
	my (@texts, @starts, @nlines);
	foreach my $range (split(' ', $ranges)) {
		my ($start, $count) = (split(',', substr($range, 1)), 0);
		push @texts,  $range;
		push @starts, $start;
		push @nlines, $count;
	}

	my $to_text   = pop @texts;
	my $to_start  = pop @starts;
	my $to_nlines = pop @nlines;

	my @parts;
	foreach my $i (0 .. $#texts) {
		my $part = $texts[$i];
		if ($from->{'href'}[$i]) {
			$part = $cgi->a({-href=>"$from->{'href'}[$i]#l$starts[$i]",
			                 -class=>"list"}, $texts[$i]);
		}
		push @parts, $part;
	}

	my $to_part = $to_text;
	if ($to->{'href'}) {
		$to_part = $cgi->a({-href=>"$to->{'href'}#l$to_start",
		                    -class=>"list"}, $to_text);
	}
	push @parts, $to_part;

	return "<span class=\"chunk_info\">$prefix " . join(' ', @parts) . " $prefix</span>" .
	       "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2329
# Process one line of a patch body (not to be used for diff headers).
# Returns a two-element list: the class of the line and the HTML-formatted
# (but not wrapped) line.  Chunk headers are formatted specially, and only
# when both $from and $to are given; everything else is HTML-escaped.
sub process_diff_line {
	my ($line, $from, $to) = @_;

	# the class is determined from the line as it was passed in
	my $diff_class = diff_line_class($line, $from, $to);

	chomp $line;
	$line = untabify($line);

	if ($from && $to) {
		# ordinary diff chunk header
		return $diff_class, format_unidiff_chunk_header($line, $from, $to)
			if ($line =~ m/^\@{2} /);
		# combined diff chunk header
		return $diff_class, format_cc_diff_chunk_header($line, $from, $to)
			if ($line =~ m/^\@{3}/);
	}

	return $diff_class, esc_html($line, -nbsp=>1);
}
2352
# Generates snapshot link(s) for the tree/commit given by $hash, based on
# the configured @snapshot_fmts:
# * no format:         undef
# * exactly one:       a single "_snapshot_" link whose tooltip names the format
# * more than one:     "snapshot (_tar.gz_ _zip_)", one link per format,
#                      labelled with the format's display name
sub format_snapshot_links {
	my ($hash) = @_;
	my $num_fmts = @snapshot_fmts;

	# $num_fmts == 0
	return undef if ($num_fmts < 1);

	if ($num_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		my $fmt = $snapshot_fmts[0];
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
			}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	my @links;
	foreach my $fmt (@snapshot_fmts) {
		my $link = $cgi->a({
			-href => href(
				action=>"snapshot",
				hash=>$hash,
				snapshot_format=>$fmt
			)
		}, $known_snapshot_formats{$fmt}{'display'});
		push @links, $link;
	}
	return "snapshot (" . join(' ', @links) . ")";
}
2387
2388## ......................................................................
2389## functions returning values to be passed, perhaps after some
2390## transformation, to other functions; e.g. returning arguments to href()
2391
# Returns a hash to be passed to href() to generate the URL of a feed;
# the -title key holds a description of the link.
# $format - feed format, 'Atom' when omitted; its lowercased name is the action
# Returns an empty list when no project is selected or when the current
# action is one that has no specific feed.
sub get_feed_info {
	my $format = shift || 'Atom';

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branch refs use the 'refs/heads/' prefix (full name) to differentiate
	# them from tag links; $hash_base takes precedence over $hash
	my $branch;
	foreach my $ref ($hash_base, $hash) {
		next unless defined $ref;
		if ($ref =~ m!^refs/heads/(.*)$!) {
			$branch = $1;
			last;
		}
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} elsif (defined $branch) {
		$type = "log of $branch";
	} else {
		$type = 'log';
	}

	my %res = (
		action      => lc($format),
		-title      => $type,
		'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
		'file_name' => $file_name,
	);
	return %res;
}
2427
2428## ----------------------------------------------------------------------
2429## git utility subroutines, invoking git commands
2430
# Returns, as a list, the path to the core git executable and the --git-dir
# parameter for the current $git_dir.  Every call also bumps the
# $number_of_git_cmds counter.
sub git_cmd {
	++$number_of_git_cmds;
	return ($GIT, "--git-dir=$git_dir");
}
2436
# Quote the given arguments for passing them to the shell: each argument is
# wrapped in single quotes, with embedded ' and ! characters escaped.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $arg (@_) {
		# work on a copy so that the caller's values stay untouched
		(my $word = $arg) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$word'";
	}
	return join(' ', @quoted);
}
2445
# get the full hash that HEAD of the given project resolves to
sub git_get_head_hash {
	my $project = shift;
	return git_get_full_hash($project, 'HEAD');
}
2450
# resolve a revision to its hash; all arguments are handed to
# git_get_hash() unchanged
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2454
# like git_get_full_hash(), but additionally passes '--short=7' as an
# option to git_get_hash()
sub git_get_short_hash {
	my @args = (@_, '--short=7');
	return git_get_hash(@args);
}
2458
# Run "git rev-parse --verify -q [options] <hash>" in the given project.
# $project - project path, relative to $projectroot
# $hash    - revision to resolve
# @options - extra options for git-rev-parse
# $git_dir is pointed at the project for the duration of the call and set
# back afterwards, but only if it had a defined value before.
# Returns the first line of output without its line ending, or undef.
sub git_get_hash {
	my ($project, $hash, @options) = @_;
	my $saved_git_dir = $git_dir;
	my $result;

	$git_dir = "$projectroot/$project";
	my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
	if (open my $fd, '-|', @cmd) {
		$result = <$fd>;
		chomp $result if defined $result;
		close $fd;
	}

	$git_dir = $saved_git_dir
		if (defined $saved_git_dir);
	return $result;
}
2475
# Get the type of the given object, as printed by "git cat-file -t".
# Returns nothing if the command cannot be started or closing the pipe
# reports a failure.
sub git_get_type {
	my ($hash) = @_;

	my @cmd = (git_cmd(), "cat-file", '-t', $hash);
	open(my $fd, "-|", @cmd)
		or return;
	my $type = <$fd>;
	return unless close $fd;

	chomp $type;
	return $type;
}
2486
# repository configuration
# $config_file records, as "$git_dir/config", which repository the cached
# %config belongs to; it starts out empty so that the first lookup in
# git_get_project_config() loads the configuration
our $config_file = '';
# cached configuration of that repository, keyed by full variable name
# (e.g. "gitweb.owner")
our %config;
2490
# Add $value under $key in the hash referenced by $hash, keeping multiple
# values for a single key as an anonymous array reference.
# A single value is stored directly in the hash, not as [ <value> ]; the
# second value turns the entry into an array, later ones are appended.
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key}) {
		if (ref $hash->{$key}) {
			# already an array of values
			push @{$hash->{$key}}, $value;
		} else {
			# second value: promote the scalar to an array
			$hash->{$key} = [ $hash->{$key}, $value ];
		}
	} else {
		$hash->{$key} = $value;
	}
}
2504
# Return a hash of the git configuration of the current project, as listed
# by "git config -z -l", optionally limited to some section, e.g. 'gitweb'.
# $section_regexp - optional regexp (without anchors); when given, only keys
#                   of the form "<section>.<rest>" whose section matches
#                   are returned
# A key that occurs more than once maps to an array reference holding all
# of its values (see hash_set_multi); a key listed without a value maps
# to undef.
# Returns an empty list if the git command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compile the section filter once per call.  Do not use the /o modifier
	# for this: it compiles the pattern once per process, so a later call
	# with a different section would keep filtering on the first one.
	my $key_filter = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	# with -z every entry is terminated by NUL
	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# key and value are separated by the first newline
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $key_filter || $key =~ $key_filter);
	}
	close $fh;

	return %config;
}
2527
# Interpret a config value as a boolean; the result is a true or false
# Perl value.
# No value at all (undef), a number other than 0, 'true' and 'yes' (in any
# letter case) are true; all other values are treated as false, never as
# an error.
sub config_to_bool {
	my ($val) = @_;

	# section.key (without a value)
	return 1 unless defined $val;

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	# section.key = 1
	return $val if ($val =~ /^\d+$/ && $val);
	# section.key = true
	return $val =~ /^(?:true|yes)$/i;
}
2543
# Convert a config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (in either case) will cause
# the value to be multiplied by 1024, 1048576, or 1073741824.
# Leading and trailing whitespace is ignored.  A value that does not have
# the "<digits><suffix>" form is returned as is (after trimming), and an
# undefined value (a key without a value) is returned as undef.
sub config_to_int {
	my $val = shift;

	# a key without a value has nothing to convert; hand it back untouched
	# instead of running substitutions on undef
	return $val unless defined $val;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
		# the pattern only lets these three suffixes through
		my %multiplier = (
			'k' =>       1024,
			'm' =>    1048576,
			'g' => 1073741824,
		);
		return $num * $multiplier{lc($unit)};
	}
	return $val;
}
2563
# Convert a config value to an array reference, if needed: a reference is
# returned unchanged, a defined plain value is wrapped in a one-element
# array, and undef gives an empty array.
sub config_to_multi {
	my ($val) = @_;

	return $val if ref($val);
	return [ $val ] if defined($val);
	return [];
}
2570
# Look up a 'gitweb.<key>' variable in the configuration of the current
# repository ($git_dir).
# $key  - variable name, with or without the leading 'gitweb.'
# $type - optional 'bool' or 'int' (a leading '--' is accepted); any other
#         type is ignored
# Returns nothing if $git_dir is not set, the key is empty or contains
# non-word characters, or the variable is not set.  Otherwise returns the
# stored value: as 'true'/'false' for 'bool', converted with
# config_to_int() for 'int', and unchanged without a type.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
		$key = join(".", lc($1), $2, lc($3));
	} else {
		$key = lc($key);
	}
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);

	# type sanity check
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# (re)load the config when the cached one belongs to another repository
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $full_key = "gitweb.$key";
	return unless exists $config{$full_key};

	# ensure given type
	my $value = $config{$full_key};
	if (defined $type) {
		# backward compatibility: 'git config --bool' returns true/false
		return config_to_bool($value) ? 'true' : 'false'
			if ($type eq 'bool');
		return config_to_int($value)
			if ($type eq 'int');
	}
	return $value;
}
2616
# Get the hash of the entry at the given path in the given ref.
# $base - tree-ish to look the path up in
# $path - path of the entry; trailing slashes are ignored
# $type - optional object type (e.g. 'blob', 'tree') the entry must have
# Returns the hash, or undef when the path is missing or empty, there is no
# such entry at $base, the entry is of a different type, or the output of
# git-ls-tree is not of the expected form.
# Dies with a 500 error if git-ls-tree cannot be started.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift;
	my $type = shift;

	# test for definedness and length rather than truth:
	# "0" is a perfectly valid file name
	return undef unless (defined $path && length $path);

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# Take the captures from the match itself, and only if it succeeded,
	# so that leftovers of an earlier match are never mistaken for a result.
	# Object names are 40 hex digits (SHA-1) or 64 (SHA-256).
	my ($entry_type, $entry_hash) =
		$line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40}(?:[0-9a-fA-F]{24})?)\t/
		or return undef;

	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2643
# Get the path of the entry with the given hash at the given tree-ish (ref);
# used to get 'from' filename for combined diff (merge commit) for renames.
# $base - tree-ish to search (recursively, including tree entries)
# $hash - full object name to look for
# Returns the path of the first matching entry; nothing if an argument is
# missing, and undef if git-ls-tree cannot be started or nothing matches.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# with -z every entry is terminated by NUL
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
		# The hash is literal text, hence \Q...\E; /s and \z make sure that
		# a path containing newlines (possible with -z) is returned whole.
		if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
			close $fd;
			return $1;
		}
	}
	close $fd;
	return undef;
}
2667
2668## ......................................................................
2669## git utility functions, directly accessing git repository
2670
# Get the value of a config variable either from the file named like the
# variable itself in the repository ($GIT_DIR/$name file), or, when that
# file cannot be opened, from the gitweb.$name configuration variable in
# the repository config file.
# $path - project path, relative to $projectroot; $git_dir is set from it
# $name - name of the file / variable
# Only the first line of the file is used, without its line ending.
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open($fd, '<', "$git_dir/$name")) {
		return git_get_project_config($name);
	}
	my $conf = <$fd>;
	close $fd;

	chomp $conf if (defined $conf);
	return $conf;
}
2687
# description of the project at $path: taken from its 'description' file,
# or else from the gitweb.description config variable
sub git_get_project_description {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'description');
}
2692
# category of the project at $path: taken from its 'category' file,
# or else from the gitweb.category config variable
sub git_get_project_category {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'category');
}
2697
2698
# Collect the content tags ('ctags') of a project together with their weights.
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
# $project - project path, relative to $projectroot; $git_dir is set from it
# Returns a hash reference mapping tag name to weight.
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			my $val = <$ct>;
			# reading an empty file yields undef, not a line
			chomp $val if defined $val;
			close $ct;

			(my $ctag = $tagfile) =~ s#.*/##;
			# only a purely numeric first line is a weight; an empty file
			# or any other contents give the tag weight 1
			if (defined $val && $val =~ /^\d+$/) {
				$ctags->{$ctag} = $val;
			} else {
				$ctags->{$ctag} = 1;
			}
		}
		closedir $dh;

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2745
# Sum up the content tags of all given projects.
# $projects - reference to an array of project hashes with a 'ctags' field
# Returns a hash reference, where keys are content tags ('ctags') and
# values are the sum of weights of the given tag in every project.
sub git_gather_all_ctags {
	my $projects = shift;
	my %sum;

	for my $proj (@$projects) {
		$sum{$_} += $proj->{'ctags'}{$_}
			foreach keys %{$proj->{'ctags'}};
	}

	return \%sum;
}
2760
# Prepare the data for a tag cloud out of a hash of tag weights.
# $ctags - hash reference mapping tag name to weight
# Tags differing only in letter case are merged.  The title of the tag
# equal to the 'by_tag' CGI parameter is wrapped in a "match" span.
# Returns an HTML::TagCloud object if that module can be loaded, otherwise
# a hash reference mapping each lowercased tag to { count, ctag }, where
# 'ctag' is a ready-made link.
sub git_populate_project_tagcloud {
	my $ctags = shift;

	# First, merge different-cased tags; tags vote on casing: the spelling
	# with the largest weight provides the displayed name
	my %merged;
	foreach my $tag (keys %$ctags) {
		my $weight = $ctags->{$tag};
		my $entry  = ($merged{lc $tag} ||= {});
		$entry->{count} += $weight;
		if (!$entry->{topcount} || $entry->{topcount} < $weight) {
			$entry->{topcount} = $weight;
			$entry->{topname}  = $tag;
		}
	}

	my $matched = $cgi->param('by_tag');
	# wrap the title of the currently selected tag, leave others alone
	my $mark_match = sub {
		my ($ctag, $title) = @_;
		return $title
			unless (defined $matched && $matched eq $ctag);
		return qq(<span class="match">$title</span>);
	};

	unless (eval { require HTML::TagCloud; 1; }) {
		# no HTML::TagCloud: build plain links ourselves
		my %cloud;
		foreach my $ctag (keys %merged) {
			my $title = esc_html($merged{$ctag}->{topname}, -nbsp=>1);
			$title = $mark_match->($ctag, $title);
			$cloud{$ctag}{count} = $merged{$ctag}->{count};
			$cloud{$ctag}{ctag} =
				$cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
		}
		return \%cloud;
	}

	my $cloud = HTML::TagCloud->new;
	foreach my $ctag (sort keys %merged) {
		# Pad the title with spaces so that the cloud looks
		# less crammed.
		my $title = esc_html($merged{$ctag}->{topname});
		$title =~ s/ /&nbsp;/g;
		$title =~ s/^/&nbsp;/g;
		$title =~ s/$/&nbsp;/g;
		$title = $mark_match->($ctag, $title);
		$cloud->add($title, href(project=>undef, ctag=>$ctag),
		            $merged{$ctag}->{count});
	}
	return $cloud;
}
2806
# Render a tag cloud prepared by git_populate_project_tagcloud().
# $cloud - an HTML::TagCloud object, or the fallback hash reference
# $count - number of tags to show
# Returns the HTML of the cloud.
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;

	return $cloud->html_and_css($count)
		if (ref $cloud eq 'HTML::TagCloud');

	# fallback: a comma-separated list of the first $count tags, ordered
	# by ascending count
	# NOTE(review): ascending order keeps the tags with the lowest counts;
	# confirm whether the most popular ones were meant to be shown
	my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
	my @shown = splice(@tags, 0, $count);
	my $align = $project ? '' : ' align="center"';

	return '<div id="htmltagcloud"' . $align . '>' .
	       join(', ', map { $cloud->{$_}->{'ctag'} } @shown) .
	       '</div>';
}
2821
# Get the list of URLs of the project at $path: the lines of its 'cloneurl'
# file, or, when that file cannot be opened, the values of the multi-valued
# gitweb.url config variable.
# $git_dir is set from $path as a side effect.
# Returns a list in list context and an array reference otherwise.
sub git_get_project_url_list {
	my $path = shift;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open($fd, '<', "$git_dir/cloneurl")) {
		my $config_urls = config_to_multi(git_get_project_config('url'));
		return wantarray ? @$config_urls : $config_urls;
	}

	my @git_project_url_list = <$fd>;
	chomp @git_project_url_list;
	close $fd;

	return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2835
# Build the list of projects that may be shown.
# $filter   - optional path prefix; only projects below "$filter/" are listed
# $paranoid - when true (and $filter is set), the whole $projects_list
#             directory is scanned and the filter is applied to each path
#             found, instead of starting the scan in the filtered subdirectory
# $projects_list is either a directory, which is searched for repositories,
# or a file with one url-encoded "<path> <owner>" entry per line.
# Returns a list of hash references with a 'path' key (and an 'owner' key
# when read from a file), one for every entry accepted by check_export_ok();
# returns nothing if the projects file cannot be opened.
sub git_get_projects_list {
	my $filter = shift || '';
	my $paranoid = shift;
	my @list;

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list;
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);
		# when filtering, search only given subdirectory
		if ($filter && !$paranoid) {
			$dir .= "/$filter";
			$dir =~ s!/+$!!;
		}

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => sub {
				# global variables
				our $project_maxdepth;
				our $projectroot;
				# skip project-list toplevel, if we get it.
				return if (m!^[/.]$!);
				# only directories can be git repositories
				return unless (-d $_);
				# don't traverse too deep (Find is super slow on os x)
				# $project_maxdepth excludes depth of $projectroot
				if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
					$File::Find::prune = 1;
					return;
				}

				my $path = substr($File::Find::name, $pfxlen + 1);
				# paranoidly only filter here
				if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
					# this is a callback, not a loop body: leave it with
					# return; 'next' would exit the subroutine through
					# whatever loop File::Find happens to be running
					return;
				}
				# we check related file in $projectroot
				if (check_export_ok("$projectroot/$path")) {
					push @list, { path => $path };
					$File::Find::prune = 1;
				}
			},
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		open my $fd, '<', $projects_list or return;
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			$path = unescape($path);
			$owner = unescape($owner);
			# blank line
			if (!defined $path) {
				next;
			}
			# if $filter is provided, check if $path begins with $filter
			if ($filter && $path !~ m!^\Q$filter\E/!) {
				next;
			}
			if (check_export_ok("$projectroot/$path")) {
				my $pr = {
					path => $path,
					owner => to_utf8($owner),
				};
				push @list, $pr;
			}
		}
		close $fd;
	}
	return @list;
}
2917
# Remove forks from a list of projects.
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
# $projects - reference to an array of project hashes with a 'path' field
# A project is a fork if its path lies below the directory named after
# another project ('repo/...' for 'repo.git'), provided that directory
# exists under $projectroot.
# As a side effect, the 'forks' field of every project that may have forks
# is set to the list of its forks.
# Returns the list of projects that are not forks.
sub filter_forks_from_projects_list {
	my $projects = shift;

	my %trie; # prefix tree of directories (path components)
	# generate trie out of those directories that might contain forks
	foreach my $pr (@$projects) {
		my $path = $pr->{'path'};
		$path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
		next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
		next unless ($path);      # skip '.git' repository: tests, git-instaweb
		next unless (-d "$projectroot/$path"); # containing directory exists
		$pr->{'forks'} = [];      # there can be 0 or more forks of project

		# add to trie: follow the nodes that exist already,
		# create the ones that do not
		my $node = \%trie;
		foreach my $dir (split('/', $path)) {
			$node = ($node->{$dir} ||= {});
		}
		# create end marker, store $pr as a data
		$node->{''} = $pr unless (exists $node->{''});
	}

	# filter out forks, by finding shortest prefix match for paths
	my @filtered;
	foreach my $pr (@$projects) {
		# trie lookup
		my $node = \%trie;
		my $is_fork = 0;
		foreach my $dir (split('/', $pr->{'path'})) {
			if (exists $node->{''}) {
				# found [shortest] prefix, is a fork - skip it
				push @{$node->{''}{'forks'}}, $pr;
				$is_fork = 1;
				last;
			}
			# not in trie, cannot have prefix, not a fork
			last unless (exists $node->{$dir});
			# If the dir is there, we just walk one step down the trie.
			$node = $node->{$dir};
		}
		# everything that did not turn out to be a fork is kept, including
		# the case of running out of path components
		push @filtered, $pr unless $is_fork;
	}

	return @filtered;
}
2977
# Filter a list of projects by content tag and/or search text.
# note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled
# $projlist - reference to an array of project hashes
# %opts     - 'tagfilter':  keep only projects having this tag
#                           (compared case-insensitively)
#             'searchtext': keep only projects whose 'path' or 'descr_long'
#                           matches this regexp
# Returns the matching projects; the whole list if neither option is set.
sub search_projects_list {
	my ($projlist, %opts) = @_;
	my ($tagfilter, $searchtext) = @opts{qw(tagfilter searchtext)};

	# nothing to filter on
	return @$projlist
		if (!$tagfilter && !$searchtext);

	my @projects;
	foreach my $pr (@$projlist) {

		if ($tagfilter) {
			my $ctags = $pr->{'ctags'};
			next if (ref($ctags) ne 'HASH');
			my $wanted = lc($tagfilter);
			next if (!grep { lc($_) eq $wanted } keys %$ctags);
		}

		if ($searchtext) {
			next if ($pr->{'path'} !~ /$searchtext/ &&
			         $pr->{'descr_long'} !~ /$searchtext/);
		}

		push @projects, $pr;
	}

	return @projects;
}
3009
# project owners read from the $projects_list file, keyed by project path;
# stays undef until git_get_project_list_from_file() has run
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from $projects_list, if that is a file.
# Does nothing when the owners have been read already.  The table is left
# empty when $projects_list is not a file or cannot be opened.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	if (-f $projects_list) {
		# an unreadable file simply provides no owners; do not go on
		# to read from a handle that was never opened
		open(my $fd, '<', $projects_list)
			or return;
		while (my $line = <$fd>) {
			chomp $line;
			my ($pr, $ow) = split ' ', $line;
			# blank line: there is no project to record an owner for
			next unless defined $pr;
			$pr = unescape($pr);
			$ow = unescape($ow);
			$gitweb_project_owner->{$pr} = to_utf8($ow);
		}
		close $fd;
	}
}
3032
# Get the owner of a project.
# $project - project path, relative to $projectroot; $git_dir is set from it
# The owner is taken from the first source that provides one: the
# $projects_list file, the gitweb.owner config variable, get_file_owner()
# of the repository directory.
# Returns undef when no project is given.
sub git_get_project_owner {
	my ($project) = @_;

	return undef unless $project;
	$git_dir = "$projectroot/$project";

	# read the projects file on first use
	git_get_project_list_from_file()
		unless (defined $gitweb_project_owner);

	my $owner;
	$owner = $gitweb_project_owner->{$project}
		if (exists $gitweb_project_owner->{$project});
	$owner = git_get_project_config('owner')
		unless (defined $owner);
	$owner = get_file_owner("$git_dir")
		unless (defined $owner);

	return $owner;
}
3056
# Find out when the project at $path was last committed to, based on the
# committer line of the most recently committed ref below refs/heads.
# $git_dir is set from $path as a side effect.
# Returns (age in seconds, age as a string); (undef, undef) if there is no
# such line or no timestamp can be found in it; nothing if git-for-each-ref
# cannot be started or closing the pipe reports a failure.
sub git_get_last_activity {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";
	my @cmd = (git_cmd(), 'for-each-ref',
	           '--format=%(committer)',
	           '--sort=-committerdate',
	           '--count=1',
	           'refs/heads');
	open(my $fd, "-|", @cmd) or return;
	my $most_recent = <$fd>;
	close $fd or return;

	# the line is expected to end in "<timestamp> <timezone offset>"
	return (undef, undef)
		unless (defined $most_recent &&
		        $most_recent =~ / (\d+) [-+][01]\d\d\d$/);

	my $age = time() - $1;
	return ($age, age_string($age));
}
3077
# Return the remotes reported by 'git remote -v' as a hash (a hash reference
# in scalar context): remote name => { 'heads' => undef, <key> => <url> },
# where <key> is the word git prints in parentheses after the URL.  When
# $wanted is given, only that remote is included.  Returns nothing if the
# command could not be started or closing the pipe failed.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and stop if
# and when we find what we want.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # check open's own return value rather than the handle variable
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # strip "\t<url> (<key>)" leaving the bare remote name;
                # ignore lines that do not have that shape, so that stale
                # capture variables are never used
                $remote =~ s!\t(.*?)\s+\((\w+)\)$!!
                        or next;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # 'heads' starts out undefined (explicitly, to avoid an
                # odd-sized hash constructor)
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3102
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
# Each remote's 'heads' entry becomes a reference to the list of head
# records whose name starts with "<remote>/"; that prefix is removed from
# the record's 'name' in the process.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q...\E: the remote name is literal text, not a pattern
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3115
# Read 'git show-ref --dereference' and return a reference to a hash that
# maps each object id to the list of ref names (without the leading
# 'refs/') pointing at it.  An optional $type (e.g. "heads") restricts
# the listing to refs/$type.  Returns nothing if git could not be run or
# closing the pipe failed.
sub git_get_references {
        my $type = shift || "";
        my %refs;
        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                # autovivifies the list on the first ref seen for this id
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
3138
# Ask 'git name-rev --tags' for a tag-based name of $hash.
# Returns the part after 'tags/' from git's answer, or undef when $hash is
# false, when git printed nothing, or when the answer is not tag based.
# Returns nothing if git could not be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all: nothing to match against
        return undef unless defined $name_rev;

        # $hash is matched literally, hence \Q...\E
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
3154
3155## ----------------------------------------------------------------------
3156## parse to hash functions
3157
# Break $epoch (seconds since the epoch) into display fields.
# $tz is a '+hhmm' / '-hhmm' offset and defaults to "-0000".
# Returns a hash with UTC based fields (hour, minute, mday, day, month,
# rfc2822, mday-time, iso-8601) and fields shifted by the $tz offset
# (hour_local, minute_local, tz_local, iso-tz).
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my @months = qw(Jan Feb Mar Apr May Jun Jul Aug Sep Oct Nov Dec);
        my @days = qw(Sun Mon Tue Wed Thu Fri Sat);

        # UTC broken-down time
        my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
        my ($day_name, $month_name) = ($days[$wday], $months[$mon]);
        my %date = (
                'hour'      => $hour,
                'minute'    => $min,
                'mday'      => $mday,
                'day'       => $day_name,
                'month'     => $month_name,
                'rfc2822'   => sprintf("%s, %d %s %4d %02d:%02d:%02d +0000",
                                       $day_name, $mday, $month_name,
                                       1900+$year, $hour, $min, $sec),
                'mday-time' => sprintf("%d %s %02d:%02d",
                                       $mday, $month_name, $hour, $min),
                'iso-8601'  => sprintf("%04d-%02d-%02dT%02d:%02d:%02dZ",
                                       1900+$year, 1+$mon, $mday,
                                       $hour, $min, $sec),
        );

        # time shifted by the timezone offset, still formatted via gmtime
        my ($tz_sign, $tz_hour, $tz_min) =
                ($tz =~ m/^([-+])(\d\d)(\d\d)$/);
        my $offset = (($tz_hour*60) + $tz_min)*60;
        $offset = -$offset if $tz_sign eq '-';
        ($sec, $min, $hour, $mday, $mon, $year) = gmtime($epoch + $offset);

        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3191
# Parse the tag object $tag_id via 'git cat-file tag'.
# Returns a hash with 'id', the header fields that were present
# ('object', 'type', 'name', 'author*') and 'comment' (reference to the
# list of remaining lines).  Returns nothing if git could not be run,
# closing the pipe failed, or the object has no 'tag' header.
sub parse_tag {
        my $tag_id = shift;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

        my %tag = ('id' => $tag_id);
        my @comment;
        HEADER:
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                } elsif ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                } elsif ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                } elsif ($line =~ m/--BEGIN/) {
                        # header ran straight into a '--BEGIN' block:
                        # keep that line as part of the comment
                        push @comment, $line;
                        last HEADER;
                } elsif ($line eq "") {
                        # blank line separates header from message
                        last HEADER;
                }
        }
        # everything left on the pipe is the tag message
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
3232
# Parse one record of 'git rev-list --header' output.
#
# $commit_text is the record: a first line holding the commit id
# (followed by parent ids when rev-list was run with --parents), header
# lines, an empty line, then the message indented by four spaces.
# When $withparents is defined, 'parent' header lines are ignored and
# only the ids from the first line are used as parents.
#
# Returns a hash with id, tree, parents, parent, author*/committer*
# fields, title, title_short, comment (reference to the list of message
# lines with the four-space indent removed) and the age* fields.
# Returns nothing for an empty record, a record that does not start with
# an object id, or one without a 'tree' header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # header lines; the loop stops at the empty line before the message
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # the title is the first non-empty message line
        foreach my $line (@commit_lines) {
                # Work on a copy: the loop variable aliases the element of
                # @commit_lines, and the shortening below must not alter
                # the message stored in $co{'comment'}.
                (my $title = $line) =~ s/^    //;
                next if $title eq "";

                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        if (length($title) > 50) {
                                $title =~ s/(http|rsync):\/\///;
                        }
                        if (length($title) > 50) {
                                $title =~ s/(master|www|rsync)\.//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/kernel.org:?//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/\/pub\/scm//;
                        }
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # older than two weeks: show the date first and the age second,
        # otherwise the other way round
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3330
# Parse the single commit $commit_id and return the hash produced by
# parse_commit_text() (parents are taken from 'rev-list --parents').
# Calls die_error(500, ...) if git could not be started.
sub parse_commit {
        my ($commit_id) = @_;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--parents",
                   "--header",
                   "--max-count=1",
                   $commit_id,
                   "--");
        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");
        # all records on the pipe are passed along, followed by the
        # 'with parents' flag
        my @records = <$fd>;
        my %co = parse_commit_text(@records, 1);
        close $fd;

        return %co;
}
3349
# Parse up to $maxcount (default 1) commits reachable from $commit_id,
# skipping the first $skip (default 0), optionally limited to $filename.
# @args are passed to 'git rev-list' before the count options and the
# global @extra_options after them.
# Returns the list of parsed commits (hash references), or a reference to
# that list in scalar context.  Calls die_error(500, ...) if git could
# not be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount ||= 1;
        $skip ||= 0;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--header",
                   @args,
                   "--max-count=$maxcount",
                   "--skip=$skip",
                   @extra_options,
                   $commit_id,
                   "--");
        push @cmd, $filename if $filename;

        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");
        my @cos;
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3377
# parse line of git-diff-tree "raw" output
#
# Three shapes are recognised: an ordinary raw diff line, a combined diff
# line (merge commit) and a bare 40-digit commit id.  Returns the parsed
# fields as a hash (a hash reference in scalar context); the hash is
# empty when the line has none of these shapes.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if (my @plain = ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/)) {
                my $files = pop @plain;
                @res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} = @plain;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $files);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($files);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif (my @combined = ($line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/)) {
                my ($colons, $modes, $ids, $status, $file) = @combined;
                # the last mode / id belongs to the result, the rest to the parents
                my @from_modes = split(' ', $modes);
                my @from_ids = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'} = pop @from_modes;
                $res{'from_mode'} = \@from_modes;
                $res{'to_id'} = pop @from_ids;
                $res{'from_id'} = \@from_ids;
                $res{'status'} = [ split('', $status) ];
                $res{'to_file'} = unquote($file);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3416
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
# A hash reference is handed back unchanged; anything else is passed to
# parse_difftree_raw_line().
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # pre-parsed (or generated by hand)
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3429
# parse line of git-ls-tree output
#
# Options (passed as key/value pairs after the line):
#   -l  the line has the 'ls-tree -l' layout with a size column
#   -z  the name is taken as is instead of being passed through unquote()
# Returns a hash (a hash reference in scalar context) with 'mode', 'type',
# 'hash', 'name' and, with -l, 'size'.  The hash is empty when the line
# does not have the expected layout.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;
        my @fields;

        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                @fields = ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s);
                @res{'mode', 'type', 'hash', 'size', 'name'} = @fields
                        if @fields;
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                @fields = ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);
                @res{'mode', 'type', 'hash', 'name'} = @fields
                        if @fields;
        }

        # Only use the captures of a successful match; on a failed match the
        # capture variables would still hold whatever an earlier match left.
        $res{'name'} = unquote($res{'name'})
                if (@fields && !$opts{'-z'});

        return wantarray ? %res : \%res;
}
3465
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# $diffinfo is a parsed difftree line; $from and $to are hash references
# that receive 'file' and 'href' entries for the pre-image and post-image.
# For a combined diff ($diffinfo->{'nparents'} set) the $from entries are
# lists with one element per parent and @parents supplies the parent ids.
# Uses the globals $hash_parent and $hash as hash_base of the blob links.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the result name when this parent
                        # has no name of its own recorded
                        my $from_file = $diffinfo->{'from_file'}[$i];
                        $from_file = $diffinfo->{'to_file'}
                                unless defined $from_file;
                        $from->{'file'}[$i] = $from_file;

                        if ($diffinfo->{'status'}[$i] eq "A") {
                                # new (added) file: nothing to link to
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        } else {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") {
                        # new (added) file: nothing to link to
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3511
3512## ......................................................................
3513## parse to array of hashes functions
3514
# List refs below refs/<class> for each of @classes (default: 'heads'),
# most recently committed first, using 'git for-each-ref'.
# With a true $limit at most $limit+1 entries are requested.
# Each entry is a hash reference with 'fullname', 'name' (without the
# leading refs/heads/ or refs/remotes/), 'id', 'title', 'epoch' and 'age'.
# Returns the list, or a reference to it in scalar context; returns
# nothing if git could not be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # '<id> <refname> <subject>' NUL '<committer> <epoch> <tz>'
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $fullname, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

                (my $name = $fullname) =~ s!^refs/(?:head|remote)s/!!;
                my $age = $epoch ? age_string(time - $epoch) : "unknown";

                my %ref_item = (
                        'fullname' => $fullname,
                        'name'     => $name,
                        'id'       => $hash,
                        'title'    => ($title || '(no commit message)'),
                        'epoch'    => $epoch,
                        'age'      => $age,
                );
                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3553
# List refs below refs/tags, most recently created first, using
# 'git for-each-ref'.  With a true $limit at most $limit+1 entries are
# requested.
# Each entry is a hash reference with 'fullname', 'name' (without the
# leading refs/tags/), 'type', 'id', 'reftype' and 'refid'; tag objects
# also get 'subject', and tags and commits get 'epoch' and 'age'.
# Returns the list, or a reference to it in scalar context; returns
# nothing if git could not be started.
sub git_get_tags_list {
        my $limit = shift;
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my ($creator, $epoch, $tz) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my %ref_item = (
                        'fullname' => $name,
                        'type'     => $type,
                        'id'       => $id,
                );
                $name =~ s!^refs/tags/!!;
                $ref_item{'name'} = $name;

                # a tag object refers to another object; any other ref
                # type refers to itself
                my $is_tag_object = ($type eq "tag");
                $ref_item{'subject'} = $title if $is_tag_object;
                $ref_item{'reftype'} = $is_tag_object ? $reftype : $type;
                $ref_item{'refid'}   = $is_tag_object ? $refid   : $id;

                if ($is_tag_object || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = $epoch
                                ? age_string(time - $epoch)
                                : "unknown";
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3602
3603## ----------------------------------------------------------------------
3604## filesystem-related functions
3605
# Return the name of the owner of $path: the GECOS field of the owning
# user's passwd entry, cut at the first ',' or ';' and passed through
# to_utf8().  Returns undef when $path cannot be stat()ed or the user has
# no passwd entry / GECOS field.
sub get_file_owner {
        my $path = shift;

        # element 4 of stat() is the owner's uid; without this check a
        # failed stat would make getpwuid() look up uid 0
        my $st_uid = (stat($path))[4];
        return undef unless defined $st_uid;

        # element 6 of getpwuid() is the GECOS field
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3618
# Print the contents of $filename to the currently selected output handle,
# passing each line through to_utf8().
# The file is assumed to exist; if it cannot be opened nothing is printed.
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3627
3628## ......................................................................
3629## mimetype related functions
3630
# Look up the MIME type for $filename in the mime.types style file $mimemap
# ('<mimetype> <ext> <ext> ...' per line, lines starting with '#' are
# comments).  The extension is the text after the last '.' in $filename;
# when an extension is listed more than once the last listing wins.
# Returns undef when $mimemap is not readable, $filename has no extension,
# or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # use the capture only if the match succeeded
        my ($wanted_ext) = ($filename =~ /\.([^.]*)$/)
                or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # lexical loop variable: do not clobber the caller's $_
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/, $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$wanted_ext};
}
3650
# Guess the MIME type of $filename from its extension.
# The file named by $mimetypes_file is consulted first (a relative path is
# taken relative to the current project), then '/etc/mime.types'.
# Returns undef when $filename contains no '.' or nothing matched.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # if it is relative path, it is relative to project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');
        return $mime;
}
3667
# Determine the MIME type of a blob.
# $fd is a filehandle on the blob contents, $filename its (optional) name.
# The extension lookup of mimetype_guess() is tried first; without a
# result and without $fd, $default_blob_plain_mimetype is returned;
# otherwise the -T text heuristic and a few image extensions decide.
sub blob_mimetype {
        my $fd = shift;
        my $filename = shift;

        if ($filename) {
                my $mime = mimetype_guess($filename);
                return $mime if $mime;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;

        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;

        return 'application/octet-stream';
}
3694
# Return the Content-Type value for a blob.
# $type is used when given (true), otherwise blob_mimetype($fd, $file_name)
# decides.  For 'text/plain' the charset from $default_text_plain_charset
# is appended when that variable is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return "$type; charset=$default_text_plain_charset";
}
3705
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# $highlight is the on/off flag, $mimetype is accepted but not consulted,
# $file_name is the path of the file.  The basename (with a trailing '.in'
# removed) is looked up in %highlight_basename, then its extension in
# %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # use the capture only if the match succeeded, otherwise $1 would
        # still hold the result of some earlier match
        $basename =~ /\.([^.]*)$/
                or return undef;
        my $ext = $1 or return undef;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3722
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# When highlighting is requested, $fd is closed and reopened as a pipe
# that feeds the blob named by the global $hash through $highlight_bin.
# Calls die_error(500, ...) if the pipeline could not be started.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight && defined $syntax);

        close $fd;
        # 'git cat-file blob <hash> | <highlighter> <options>', read via
        # the trailing '|'
        my $pipeline =
                quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
                quote_command($highlight_bin).
                " --replace-tabs=8 --fragment --syntax $syntax |";
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3736
3737## ======================================================================
3738## functions printing HTML: header, footer, error page
3739
# Build the page title from the site name and, as far as they are defined,
# the project (or project filter), the action and the file name.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (!defined $project) {
                # no project: at most the project filter is appended
                $title .= " - " . to_utf8($project_filter)
                        if defined $project_filter;
                return $title;
        }
        $title .= " - " . to_utf8($project);

        if (defined $action) {
                $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                if (defined $file_name) {
                        $title .= " - " . esc_path($file_name);
                        # show trees with a trailing slash
                        $title .= "/"
                                if ($action eq "tree" && $file_name !~ m|/$|);
                }
        }

        return $title;
}
3762
# Choose the content type used for HTML pages.
#
# require explicit support from the UA if we are to send the page as
# 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
# we have to do this because MSIE sometimes globs '*/*', pretending to
# support xhtml+xml but choking when it gets what it asked for.
sub get_content_type_html {
        my $accept = $cgi->http('HTTP_ACCEPT');

        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;

        return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3776
# Print the <link rel="alternate"> elements advertising feeds.
# With a project selected: for each of RSS and Atom one link to the feed
# described by get_feed_info() and one to the same feed with
# '--no-merges'.  Without a project: links to the projects index and the
# OPML list.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # Per-format copy of the parameters: the
                        # '--no-merges' option added for the second link
                        # must not carry over to the next format's first
                        # link.
                        my %params = (%href_params, 'action' => $type);
                        $link_attr{'-href'} = href(%params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        $params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3821
# Print the <link> elements of the page head: stylesheets, the feed links
# (only when $status is '200 OK') and the favicon if one is defined.
sub print_header_links {
        my $status = shift;

        # print out each stylesheet that exist, providing backwards capability
        # for those people who defined $stylesheet in a config file
        my @sheets = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
        }
}
3841
# Print the breadcrumb trail shown in the page header:
#   home link / project / action [/ extra]
#
# Options (passed as a hash):
#   -action_extra => string printed verbatim as the last breadcrumb; when
#                    it is given, the action name becomes a link as well.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";

        # Outside of a project only the home link is shown.
        return unless defined $project;

        print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
        if (defined $action) {
                my $action_print = defined $extra
                        ? $cgi->a({-href => href(action=>$action)}, $action)
                        : $action;
                print " / $action_print";
        }
        print " / $extra" if defined $extra;
        print "\n";
}
3862
# Print the search form shown in the page header of a project page.
#
# Reads the globals $searchtext, $hash_base, $hash, $project, $my_uri and
# $search_use_regexp. As a side effect an undefined $searchtext is set to
# the empty string.
sub print_search_form {
        if (!defined $searchtext) {
                $searchtext = "";
        }

        # Revision to search from: hash base, else hash, else HEAD.
        my $search_hash;
        if (defined $hash_base) {
                $search_hash = $hash_base;
        } elsif (defined $hash) {
                $search_hash = $hash;
        } else {
                $search_hash = "HEAD";
        }

        # With the 'pathinfo' feature the project is part of the form's
        # action URL; otherwise it travels in a hidden "p" field.
        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if ($use_pathinfo) {
                $action .= "/".esc_url($project);
        }
        my $project_field = $use_pathinfo
                ? ""
                : $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n";

        # start_form() is the supported spelling; the older startform()
        # alias is no longer provided by recent CGI.pm releases. This also
        # matches the end_form() call that closes the form below.
        print $cgi->start_form(-method => "get", -action => $action) .
              "<div class=\"search\">\n" .
              $project_field .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
              " search:\n",
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
3898
# Print the HTTP header and the opening part of an HTML page: XML prolog,
# <head> contents, optional site header file, logo, breadcrumbs and (for
# project pages with the 'search' feature) the search form.
#
# Parameters:
#   $status  - HTTP status line; a false value means "200 OK"
#   $expires - passed to CGI's header() as -expires
#   %opts    - '-no_http_header' suppresses the HTTP header; the whole
#              hash is also forwarded to print_nav_breadcrumbs()
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        # Advertise the mod_perl version in the generator tag when running
        # under mod_perl.
        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};

        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF

        # Relative stylesheet, favicon etc. URLs only resolve correctly
        # with path_info if an explicit base URL is given.
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my $logo_img = $cgi->img({-src => esc_url($logo),
                                          -width => 72, -height => 27,
                                          -alt => "git",
                                          -class => "logo"});
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $logo_img);
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        # The feature is looked up unconditionally; the form itself is only
        # shown on project pages.
        my $search_enabled = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $search_enabled);
}
3957
# Print the closing part of an HTML page: the footer with the project
# description and feed links (or the OPML/TXT project list links when no
# project is selected), optional timing information, the optional site
# footer file, the JavaScript includes, and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                if (defined $descr) {
                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
                }

                # Without view-specific feed parameters the links get the
                # additional 'generic' class and the title 'log'.
                my %href_params = get_feed_info();
                if (!%href_params) {
                        $feed_class .= ' generic';
                }
                $href_params{'-title'} ||= 'log';

                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        } else {
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                # The URLs replay request parameters and are embedded in a
                # double-quoted JavaScript string, so they are escaped to
                # keep a stray quote or '<' from terminating the string or
                # the script element.
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. esc_attr(href(action=>"blame_data", -replay=>1)) .qq!",\n!.
                      qq!           "!. esc_attr(href()) .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!;
                if (gitweb_check_feature('javascript-actions')) {
                        print qq!       fixLinks();\n!;
                }
                # Timezone setup needs all three configured values.
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                print qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4036
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# The error message is HTML-escaped; the detailed description is printed
# as-is. Remaining arguments are options: they are forwarded to
# git_header_html(), and a true '-error_handler' makes the sub return to
# its caller instead of jumping to DONE_GITWEB.
# A status code outside the list above is sent as "500 Internal Server
# Error" in the HTTP header (the page body still shows the code given).
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # Never hand an undefined status to git_header_html(): it would
        # fall back to "200 OK" and serve the error page as a success.
        my $http_status = exists $http_responses{$status}
                ? $http_responses{$status}
                : $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4080
4081## ----------------------------------------------------------------------
4082## functions printing or outputting HTML: navigation
4083
# Print the navigation bar ("summary | shortlog | log | ...") of a project
# page, followed by an extra line of navigation.
#
# Parameters:
#   $current  - name of the current view; printed as plain text, not a link
#   $suppress - name of a view to leave out (optional)
#   $head     - hash used for the commit/commitdiff links and, for some
#               current views, for the shortlog/log links (optional)
#   $treehead - hash for the tree link (optional)
#   $treebase - hash base for the tree link (optional)
#   $extra    - HTML for the second line, e.g. a pager or format links
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters for every navigation entry
        my %arg;
        $arg{$_} = {action=>$_} foreach @navs;

        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        push @with_head, qw(shortlog log);
                }
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # Custom actions come as (label, link, position) triples; each label
        # is inserted after the entry named by its position.
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                my @extended;
                foreach my $nav (@navs) {
                        push @extended, $nav;
                        push @extended, $label if $nav eq $pos;
                }
                @navs = @extended;

                # expand the %-placeholders of the link template
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @entries, $nav;
                        next;
                }
                push @entries,
                     $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4133
# Returns a submenu for the navigation of the refs views (tags, heads,
# remotes). The current view is shown as plain text instead of a link, and
# the remotes view is listed only if the 'remote_heads' feature is enabled.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @items;
        foreach my $view (@ref_views) {
                push @items, ($view eq $current
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view));
        }
        return join(" | ", @items);
}
4146
# Returns the "first . prev . next" pager as an HTML string.
#
# Parameters:
#   $action        - accepted for the callers' sake, not used here
#   $page          - current page number; "first" and "prev" are links
#                    only when it is greater than 0
#   $has_next_link - true if "next" should be a link
# The links replay the current request with a different 'page' parameter.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my $first_prev = "first &sdot; prev";
        if ($page > 0) {
                $first_prev =
                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
                        " &sdot; " .
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        my $next = "next";
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return $first_prev . " &sdot; " . $next;
}
4172
4173## ......................................................................
4174## functions printing or outputting HTML: div
4175
# Print a <div class="header"> containing a single link.
#
# Parameters:
#   $action    - action the link points to; also the link text when no
#                title is given
#   $title     - link text (used as-is, so it must already be HTML)
#   $hash      - 'hash' parameter of the link, added only if true
#   $hash_base - 'hash_base' parameter of the link, added only if true
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (action => $action);
        $args{'hash'} = $hash if $hash;
        $args{'hash_base'} = $hash_base if $hash_base;

        my $label = $title ? $title : $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
4189
# Returns one table row (class "metadata_url") with the given name in the
# first cell and the URL in the second. Both values are inserted as-is,
# without any escaping.
sub format_repo_url {
        my ($name, $url) = @_;

        return join('',
                '<tr class="metadata_url">',
                "<td>$name</td>",
                "<td>$url</td>",
                "</tr>\n");
}
4194
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed as *handle, \*handle or
# *handle{IO}, or a function reference. In the latter case all following
# parameters will be taken as argument to the content function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        # A handle can arrive in three shapes: a glob reference (\*FH), a
        # bare glob (*FH, for which ref() is empty but a reference to the
        # copy reports GLOB), or an IO object (*FH{IO}), which is blessed
        # into IO::Handle on old perls and into IO::File on newer ones.
        my $is_handle = ref($content) eq 'GLOB'
                || ref($content) eq 'IO::Handle'
                || ref($content) eq 'IO::File'
                || (!ref($content) && ref(\$content) eq 'GLOB');

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                # copy everything that can still be read from the handle
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4232
# Returns the HTML for a timestamp: the RFC 2822 date followed by the
# local time in parentheses, e.g. "<rfc2822> (HH:MM <tz>)".
#
# $date is a hash reference providing the keys 'rfc2822', 'hour_local',
# 'minute_local' and 'tz_local'. If the 'javascript-timezone' feature
# supplies a class name, the RFC 2822 part is wrapped in a span of that
# class; local times before 06:00 are wrapped in a span of class "atnight".
sub format_timestamp_html {
        my ($date) = @_;

        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');
        my $strtime = $datetime_class
                ? qq!<span class="$datetime_class">$date->{'rfc2822'}</span>!
                : $date->{'rfc2822'};

        my $local_hhmm = sprintf('%02d:%02d',
                                 $date->{'hour_local'}, $date->{'minute_local'});
        if ($date->{'hour_local'} < 6) {
                $local_hhmm = qq!<span class="atnight">$local_hhmm</span>!;
        }

        return "$strtime ($local_hhmm $date->{'tz_local'})";
}
4253
# Outputs the author name and date in long form: the author name as a
# search link, the timestamp in square brackets and the avatar, all wrapped
# in one element of class "author_date".
#
# Parameters: a commit hash reference, followed by options. The '-tag'
# option names the wrapping element and defaults to 'div'.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};
        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $author_link = format_search_author($author, "author", esc_html($author));
        my $timestamp = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              "$author_link [$timestamp]$avatar" .
              "</$tag>\n";
}
4268
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
# Each person takes two rows: name, e-mail and avatar (spanning both rows)
# in the first, the timestamp in the second.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') unless @people;

        foreach my $who (@people) {
                my $name = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');
                my $timestamp = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>$name_link $email_link</td>" .
                      "<td rowspan=\"2\">$avatar</td></tr>\n" .
                      "<tr><td></td><td>$timestamp</td></tr>\n";
        }
}
4296
# Print the "[project] / dir / dir / file" path line of a tree or blob
# view, with every directory component linked to its tree view.
#
# Parameters:
#   $name - path of the object within the tree (optional; without it only
#           the link to the tree root is printed)
#   $type - 'blob' links the last component to its plain blob, 'tree'
#           links it to its tree view; anything else prints it as text
#   $hb   - hash base used for all links
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # Compare against the empty string rather than
                        # testing truth, so that a leading directory named
                        # "0" still gets its separator.
                        $fullname .= ($fullname ne '' ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # The last component links to the path this sub was given,
                # the same path its title and link text are derived from.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4334
# Print a commit message as HTML, one line per <br/>.
#
# Parameters: a reference to the array of message lines, followed by
# options:
#   -remove_title     => drop the first line of the message
#   -remove_signoff   => drop sign-off style lines instead of printing
#                        them in a "signoff" span
#   -final_empty_line => end the output with a single empty line
# Runs of empty lines are collapsed into one, and empty lines directly
# after a sign-off style line are not printed.
# Note that the title and leading empty lines are removed from the
# caller's array itself.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # the last non-skipped line was a signoff line
        my $empty = 0;   # the last printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                        }
                        # signoff lines are either printed above or removed
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                }
                # Clear the flag only now: resetting it before the test
                # above would let empty lines after a signoff through.
                $signoff = 0;

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4383
# Return the link target (what the link points to), i.e. the complete
# output of "git cat-file blob <hash>". Returns nothing if the command
# cannot be started or closing its pipe reports a failure.
sub git_get_link_target {
        my ($hash) = @_;

        open(my $fd, "-|", git_cmd(), "cat-file", "blob", $hash)
                or return;
        # slurp the whole output instead of reading a single line
        my $link_target = do { local $/ = undef; <$fd> };
        close($fd)
                or return;

        return $link_target;
}
4401
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# Empty components, '.' and '..' are resolved; a '..' that would lead
# above the top directory makes the link impossible to normalize.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # an undefined or empty basedir means the top (root) tree itself
        # (a directory named "0" is a real directory, hence no truth test)
        my $path = (defined $basedir && $basedir ne '')
                ? $basedir . '/' . $link_target
                : $link_target;

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and ''; the comparison is against the empty
                # string so that a component named "0" is kept
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        # link leads outside repository (outside top dir)
                        return unless @path_parts;
                        pop @path_parts;
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
4441
# print tree entry (row of git_tree), but without encompassing <tr> element
#
# Parameters:
#   $t          - hash reference describing the entry; the keys 'mode',
#                 'type', 'hash' and 'name' are read, and 'size' if present
#   $basedir    - prefix put in front of the entry name to form file names
#   $hash_base  - hash base for the links (optional)
#   $have_blame - true to add a "blame" link for blobs
#
# The format of a table row is: mode list link.  Where mode is the mode of
# the entry, list is the name of the entry, an href, and link is the action
# links of the entry.
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = defined $hash_base ? (hash_base => $hash_base) : ();
        my $type = $t->{'type'};

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        if ($type eq "blob") {
                my $path = "$basedir$t->{'name'}";
                my %blob_args = (action=>"blob", hash=>$t->{'hash'},
                                 file_name=>$path, %base_key);

                print "<td class=\"list\">" .
                        $cgi->a({-href => href(%blob_args), -class => "list"},
                                esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        # for symbolic links also show where they point to,
                        # as a link if the target lies within the tree
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                print " -> " . (defined $norm_target
                                        ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                 file_name=>$norm_target),
                                                   -title => $norm_target}, esc_path($link_target))
                                        : esc_path($link_target));
                        }
                }
                print "</td>\n";

                my @links = ($cgi->a({-href => href(%blob_args)}, "blob"));
                if ($have_blame) {
                        push @links,
                             $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                    file_name=>$path, %base_key)},
                                     "blame");
                }
                if (defined $hash_base) {
                        push @links,
                             $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                    hash=>$t->{'hash'}, file_name=>$path)},
                                     "history");
                }
                push @links,
                     $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                            file_name=>$path)},
                             "raw");
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } elsif ($type eq "tree") {
                my $path = "$basedir$t->{'name'}";
                my %tree_args = (action=>"tree", hash=>$t->{'hash'},
                                 file_name=>$path, %base_key);

                print "<td class=\"list\">" .
                      $cgi->a({-href => href(%tree_args)}, esc_path($t->{'name'})) .
                      "</td>\n";

                my @links = ($cgi->a({-href => href(%tree_args)}, "tree"));
                if (defined $hash_base) {
                        push @links,
                             $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                    file_name=>$path)},
                                     "history");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";

                my $history = '';
                if (defined $hash_base) {
                        $history = $cgi->a({-href => href(action=>"history",
                                                          hash_base=>$hash_base,
                                                          file_name=>"$basedir$t->{'name'}")},
                                           "history");
                }
                print "<td class=\"link\">" . $history . "</td>\n";
        }
}
4534
4535## ......................................................................
4536## functions printing large fragments of HTML
4537
# get pre-image filenames for merge (combined) diff
#
# Replaces $diff->{'from_file'} with an array holding one slot per parent
# ($diff->{'nparents'} of them). The slot is filled, via
# git_get_path_by_hash() on the matching parent and 'from_id', only for
# parents whose status is 'R' or 'C'; all other slots stay undefined.
# Returns $diff itself.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $from_file = $diff->{'from_file'} = [ ];
        # create all slots up front, so the array length equals nparents
        $from_file->[$diff->{'nparents'} - 1] = undef;

        foreach my $i (0 .. $diff->{'nparents'} - 1) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');
                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4554
# is current raw difftree line of file deletion
#
# $diffinfo is a hash reference of a parsed raw diff line. A deletion is
# recognized by a 'to_id' consisting only of zeros, of the full length of
# either a SHA-1 (40) or a SHA-256 (64) object name.
sub is_deleted {
        my $diffinfo = shift;

        my $to_id = $diffinfo->{'to_id'};
        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4561
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# True only if both are defined and name the same 'to_file'.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_known = defined($diffinfo) && defined($patchinfo);
        return $both_known
                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4572
4573
# print the "difftree" table: one row per changed file, with its status
# and links to the blob / blobdiff / blame / history views
# $difftree - arrayref of difftree entries; each entry is handed to
#             parsed_difftree_line() before it is used
# $hash     - used as hash_base for links to the resulting files
# @parents  - parent ids; more than one selects the combined diff layout,
#             $parents[0] is the hash_base for pre-image links otherwise
# Output is printed directly. The global $action decides whether "patch"
# anchor links ('commitdiff') or "diff" links are generated.
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1;  # toggles between "dark" and "light" rows
        my $patchno = 0;    # number used in "patchN" anchors, counted from 1
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent; meanwhile work out which of the
                        # trailing "blob" / "history" links make sense
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # an all-zero mode means that this side does not exist;
                # the corresponding variables are then left undefined
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file exists only in the parent: all links are based on $parent
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # 'to_id' / 'to_file' name the result of the rename or copy,
                        # so they go together with $hash (as in the filename link
                        # above), not with $parent
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4881
# print one chunk of a diff in side-by-side layout
# @_ - list of [ $class, $line ] pairs, $line being ready-to-print HTML
# 'chunk_header' lines are printed at once; 'ctx', 'rem' and 'add' lines
# are collected and printed as "chunk_block" divs whenever the kind of
# line changes, and once more at the end of the chunk.
sub print_sidebyside_diff_chunk {
        my @chunk = @_;
        my (@ctx, @rem, @add);

        return unless @chunk;

        # an 'incomplete' last line might belong to removed lines, added
        # lines or context: give it the class of the line just before it
        foreach my $idx (1 .. $#chunk) {
                next unless $chunk[$idx][0] eq 'incomplete';
                $chunk[$idx][0] = $chunk[$idx-1][0];
        }

        # where lines of each accumulated class are collected
        my %pending_for = ('ctx' => \@ctx, 'rem' => \@rem, 'add' => \@add);

        # context lines are shown on both the old and the new side
        my $flush_context = sub {
                my $body = join '', @ctx;
                print '<div class="chunk_block ctx">' .
                      '<div class="old">' . $body . '</div>' .
                      '<div class="new">' . $body . '</div>' .
                      '</div>';
                @ctx = ();
        };

        # pure removal has only the old side, pure addition only the new
        # side; anything else is assumed to be a change and has both
        my $flush_changes = sub {
                my $kind = !@add ? 'rem'
                         : !@rem ? 'add'
                         :         'chg';
                my $html = '<div class="chunk_block ' . $kind . '">';
                $html .= '<div class="old">' . join('', @rem) . '</div>' if @rem;
                $html .= '<div class="new">' . join('', @add) . '</div>' if @add;
                print $html . '</div>';
                @rem = @add = ();
        };

        # the trailing ["", ""] is a guardian, forcing the final flush
        foreach my $entry (@chunk, ["", ""]) {
                my ($class, $line) = @$entry;

                # print chunk headers
                if ($class && $class eq 'chunk_header') {
                        print $line;
                        next;
                }

                ## print from accumulator when type of class of lines change
                my $no_class = !$class;
                # context ends where a rem/add block starts, or at end of chunk
                $flush_context->()
                        if @ctx && ($no_class || $class eq 'rem' || $class eq 'add');
                # rem/add block ends where context starts, or at end of chunk
                $flush_changes->()
                        if (@rem || @add) && ($no_class || $class eq 'ctx');

                ## adding lines to accumulator
                # guardian value
                last unless $line;

                push @{ $pending_for{$class} }, $line
                        if exists $pending_for{$class};
        }
}
4970
# print the "patchset" div: every patch read from $fd, each one matched
# with its entry in the raw difftree
# $fd           - filehandle the patch text is read from, line by line
# $diff_style   - 'sidebyside' selects side-by-side output (used only for
#                 non-combined diffs); anything else gives inline output
# $difftree     - arrayref of difftree entries; each entry is handed to
#                 parsed_difftree_line() before it is used
# $hash         - not used here; kept for the sake of existing callers
# @hash_parents - parent ids; more than one means combined diff
# Output is printed directly.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;     # index into @$difftree of the current raw line
        my $patch_number = 0;  # number of patches printed so far
        my $patch_line;
        my $diffinfo;
        my $to_name;
        my (%from, %to);
        my @chunk; # for side-by-side diff

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # end of input right after the extended header;
                        # 'last' skips the 'continue' block, so close the div here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                if (!defined $patch_line) {
                        # input ended after the '---' line, without the '+++' line:
                        # there is nothing sensible left to format, so finish the
                        # same way as for end of input after the extended header
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
                        my $diff_classes = "diff";
                        $diff_classes .= " $class" if ($class);
                        $line = "<div class=\"$diff_classes\">$line</div>\n";

                        if ($diff_style eq 'sidebyside' && !$is_combined) {
                                # lines are collected per chunk, and printed when
                                # the next chunk header (or next patch) is reached
                                if ($class eq 'chunk_header') {
                                        print_sidebyside_diff_chunk(@chunk);
                                        @chunk = ( [ $class, $line ] );
                                } else {
                                        push @chunk, [ $class, $line ];
                                }
                        } else {
                                # default 'inline' style and unknown styles
                                print $line;
                        }
                }

        } continue {
                # runs on 'next PATCH' and when the patch simply ends:
                # flush the pending side-by-side chunk, then close the patch
                if (@chunk) {
                        print_sidebyside_diff_chunk(@chunk);
                        @chunk = ();
                }
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
5141
5142# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5143
# complete the info about each project in the list: age, description,
# owner, plus ctags and category when the respective feature / setting
# is turned on; description, owner and category are looked up only if
# not defined already
# projects for which git_get_last_activity() returns nothing are left
# out of the returned list
# NOTE: modifies entries of $projlist in place, but never removes any
sub fill_project_list_info {
        my $projlist = shift;
        my @projects;

        my $show_ctags = gitweb_check_feature('ctags');

 PROJECT:
        foreach my $proj (@$projlist) {
                my @activity = git_get_last_activity($proj->{'path'});
                next PROJECT unless @activity;
                @{$proj}{'age', 'age_string'} = @activity;

                unless (defined $proj->{'descr'}) {
                        my $descr = to_utf8(git_get_project_description($proj->{'path'}) || "");
                        # full text is kept next to the shortened one
                        $proj->{'descr_long'} = $descr;
                        $proj->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }

                $proj->{'owner'} = git_get_project_owner("$proj->{'path'}") || ""
                        unless defined $proj->{'owner'};

                $proj->{'ctags'} = git_get_project_ctags($proj->{'path'})
                        if $show_ctags;

                if ($projects_list_group_categories && !defined $proj->{'category'}) {
                        $proj->{'category'} =
                                to_utf8(git_get_project_category($proj->{'path'}) ||
                                        $project_list_default_category);
                }

                push @projects, $proj;
        }

        return @projects;
}
5183
# Returns the project hashes of @$projlist sorted according to $order.
#
# $projlist - reference to an array of project hashes
# $order    - 'project', 'descr' or 'owner' (string comparison on the
#             'path', 'descr_long' or 'owner' key) or 'age' (numeric
#             comparison on the 'age' key); for any other value, or when
#             $order is undefined, the list is returned in its given order
#
# A project that lacks the sort key is compared as '' (string orders) or
# 0 (age).  This is the value Perl would substitute anyway, but spelling
# it out avoids an "uninitialized value" warning for every comparison,
# e.g. when sorting by age and a project has no age.
sub sort_projects_list {
        my ($projlist, $order) = @_;
        my @projects;

        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );
        my $oi = defined $order ? $order_info{$order} : undef;
        return @$projlist unless defined $oi;

        my $key = $oi->{'key'};
        if ($oi->{'type'} eq 'str') {
                @projects = sort {
                        (defined $a->{$key} ? $a->{$key} : '') cmp
                        (defined $b->{$key} ? $b->{$key} : '')
                } @$projlist;
        } else {
                @projects = sort {
                        (defined $a->{$key} ? $a->{$key} : 0) <=>
                        (defined $b->{$key} ? $b->{$key} : 0)
                } @$projlist;
        }

        return @projects;
}
5204
# Groups the projects $from..$to of @$projlist by their 'category' key.
#
# $from defaults to 0; $to defaults to the last index and is capped at it.
# Returns a hash mapping category name to an array reference of project
# hashes (in list order); in scalar context a reference to that hash.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;
        my $last = $#$projlist;

        $from = 0 unless defined $from;
        $to = $last unless defined $to && $to <= $last;

        my %by_category;
        foreach my $idx ($from .. $to) {
                my $project = $projlist->[$idx];
                push @{ $by_category{ $project->{'category'} } }, $project;
        }

        return wantarray ? %by_category : \%by_category;
}
5221
# prints the 'sort by' <th> element produced by format_sort_th();
# all arguments are handed over to it unchanged
sub print_sort_th {
        my @th_args = @_;
        print format_sort_th(@th_args);
}
5227
# Returns the <th> element for the column that sorts by $name.
#
# $name   - order name this column stands for
# $order  - order currently in effect
# $header - column title; defaults to $name with its first letter
#           upper-cased
#
# The title is plain text when $order equals $name, otherwise it is a
# replay link that switches the order to $name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # this order is already selected: no link needed
        return "<th>$header</th>\n" if $order eq $name;

        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
5244
# Prints one <tr> for each of the projects $from..$to of @$projlist,
# alternating the "dark" and "light" row classes.
#
# $from defaults to 0; $to defaults to the last index and is capped at it.
# With $check_forks set every row starts with an extra cell; for projects
# having a 'forks' entry it holds a "+" marker, which links to the 'forks'
# action when that entry is a non-empty list.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;
        my $last = $#$projlist;

        $from = 0 unless defined $from;
        $to = $last unless defined $to && $to <= $last;

        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                my $path = $pr->{'path'};

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                if ($check_forks) {
                        my $marker = "";
                        if ($pr->{'forks'}) {
                                my $nforks = @{$pr->{'forks'}};
                                $marker = $nforks > 0
                                        ? $cgi->a({-href => href(project=>$path, action=>"forks"),
                                                   -title => "$nforks forks"}, "+")
                                        : $cgi->span({-title => "$nforks forks"}, "+");
                        }
                        print "<td>" . $marker . "</td>\n";
                }

                # name, description and owner cells
                my $name_link = $cgi->a({-href => href(project=>$path, action=>"summary"),
                                         -class => "list"}, esc_html($path));
                my $descr_link = $cgi->a({-href => href(project=>$path, action=>"summary"),
                                          -class => "list", -title => $pr->{'descr_long'}},
                                         esc_html($pr->{'descr'}));
                my $owner = chop_and_escape_str($pr->{'owner'}, 15);
                print "<td>" . $name_link . "</td>\n" .
                      "<td>" . $descr_link . "</td>\n" .
                      "<td><i>" . $owner . "</i></td>\n";

                # age cell and per-project action links
                my $age_css = age_class($pr->{'age'});
                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                my @links = map {
                        my $action = $_;
                        scalar $cgi->a({-href => href(project=>$path, action=>$action)}, $action);
                } qw(summary shortlog log tree);
                if ($pr->{'forks'}) {
                        push @links, scalar $cgi->a({-href => href(project=>$path, action=>"forks")}, "forks");
                }
                print "<td class=\"" . $age_css . "\">" . $age_text . "</td>\n" .
                      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
                      "</tr>\n";
        }
}
5293
# Prints the projects list table for the projects in @$projlist.
#
# $projlist  - reference to an array of project hashes
# $order     - sort order, see sort_projects_list(); defaults to
#              $default_projects_order
# $from, $to - window of the filtered and sorted projects to show;
#              $from defaults to 0, $to to the last index (and is capped
#              at it)
# $extra     - optional HTML, printed in an additional last table row
# $no_header - when true the row of column headers is left out
#
# When the window is empty a "No such projects found" notice is printed
# instead of the table.
sub git_project_list_body {
        # uses global variables $cgi, $searchtext, $default_projects_order
        # and $projects_list_group_categories
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $cgi->param('by_tag') : undef;
        # the forks column is not shown for tag-filtered or searched lists
        $check_forks = undef
                if ($tagfilter || $searchtext);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        @projects = fill_project_list_info(\@projects);
        # searching projects require filling to be run before it
        @projects = search_projects_list(\@projects,
                                         'searchtext' => $searchtext,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $searchtext);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds just that window, re-indexed from 0, so
                # group all of it; applying $from/$to a second time would cut
                # projects off whenever $from > 0
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects with an empty category get no heading row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5380
# Prints the commits $from..$to of @$commitlist in the long 'log' layout:
# for each commit a header line, links to the commit / commitdiff / tree
# views, the authorship and the full log message.
#
# $commitlist - reference to an array of commit hashes; empty hashes are
#               skipped
# $from, $to  - window to print; $from defaults to 0, $to to the last
#               index (and is capped at it)
# $refs       - passed to format_ref_marker() for each commit
# $extra      - optional HTML, printed in a trailing "page_nav" div
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from, like the other *_body subs, instead of always at 0
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5419
# Prints the commits $from..$to of @$commitlist as the rows of a
# "shortlog" table: date, author, subject and a cell of action links.
#
# $from defaults to 0; $to defaults to the last index and is capped at it.
# $refs is passed to format_ref_marker() for each commit.  A defined
# $extra is printed as HTML in an additional last row.
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;
        my $last = $#{$commitlist};

        $from = 0 unless defined $from;
        $to = $last unless defined $to && $to <= $last;

        print "<table class=\"shortlog\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{ $commitlist->[$idx] };
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # date cell (with the age as tooltip) and author cell
                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                # action links; snapshot links are appended when available
                my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $commit_link . " | " . $diff_link . " | " . $tree_link;
                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links
                        if defined $snapshot_links;
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5463
# Prints the commits $from..$to of @$commitlist as the rows of a
# "history" table for the file or directory $file_name.
#
# $from defaults to 0; $to defaults to the last index and is capped at it.
# $refs is passed to format_ref_marker() for each commit.  $ftype is used
# both as the action and as the label of the first link of every row.
# For $ftype 'blob' a "diff to current" link is added when the blob of
# the row's commit differs from $file_hash.  A defined $extra is printed
# as HTML in an additional last row.
# Uses the global variable $hash_base for the "diff to current" link.
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;
        my $last = $#{$commitlist};

        $from = 0 unless defined $from;
        $to = $last if (!defined $to || $to > $last);

        print "<table class=\"history\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{ $commitlist->[$idx] };
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # the shortlog view calls format_author_html('td', \%co, 10) here
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $view_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $view_link . " | " . $diff_link;

                if ($ftype eq 'blob') {
                        my $blob_then = git_get_hash_by_path($commit, $file_name);
                        if (defined $file_hash && defined $blob_then &&
                            $file_hash ne $blob_then) {
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$file_hash, hash_parent=>$blob_then,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5523
# Prints the entries $from..$to of @$taglist as the rows of a "tags"
# table: age, name, subject, a link to the tag object itself (only for
# entries of type "tag") and links to the object the entry refers to.
#
# $from defaults to 0; $to defaults to the last index and is capped at it.
# A defined $extra is printed as HTML in an additional last row.
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;
        my $last = $#{$taglist};

        $from = 0 unless defined $from;
        $to = $last unless defined $to && $to <= $last;

        print "<table class=\"tags\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %tag = %{ $taglist->[$idx] };
                my $comment = $tag{'subject'};
                my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # age cell, left empty when the age is not known
                print(defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n" : "<td></td>\n");

                # name cell, followed by the opening of the subject cell
                my $name_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                                         -class => "list name"}, esc_html($tag{'name'}));
                print "<td>" . $name_link . "</td>\n" .
                      "<td>";
                if (defined $comment) {
                        print format_subject_html($comment, $comment_short,
                                                  href(action=>"tag", hash=>$tag{'id'}));
                }
                print "</td>\n" .
                      "<td class=\"selflink\">";

                # link to the tag object itself
                if ($tag{'type'} eq "tag") {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                } else {
                        print "&nbsp;";
                }

                # links to the referenced object
                my @ref_links = ($cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'}));
                print "</td>\n" .
                      "<td class=\"link\">" . " | " . $ref_links[0];
                if ($tag{'reftype'} eq "commit") {
                        my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
                        my $log_link = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                        print " | " . $shortlog_link .
                              " | " . $log_link;
                } elsif ($tag{'reftype'} eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5586
# Prints the entries $from..$to of @$headlist as the rows of a "heads"
# table: age, name and links to the shortlog / log / tree views.
#
# $headlist  - reference to an array of head hashes ('id', 'age', 'name',
#              'fullname')
# $head      - id of the current head; the name cell of the entry whose
#              'id' equals it gets the "current_head" class.  May be
#              undefined, in which case no entry is marked.
# $from, $to - window to print; $from defaults to 0, $to to the last
#              index (and is capped at it)
# $extra     - optional HTML, printed in an additional last row
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

        print "<table class=\"heads\">\n";
        my $alternate = 1;
        for (my $i = $from; $i <= $to; $i++) {
                my $entry = $headlist->[$i];
                my %ref = %$entry;
                # guard against an undefined $head: comparing against it
                # would emit an "uninitialized value" warning per row
                my $curr = defined $head && $ref{'id'} eq $head;
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td><i>$ref{'age'}</i></td>\n" .
                      ($curr ? "<td class=\"current_head\">" : "<td>") .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                               -class => "list name"},esc_html($ref{'name'})) .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
                      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5624
# Display a single remote block: a table with the URL(s) of the remote,
# followed by the table of its heads.
#
# $remote - name of the remote, used for the "..." link
# $rdata  - hash reference with the keys 'heads' (array reference handed
#           to git_heads_body()), 'fetch' and 'push' (URLs, each may be
#           undefined)
# $limit  - when defined, the largest index passed to git_heads_body(); a
#           "..." link to the 'remotes' view of this remote is added when
#           it is smaller than the number of heads
# $head   - passed through to git_heads_body()
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # a single "URL" row is enough when both URLs are the same;
                # check that $push is defined first, so that a fetch-only
                # remote does not compare against an undefined value
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5658
# Display a list of remote names with the respective fetch and push URLs
#
# $remotedata - hash reference mapping remote name to a hash with the
#               optional keys 'fetch' and 'push' (URLs)
# $limit      - when true and smaller than the number of remotes, only
#               the first $limit remotes (sorted by name) are listed and
#               a "..." link to the 'remotes' view is appended
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        $#remotes = $limit - 1 if $limited;

        # iterate with foreach: a "while (shift)" loop would stop early at
        # a remote whose name is false in boolean context, such as "0"
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # the words are links only when the respective URL is known
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
5702
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
# $remotedata - hash reference mapping remote name to its data hash
# $limit      - when true and smaller than the number of remotes, only
#               the list of remote names is shown; otherwise it is passed
#               on to git_remote_block() for each remote
# $head       - passed through to git_remote_block()
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # walk the remotes sorted by name, as git_remotes_list()
                # does: the order of each() is not stable between runs, and
                # its iterator is reset by any keys() call on the same hash
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
5719
# Prints the result page of a search in commit messages, authors or
# committers (selected by the global $searchtype) for the global
# $searchtext, starting from the global $hash.
#
# Takes the commit the search started from as a flattened hash; its
# 'tree' and 'title' entries are used for the page navigation and the
# header.  Results are shown 100 per page, the page being selected by
# the global $page; one extra commit is requested to find out whether
# there is a next page.
sub git_search_message {
        my %co = @_;

        my %grep_option = (
                'commit'    => "--grep=",
                'author'    => "--author=",
                'committer' => "--committer=",
        );
        my $greptype = $grep_option{$searchtype};
        $greptype .= $searchtext;
        my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $match_mode);

        # "first" and "prev" are links on every page but the first one
        my ($first, $prev) = ("first", "prev");
        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)},
                                 "first");
                $prev = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        # "next" is a link only when the extra commit was found
        my $next_link = '';
        my $next = "next";
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
                $next = $next_link;
        }
        my $paging_nav = join(" &sdot; ", $first, $prev, $next);

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);
        if ($page == 0 && !@commitlist) {
                print "<p>No match.</p>\n";
        } else {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        }

        git_footer_html();
}
5769
# Prints the result page of a pickaxe search: the commits, as reported by
# "git log -S<searchtext>", together with the files they touch.
#
# Takes the commit the search started from as a flattened hash; its
# 'tree' and 'title' entries are used for the page navigation and the
# header.  Uses the globals $searchtext, $search_use_regexp, @diff_opts
# and $hash.  Every commit found gets one table row: date, author, the
# subject followed by one line per listed file, and a cell of links.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        my @pickaxe_opts = ("-S$searchtext");
        push @pickaxe_opts, '--pickaxe-regex' if $search_use_regexp;
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', @pickaxe_opts
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $dark = 1;
        # from here on %co holds the commit whose row is currently open
        undef %co;

        # closes the subject cell of the open row, if there is one, and
        # adds the links cell
        my $close_commit_row = sub {
                return unless %co;
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        my @files;
        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # a new commit starts: finish the previous row first
                        $close_commit_row->();

                        print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                        $dark = !$dark;
                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                      -class => "list subject"},
                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        next;
                }

                next unless defined $set{'to_id'};
                # an all-zero id on the "to" side: nothing to link to
                next if ($set{'to_id'} =~ m/^0{40}$/);

                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                              -class => "list"},
                              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                      "<br/>\n";
        }
        close $fd;

        # finish the row of the last commit
        $close_commit_row->();

        print "</table>\n";

        git_footer_html();
}
5852
# Search the file contents of a commit's tree with "git grep" and print the
# matching lines as an HTML page, grouped per file.
#
# Parameters:
#   %co - parsed commit, passed as a flat key/value list; the 'id', 'tree'
#         and 'title' entries are used here.
#
# Reads the globals $searchtext, $search_use_regexp, $search_regexp, $hash
# and $cgi.  Processing stops once more than 1000 output lines were read,
# in which case a "listing trimmed" notice is printed.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $lastfile = '';
        # Must live outside the loop: it is set only when a new file starts,
        # but every following match line of that file links to it as well.
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                last if ($matches++ > 1000);
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        # with -z the fields are NUL separated: file, line number, text
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                }
                # grepping a tree object makes git-grep report "<tree>:<path>";
                # drop that prefix for both ordinary and binary matches
                $file =~ s/^\Q$co{'tree'}\E://;
                if ($file ne $lastfile) {
                        $lastfile and print "</td></tr>\n";
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        # toggle, so that consecutive files really alternate
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # highlight the matched part of the line
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile) {
                print "</td></tr>\n";
                if ($matches > 1000) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
5929
# Print the result table of a commit-message search.
#
# Parameters:
#   $commitlist - reference to an array of parsed commits (hash references)
#   $from, $to  - first and last index to show; $from defaults to 0 and $to
#                 is clamped to the last index of the list
#   $extra      - optional HTML put into a final table row
#
# For every shown commit, each comment line matching $search_regexp is
# printed with the match highlighted and the surrounding text shortened.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        if (!defined $to || $#{$commitlist} < $to) {
                $to = $#{$commitlist};
        }

        print "<table class=\"commit_search\">\n";
        my $alternate = 1;
        foreach my $idx ($from .. $to) {
                my %commit = %{$commitlist->[$idx]};
                next unless %commit;

                my $row_class = $alternate ? "dark" : "light";
                print "<tr class=\"$row_class\">\n";
                $alternate ^= 1;

                my $subject_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$commit{'id'}),
                                 -class => "list subject"},
                                chop_and_escape_str($commit{'title'}, 50) . "<br/>");
                print "<td title=\"$commit{'age_string_age'}\"><i>$commit{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%commit, 15, 5) .
                      "<td>" .
                      $subject_link;

                foreach my $line (@{$commit{'comment'}}) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        # shorten the match first, then share what is left of
                        # the line budget between leading and trailing context
                        $match = chop_str($match, 70, 5, 'center');
                        my $contextlen = int((80 - length($match))/2);
                        $contextlen = 30 if ($contextlen > 30);
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        print esc_html($lead) .
                              "<span class=\"match\">" . esc_html($match) . "</span>" .
                              esc_html($trail) . "<br />";
                }

                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit{'id'})}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit{'id'})}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit{'tree'}, hash_base=>$commit{'id'})}, "tree") .
                      "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5989
5990## ======================================================================
5991## ======================================================================
5992## actions
5993
# Action 'project_list': print the HTML page listing all projects, with the
# optional $home_text file included on top and a project search form.
#
# The 'order' input parameter, when given, must be exactly one of
# none, project, descr, owner or age; anything else is rejected with 400.
sub git_project_list {
        my $order = $input_params{'order'};
        # anchored, so that values merely containing a valid name are rejected
        if (defined $order && $order !~ m/^(?:none|project|descr|owner|age)$/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        print $cgi->startform(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6019
# Action 'forks': print the list of projects found under the current
# project's name with any trailing ".git" removed.
#
# The 'order' input parameter, when given, must be exactly one of
# none, project, descr, owner or age; anything else is rejected with 400.
sub git_forks {
        my $order = $input_params{'order'};
        # anchored, so that values merely containing a valid name are rejected
        if (defined $order && $order !~ m/^(?:none|project|descr|owner|age)$/) {
                die_error(400, "Unknown order parameter");
        }

        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6039
# Action 'project_index': print a plain-text list of projects, one
# "<path> <owner>" pair per line, with both fields percent-encoded.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                # look the owner up only when the list did not provide it
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                # work on copies, the project entries themselves stay untouched
                my @fields = ($pr->{'path'}, $pr->{'owner'});
                foreach my $field (@fields) {
                        # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$fields[0] $fields[1]\n";
        }
}
6066
# Action 'summary': print the overview page of the current project.
#
# The page consists of a metadata table (description, owner, last change,
# repository URLs, optional content tags), the project's README.html unless
# XSS prevention is on, and shortened shortlog / tags / heads / remotes /
# forks sections.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # The list getters are asked for 16 entries while only 15 + 1 rows
        # (indices 0..15) are shown, which reveals whether there are more.
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata;
        %remotedata = git_get_remotes_list() if $remote_heads;

        my @forklist;
        if (gitweb_check_feature('forks')) {
                # forks are looked up under the project name without ".git"
                (my $filter = $project) =~ s/\.git$//;
                @forklist = git_get_projects_list($filter);
                # filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        # metadata table
        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n";
        print "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
        print "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        if (!@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        my $url_tag = "URL";
        foreach my $git_url (@url_list) {
                next unless $git_url;
                print format_repo_url($url_tag, $git_url);
                # only the first printed URL row carries the label
                $url_tag = "";
        }

        # Tag cloud
        if (gitweb_check_feature('ctags')) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        unless ($prevent_xss) {
                my $readme = "$projectroot/$project/README.html";
                if (-s $readme) {
                        print "<div class=\"title\">readme</div>\n" .
                              "<div class=\"readme\">\n";
                        insert_file($readme);
                        print "\n</div>\n"; # class="readme"
                }
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $#commitlist > 15 ?
                                  $cgi->a({-href => href(action=>"shortlog")}, "...") :
                                  undef);
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $#taglist > 15 ?
                              $cgi->a({-href => href(action=>"tags")}, "...") :
                              undef);
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $#headlist > 15 ?
                               $cgi->a({-href => href(action=>"heads")}, "...") :
                               undef);
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $#forklist > 15 ?
                                      $cgi->a({-href => href(action=>"forks")}, "...") :
                                      undef,
                                      'no_header');
        }

        git_footer_html();
}
6182
# Action 'tag': print the page for the tag object named by $hash: a header
# table linking to the tagged object, the tagger rows when the tag has an
# author, and the tag message.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both links point at the tagged object; its type doubles as the action
        my $object_url = href(action=>$tag{'type'}, hash=>$tag{'object'});
        my $object_link = $cgi->a({-class => "list", -href => $object_url},
                                  $tag{'object'});
        my $type_link = $cgi->a({-href => $object_url}, $tag{'type'});

        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $object_link . "</td>\n" .
              "<td class=\"link\">" . $type_link . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n";

        print "<div class=\"page_body\">";
        foreach my $line (@{$tag{'comment'}}) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6217
# Shared implementation of the 'blame', 'blame_incremental' and 'blame_data'
# actions.
#
# Parameter:
#   $format - 'porcelain' (default), 'incremental' or 'data':
#     porcelain   - runs "git blame -p" and prints the complete blame table;
#     incremental - prints the file contents as a blame table with empty
#                   commit cells (the page states it requires JavaScript);
#     data        - streams "git blame --incremental" output as text/plain,
#                   followed by an "END" line, and returns early.
#
# A 'porcelain' request with a true 'js' CGI parameter is switched to
# 'incremental'.  Errors (feature disabled, missing file name, unknown
# commit or file, non-blob object, failure to start git) are reported
# through die_error().
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact comparison; an undefined type is rejected as well
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # end-of-data marker, optionally followed by timing info
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit and line-number cells are left with empty links
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        # not a header line: skip it instead of printing a row
                        # built from undefined values
                        next LINE unless defined $full_rev;
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        # read the per-commit info lines up to the TAB-prefixed
                        # line holding the contents
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a header with a group size starts a new group of lines:
                        # switch the row color
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell spans all rows of the group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent commit
                        # when one is known, otherwise to this commit itself
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6449
# Action 'blame': blame view using the default format of
# git_blame_common().
sub git_blame {
        return git_blame_common();
}
6453
# Action 'blame_incremental': blame view in 'incremental' format.
sub git_blame_incremental {
        my $format = 'incremental';
        return git_blame_common($format);
}
6457
# Action 'blame_data': blame output in 'data' format.
sub git_blame_data {
        my $format = 'data';
        return git_blame_common($format);
}
6461
# Action 'tags': print the page listing the tags of the current project.
# The tag table is left out when there are no tags.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
        git_print_header_div('summary', $project);

        my @tagslist = git_get_tags_list();
        git_tags_body(\@tagslist) if @tagslist;

        git_footer_html();
}
6474
# Action 'heads': print the page listing the heads of the current project.
# The heads table is left out when there are no heads.
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
        git_print_header_div('summary', $project);

        my @headslist = git_get_heads_list();
        git_heads_body(\@headslist, $head) if @headslist;

        git_footer_html();
}
6487
# Action 'remotes': serves both the view of a single remote (its name is
# taken from the 'hash' input parameter) and the list of all remotes.
# Requires the 'remote_heads' feature to be enabled.
sub git_remotes {
        die_error(403, "Remote heads view is disabled")
                unless gitweb_check_feature('remote_heads');

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        if (!defined $remotedata) {
                die_error(500, "Unable to get remote information");
        }

        if (!%$remotedata) {
                my $message = defined $remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $message);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        my $current_view = $remote ? '' : 'remotes';
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($current_view));

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                # list of all the remotes
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        } else {
                # single remote
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }

        git_footer_html();
}
6520
# Action 'blob_plain': send the raw contents of a blob to the client.
#
# Parameter:
#   $type - optional content type; it is passed to blob_contenttype()
#           together with the file handle and file name, and that call's
#           result is what gets sent.
#
# The blob is taken from $hash, or looked up from $file_name in $hash_base
# (or in HEAD when $hash_base is not set).  Only blobs requested by a full
# 40-digit hexadecimal id get an expiry time.  Lookup and open failures
# are reported through die_error().
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain, and likewise */*+xml when the contents
        # look like text; the subtype in front of "+xml" may be longer than
        # one letter (e.g. image/svg+xml), hence [a-z]+
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                # keep whatever followed the media type (e.g. charset)
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and pass it through without any encoding layer
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6582
# Display a blob as an HTML page ("blob" action).
#
# The blob is named by the global $hash; when $hash is not set it is looked
# up from $file_name in $hash_base (falling back to the head of $project).
# Text is printed line by line with line-number anchors, images are embedded
# through an <img> tag pointing at the blob_plain view, and content that is
# neither text/* nor gif/png/jpeg and tests as binary is handed over to
# git_blob_plain().
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        # $file_name is not set when the blob was requested by hash alone,
        # so leave it out of the error text in that case
        my $blob_desc = defined $file_name ? "$file_name, $hash" : $hash;
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $blob_desc");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        my @links;
                        if ($have_blame) {
                                push @links,
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame");
                        }
                        push @links,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw"),
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                        $formats_nav .= join(" | ", @links);
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                # the URL goes into an attribute value, so escape it the
                # same way as the line-number links below
                print qq! src="! .
                      esc_attr(href(action=>"blob_plain", hash=>$hash,
                                    hash_base=>$hash_base, file_name=>$file_name)) .
                      qq!" />\n!;
        } else {
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
6675
# Render the listing of a tree object ("tree" action).
#
# $hash_base defaults to "HEAD".  The tree is named by the global $hash;
# when $hash is not set it is resolved from $file_name inside $hash_base, or
# is $hash_base itself when no $file_name is given either.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # ls-tree -z separates records with NUL
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD"),
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base does not name a commit: forget it, so that the
                # links generated below do not refer to it
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        # rows alternate between the "dark" and "light" classes, dark first
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                print '<tr class="' . ($alternate ? 'dark' : 'light') . "\">\n";
                $alternate ^= 1;

                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                # An empty result means the parent is the top-level tree.
                # Compare against '' explicitly: a plain truth test would
                # also discard a parent directory that is named "0".
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                print '<tr class="' . ($alternate ? 'dark' : 'light') . "\">\n";
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
6785
# Build the base name "<project>-<version>" for a snapshot of $hash.
#
# The project part is the last path component of $project with a trailing
# ".git" (or "/.git") removed.  The version part depends on what $hash looks
# like: a hex id, a tag ref, or anything else (see below).
# In list context the name is returned twice, in scalar context once.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        (my $stem = to_utf8($project)) =~ s,([^/])/*\.git$,$1,;
        $stem = basename($stem);
        # control characters are replaced by '?'
        $stem =~ s/[[:cntrl:]]/?/g;

        my $ver;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # hex id: use the short hash when $hash is a prefix of the
                # full id and longer than 7 characters, else keep it as given
                my $full_hash = git_get_full_hash($project, $hash);
                $ver = ($full_hash =~ /^$hash/ && length($hash) > 7)
                        ? git_get_short_hash($project, $hash)
                        : $hash;
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tag: the tag name alone is enough
                $ver = $1;
        } else {
                # branch or anything else: name (without the refs/heads/ or
                # refs/remotes/ prefix) followed by the short hash
                $ver = $hash =~ m!^refs/(?:heads|remotes)/(.*)$! ? $1 : $hash;
                $ver .= '-' . git_get_short_hash($project, $hash);
        }
        # hierarchical names: turn path separators into dots
        $ver =~ s{/}{.}g;

        my $snapshot = "$stem-$ver";

        return wantarray ? ($snapshot, $snapshot) : $snapshot;
}
6822
# Send an archive of the tree-ish $hash to the client ("snapshot" action).
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  It has to be a known,
# enabled format that is listed in @snapshot_fmts.  The output of
# "git archive" is optionally piped through the compressor configured for
# the format.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the archiver before anything is written to the client, so
        # that a failure to launch it is reported through die_error() while
        # no "200 OK" header has been sent yet.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # the name goes into a double-quoted header parameter
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # Copy the archive in fixed-size chunks.  The data is binary, so
        # reading it "by line" would only build a large list of arbitrary
        # fragments in memory before anything gets printed.
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6870
# Common driver for log-like views.
#
# Parameters:
#   $fmt_name   - name of the view, passed to format_paging_nav() and
#                 git_print_page_nav()
#   $body_subr  - code reference that prints the commit list
#   $base       - revision to start from (defaults to the project head)
#   $parent     - if defined, only "$parent..$base" is listed
#   $file_name  - if defined, limit the log to this path
#   $file_hash  - object id of that path; looked up in the listed commits
#                 when not given
#
# One page shows 100 commits; 101 are requested so that the presence of a
# following page can be detected.  The global $page is set to 0 if unset.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0 unless defined $page;
        my $refs = git_get_references();

        my $commit_hash = defined $parent ? "$parent..$base" : $base;
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        my $ftype;
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }

        # a 101st commit means that there is another page after this one
        my $has_next_page = $#commitlist >= 100;
        my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
        my $next_link = '';
        if ($has_next_page) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # Read the feature value in list context, as git_commitdiff does.
        # NOTE(review): a scalar-context call presumably yields something
        # other than the configured limit (e.g. an element count) -- confirm
        # against gitweb_get_feature.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # negative limit: link always shown; otherwise only when the
                # listed commits do not exceed the limit
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project);
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6944
# "log" action: hands the globals $hash (as base) and $hash_parent (as
# parent) to git_log_generic(), with git_log_body as the list printer.
sub git_log {
        return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
6949
# Show a single commit ("commit" action): header table with authorship,
# commit/tree/parent ids, the commit message and the list of changed files.
# The commit is $hash, falling back to $hash_base and then to "HEAD".
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
                or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # link to the 'commit' view of the given id, labelled with the
        # first 7 characters of that id
        my $short_commit_link = sub {
                my $id = shift;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav = '(parent: ' . $short_commit_link->($parent) . ')';
        } else {
                # merge commit
                $formats_nav = '(merge: ' .
                        join(' ', map { $short_commit_link->($_) } @$parents) .
                        ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # a commit without parent is compared against the empty tree
        $parent = "--root" unless defined $parent;

        # raw list of changed files; merges use the combined ('-c') format
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        # object header table
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

        # tree row: id linked to the tree view, plus "tree" and snapshot links
        my @tree_view = (action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
        print "<tr>" .
              "<td>tree</td>" .
              "<td class=\"sha1\">" .
              $cgi->a({-href => href(@tree_view),
                       class => "list"}, $co{'tree'}) .
              "</td>" .
              "<td class=\"link\">" .
              $cgi->a({-href => href(@tree_view)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td>" .
              "</tr>\n";

        # one row per parent: id, "commit" link and "diff" against it
        foreach my $par (@$parents) {
                my @parent_view = (action=>"commit", hash=>$par);
                print "<tr>" .
                      "<td>parent</td>" .
                      "<td class=\"sha1\">" .
                      $cgi->a({-href => href(@parent_view),
                               class => "list"}, $par) .
                      "</td>" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(@parent_view)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
                      "</td>" .
                      "</tr>\n";
        }
        print "</table>".
              "</div>\n";

        # commit message
        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7063
# Redirect to the view matching the type of an object ("object" action).
#
# The object is defined by:
# - hash or hash_base alone
# - hash_base and file_name
# Its type is determined with git, and the client is redirected (302) to
# the action of that name.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the command produced no output
                # (stderr is discarded), so only chomp a defined value
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");
                # do not redirect to an empty action
                die_error(404, "Object does not exist")
                        unless defined $type && $type ne '';

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7110
# Show the difference between two versions of a blob ("blobdiff" action).
#
# The optional argument selects the output format: 'html' (default) renders
# a page, 'plain' emits the patch as text/plain.  The blobs are located via
# $hash_base / $hash_parent_base together with either $file_name or $hash.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                # ($hash is matched literally, not as a pattern)
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        # (numeric status code, like every other die_error() call here)
        if (!%diffinfo) {
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # the name goes into a double-quoted header parameter, so
                # embedded '"' and '\' have to be backslash-escaped
                (my $patch_name = "$file_name") =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # In the patch header (everything up to and including the
                # "+++" line) replace object ids used as path names by the
                # real file names.  The ids are quoted so that they are
                # matched literally.
                my $ids = join('|', map { quotemeta } $hash, $hash_parent);
                while (my $line = <$fd>) {
                        $line =~ s!a/(?:$ids)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(?:$ids)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7245
# "blobdiff_plain" action: git_blobdiff() with the 'plain' output format.
sub git_blobdiff_plain {
        return git_blobdiff('plain');
}
7249
# Navigation fragment for switching between diff styles.
#
# It is meant to be appended to navigation that already exists, which is why
# every entry (the first one included) is preceded by " | ": the result
# looks like " | foo | bar" rather than "foo | bar".  The style given in
# $diff_style (default 'inline') is shown as plain text, every other style
# as a link.  Returns "" when $is_combined is true.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # style keys in display order, and the label shown for each of them
        my @order = ('inline', 'sidebyside');
        my %label_of = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my @entries = map {
                $_ eq $diff_style ? $label_of{$_} :
                $cgi->a({-href => href(-replay=>1, diff_style => $_)}, $label_of{$_})
        } @order;

        return join '', map { " | ".$_ } @entries;
}
7270
# Show the changes introduced by a commit, or the difference between
# $hash_parent and $hash when a parent is given.
#
# Named parameters (passed as a flat key => value list):
#   -format => 'html' (default), 'plain' or 'patch'; any other value ends
#              in a 400 "Unknown commitdiff format" error
#   -single => only consulted for 'patch' format when no parent revision
#              is in effect: restrict the output to a single patch
#
# Operates on the request globals $hash, $hash_base and $hash_parent.
# Note that it assigns defaults to them: $hash falls back to $hash_base
# or "HEAD", and $hash_parent becomes '--cc' for a merge commit when no
# parent was requested.
#
# 'patch' format is refused with a 403 error unless the 'patches' feature
# yields a true value; an unknown commit results in a 404 error.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # '-c' and '--cc' are diff-tree options selecting a combined diff,
        # not revisions; they must never be used to build a revision range
        my $is_combined = defined $hash_parent &&
                ($hash_parent eq '-c' || $hash_parent eq '--cc');

        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # mention which parent it is, if it is a parent at all
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit: offer the other combined diff flavour
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                if ($hash_parent && !$is_combined) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        # no usable parent revision (none given, or only a
                        # combined diff marker): describe $hash on its own
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $filename . '"');
                # mail-like pseudo header built from the commit information
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $filename . '"');
        }

        # write patch
        if ($format eq 'html') {
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # slurp the rest of the command output in one go
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7498
# 'commitdiff_plain' action: git_commitdiff() with the 'plain' format.
sub git_commitdiff_plain {
        my %opts = (-format => 'plain');
        return git_commitdiff(%opts);
}
7502
7503# format-patch-style patches
# 'patch' action: git_commitdiff() in 'patch' format with the -single
# flag set.
sub git_patch {
        return git_commitdiff(
                -format => 'patch',
                -single => 1,
        );
}
7507
# 'patches' action: git_commitdiff() in 'patch' format, without the
# -single flag.
sub git_patches {
        my %opts = (-format => 'patch');
        return git_commitdiff(%opts);
}
7511
# 'history' action: delegates to git_log_generic(), using
# git_history_body() as the body printer and passing along the requested
# base revisions, file name and hash.
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
}
7517
# 'search' action: check that the requested kind of search is allowed,
# fill in defaults for the request globals ($searchtype, $hash, $page) and
# hand over to the matching git_search_* routine, which receives the
# parsed commit for $hash as a flat key/value list.
#
# Ends in die_error() when searching (or the chosen search type) is
# disabled (403), when no search text was given or the search type is not
# known (400), or when $hash cannot be parsed as a commit (404).
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');

        # pickaxe may take all resources of your box and run for several minutes
        # with every query - so decide by yourself how public you make this feature
        if ($searchtype eq 'pickaxe' && !gitweb_check_feature('pickaxe')) {
                die_error(403, "Pickaxe search is disabled");
        }
        # grep search might be potentially CPU-intensive, too
        if ($searchtype eq 'grep' && !gitweb_check_feature('grep')) {
                die_error(403, "Grep search is disabled");
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        # search starts at the project's head unless told otherwise
        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => routine doing the actual work
        my %search_sub_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );
        my $search_sub = $search_sub_for{$searchtype};

        return die_error(400, "Unknown search type")
                unless $search_sub;
        return $search_sub->(%co);
}
7562
# 'search_help' action: print a static help page describing the available
# search types.  The sections on 'grep' and 'pickaxe' are only included
# when the respective feature check succeeds.
sub git_search_help {
        git_header_html();
        git_print_page_nav('', '', $hash, $hash, $hash);

        # introduction and the 'commit' search type
        print <<'HELP_INTRO';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        if (gitweb_check_feature('grep')) {
                print <<'HELP_GREP';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        # 'author' and 'committer' search types
        print <<'HELP_PEOPLE';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        if (gitweb_check_feature('pickaxe')) {
                print <<'HELP_PICKAXE';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7606
# 'shortlog' action: delegates to git_log_generic(), using
# git_shortlog_body() as the body printer for the requested revision(s).
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
7611
7612## ......................................................................
7613## feeds (RSS, Atom; OPML)
7614
# Generate a web feed for the current project and print it, HTTP header
# included.
#
# Takes the feed format as its only argument: 'rss' or 'atom' (default
# 'atom'); any other value ends in a 400 error.
#
# The feed is built from up to 150 commits reachable from $hash (or HEAD),
# limited to $file_name if that is set.  When the request carries an
# If-Modified-Since header that can be parsed (HTTP::Date or
# Time::ParseDate, whichever can be loaded) and the newest commit is not
# more recent, only a "304 Not Modified" header is sent.  For HEAD requests
# only the header is sent.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                %latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # date parsing modules are optional; without one of
                        # them $since stays undefined and the full feed is sent
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title contains request parameters and ends up as XML element
        # content below, so it has to be escaped
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (defined $descr) {
                $descr = esc_html($descr);
        } else {
                $descr = esc_html("$project " .
                                  ($format eq 'rss' ? 'RSS' : 'Atom') .
                                  " feed");
        }
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for (my $i = 0; $i <= $#commitlist; $i++) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files; commits for which this fails
                # are left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        # escape a copy: $line aliases the commit's own comment lines
                        print esc_html($line) . "\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        # per-file links: [D]iff, [B]lame, [H]istory
                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
7870
# 'rss' action: git_feed() in RSS format.
sub git_rss {
        my $format = 'rss';
        return git_feed($format);
}
7874
# 'atom' action: git_feed() in Atom format.
sub git_atom {
        my $format = 'atom';
        return git_feed($format);
}
7878
# 'opml' action: print an OPML document with one RSS feed outline per
# project returned by git_get_projects_list() for the current project
# filter.  Ends in a 404 error when that list is empty.  Projects whose
# head hash cannot be determined, or whose head cannot be parsed as a
# commit, are left out.
#
# Note: sets the global $git_dir for every project it looks at.
sub git_opml {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found")
                unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # mention the subdirectory only when a project filter is in effect
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $entry (@projects) {
                my %info = %{$entry};
                my $proj_path = $info{'path'};

                my $head = git_get_head_hash($proj_path);
                next unless defined $head;

                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next unless %co;

                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print qq!<outline type="rss" text="$path" title="$path" xmlUrl="$rss" htmlUrl="$html"/>\n!;
        }

        print <<XML;
</outline>
</body>
</opml>
XML
}