7d36f563e4236ce03acfda403b11f10f4eccf5b1
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8'; # apply the :utf8 output layer to STDOUT
  22
  23our $t0 = [ gettimeofday() ]; # time of day at script start (presumably the baseline for the 'timed' feature -- confirm)
  24our $number_of_git_cmds = 0; # counter; evaluate_git_version() increments it after running git
  25
  26BEGIN {
  27        CGI->compile() if $ENV{'MOD_PERL'}; # only done when the MOD_PERL environment variable is set
  28}
  29
  30our $version = "++GIT_VERSION++"; # "++...++" placeholder; presumably substituted at build time -- confirm
  31
  our ($my_url, $my_uri, $base_url, $path_info, $home_link);

  # Work out the URLs this request was reached under and store them in the
  # package globals $my_url, $my_uri, $base_url, $path_info and $home_link.
  # Takes no arguments; reads the global $cgi object and the PATH_INFO and
  # SCRIPT_NAME environment variables.
  sub evaluate_uri {
          our $cgi;

          our $my_url = $cgi->url();
          our $my_uri = $cgi->url(-absolute => 1);

          # Relative URLs in gitweb ($logo, $favicon, ...) are resolved against
          # $base_url; it is needed and used only for URLs with nonempty PATH_INFO.
          our $base_url = $my_url;

          # If gitweb is the DirectoryIndex, the URL lacks the script name and
          # $cgi->url() does not strip PATH_INFO, so it is stripped here from
          # both $my_url and $my_uri.  $path_info is global because it is also
          # used later on.
          #
          # In that setup $my_url is not the full script URL.  That is wanted for
          # generated links (they keep implying the script name when the request
          # did not spell it out), but it makes $my_url unusable as base URL.
          # So whenever PATH_INFO had to be stripped, and SCRIPT_NAME is known,
          # the base URL is rebuilt from the server part and SCRIPT_NAME.
          our $path_info = $ENV{"PATH_INFO"};
          if ($path_info
              and $my_url =~ s,\Q$path_info\E$,,
              and $my_uri =~ s,\Q$path_info\E$,,
              and defined $ENV{'SCRIPT_NAME'}) {
                  my $server_url = $cgi->url(-base => 1);
                  $base_url = $server_url . $ENV{'SCRIPT_NAME'};
          }

          # target of the home link on top of all pages
          our $home_link = $my_uri ? $my_uri : "/";
  }
  67
  68# core git executable to use;
  69# this can be just "git" if your webserver has a sensible PATH
  70our $GIT = "++GIT_BINDIR++/git";
  71
  72# absolute filesystem path which will be prepended to the project path
  73#our $projectroot = "/pub/scm";
  74our $projectroot = "++GITWEB_PROJECTROOT++";
  75
  76# filesystem traversal depth limit used when collecting the project list;
  77# the number is relative to $projectroot
  78our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  79
  80# text of the home link on top of all pages
  81our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  82
  83# name of your site or organization to appear in page titles;
  84# replace this with something more descriptive for clearer bookmarks
  85our $site_name = "++GITWEB_SITENAME++"
  86                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git"; # fallback: "<SERVER_NAME> Git" or "Untitled Git"
  87
  88# HTML snippet to include in the <head> section of each page
  89our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
  90# filename of HTML text to include at top of each page
  91our $site_header = "++GITWEB_SITE_HEADER++";
  92# HTML text to include at home page
  93our $home_text = "++GITWEB_HOMETEXT++";
  94# filename of HTML text to include at bottom of each page
  95our $site_footer = "++GITWEB_SITE_FOOTER++";
  96
  97# URIs of stylesheets
  98our @stylesheets = ("++GITWEB_CSS++");
  99# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 100our $stylesheet = undef;
 101# URI of GIT logo (72x27 size)
 102our $logo = "++GITWEB_LOGO++";
 103# URI of GIT favicon, assumed to be image/png type
 104our $favicon = "++GITWEB_FAVICON++";
 105# URI of gitweb.js (JavaScript code for gitweb)
 106our $javascript = "++GITWEB_JS++";
 107
 108# URI and label (title) of GIT logo link
 109#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 110#our $logo_label = "git documentation";
 111our $logo_url = "http://git-scm.com/";
 112our $logo_label = "git homepage";
 113
 114# source of projects list
 115our $projects_list = "++GITWEB_LIST++";
 116
 117# the width (in characters) of the projects list "Description" column
 118our $projects_list_description_width = 25;
 119
 120# group projects by category on the projects list
 121# (enabled if this variable evaluates to true)
 122our $projects_list_group_categories = 0;
 123
 124# default category if none specified
 125# (leave the empty string for no category)
 126our $project_list_default_category = "";
 127
 128# default order of projects list;
 129# valid values are none, project, descr, owner, and age
 130our $default_projects_order = "project";
 131
 132# show repository only if this file exists
 133# (only effective if this variable evaluates to true)
 134our $export_ok = "++GITWEB_EXPORT_OK++";
 135
 136# show repository only if this subroutine returns true
 137# when given the path to the project, for example:
 138#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 139our $export_auth_hook = undef;
 140
 141# only allow viewing of repositories also shown on the overview page
 142our $strict_export = "++GITWEB_STRICT_EXPORT++";
 143
 144# list of git base URLs used to build the URLs a project can be fetched from,
 145# i.e. full URL is "$git_base_url/$project"
 146our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++"); # empty entries are dropped
 147
 148# default blob_plain mimetype and default charset for text/plain blob
 149our $default_blob_plain_mimetype = 'text/plain';
 150our $default_text_plain_charset  = undef;
 151
 152# file to use for guessing MIME types before trying /etc/mime.types
 153# (relative to the current git repository)
 154our $mimetypes_file = undef;
 155
 156# assume this charset if a line contains non-UTF-8 characters;
 157# it should be a valid encoding (see Encode::Supported(3pm) for the list)
 158# in which every byte sequence is valid, for example
 159# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 160# could even be 'utf-8' for the old behavior)
 161our $fallback_encoding = 'latin1';
 162
 163# rename detection options for git-diff and git-diff-tree
 164# - default is '-M', with the cost proportional to
 165#   (number of removed files) * (number of new files).
 166# - more costly is '-C' (which implies '-M'), with the cost proportional to
 167#   (number of changed files + number of removed files) * (number of new files)
 168# - even more costly is '-C', '--find-copies-harder' with cost
 169#   (number of files in the original tree) * (number of new files)
 170# - one might want to include '-B' option, e.g. '-B', '-M'
 171our @diff_opts = ('-M'); # taken from git_commit
 172
 173# Disables features that would allow repository owners to inject script into
 174# the gitweb domain.
 175our $prevent_xss = 0;
 176
 177# Path to the highlight executable to use (must be the one from
 178# http://www.andre-simon.de due to assumptions about parameters and output).
 179# Useful if highlight is not installed on your webserver's PATH.
 180# [Default: highlight]
 181our $highlight_bin = "++HIGHLIGHT_BIN++";
 182
 183# information about snapshot formats that gitweb is capable of serving
 184our %known_snapshot_formats = (
 185        # name => {
 186        #       'display' => display name,
 187        #       'type' => mime type,
 188        #       'suffix' => filename suffix,
 189        #       'format' => --format for git-archive,
 190        #       'compressor' => [compressor command and arguments]
 191        #                       (array reference, optional)
 192        #       'disabled' => boolean (optional)}
 193        #
 194        'tgz' => {
 195                'display' => 'tar.gz',
 196                'type' => 'application/x-gzip',
 197                'suffix' => '.tar.gz',
 198                'format' => 'tar',
 199                'compressor' => ['gzip', '-n']},
 200
 201        'tbz2' => {
 202                'display' => 'tar.bz2',
 203                'type' => 'application/x-bzip2',
 204                'suffix' => '.tar.bz2',
 205                'format' => 'tar',
 206                'compressor' => ['bzip2']},
 207
 208        'txz' => {
 209                'display' => 'tar.xz',
 210                'type' => 'application/x-xz',
 211                'suffix' => '.tar.xz',
 212                'format' => 'tar',
 213                'compressor' => ['xz'],
 214                'disabled' => 1},
 215
 216        'zip' => {
 217                'display' => 'zip',
 218                'type' => 'application/x-zip',
 219                'suffix' => '.zip',
 220                'format' => 'zip'},
 221);
 222
 223# Aliases so we understand old gitweb.snapshot values in repository
 224# configuration.  An alias mapped to undef never names a known format,
 225# so filter_snapshot_fmts() drops it.
 226our %known_snapshot_format_aliases = (
 227        'gzip'  => 'tgz',
 228        'bzip2' => 'tbz2',
 229        'xz'    => 'txz',
 230
 231        # backward compatibility: legacy gitweb config support
 232        'x-gzip' => undef, 'gz' => undef,
 233        'x-bzip2' => undef, 'bz2' => undef,
 234        'x-zip' => undef, '' => undef,
 235);
 236
 237# Pixel sizes for icons and avatars. If the default font sizes or line heights
 238# are changed, it may be appropriate to change these values too via
 239# $GITWEB_CONFIG.
 240our %avatar_size = (
 241        'default' => 16,
 242        'double'  => 32
 243);
 244
 245# Used to set the maximum load that we will still respond to gitweb queries.
 246# If the server load exceeds this value then return "503 server busy" error.
 247# If gitweb cannot determine the server load, it is taken to be 0.
 248# Leave it undefined (or set to 'undef') to turn off load checking.
 249our $maxload = 300;
 249
 # configuration for 'highlight' (http://www.andre-simon.de/)
 # match by basename: file basename => name of the syntax to use
 our %highlight_basename = (
         #'Program' => 'py',
         #'Library' => 'py',
         'SConstruct' => 'py', # SCons equivalent of Makefile
         'Makefile' => 'make',
 );
 # match by extension: file extension => name of the syntax to use
 #
 # NOTE: every map below is wrapped in its own parentheses on purpose.
 # map is a list operator, so without the parentheses it would take all
 # the entries that follow it as its input list, and the first
 # map { $_ => $_ } would end up mapping every key to itself
 # (e.g. 'h' => 'h' instead of 'h' => 'c').
 our %highlight_ext = (
         # main extensions, defining name of syntax;
         # see files in /usr/share/highlight/langDefs/ directory
         (map { $_ => $_ }
                 qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make)),
         # alternate extensions, see /etc/highlight/filetypes.conf
         'h' => 'c',
         (map { $_ => 'sh'  } qw(bash zsh ksh)),
         (map { $_ => 'cpp' } qw(cxx c++ cc)),
         (map { $_ => 'php' } qw(php3 php4 php5 phps)),
         (map { $_ => 'pl'  } qw(perl pm)), # perhaps also 'cgi'
         (map { $_ => 'make'} qw(mak mk)),
         (map { $_ => 'xml' } qw(xhtml html htm)),
 );
 273
 274# You define site-wide feature defaults here; override them with
 275# $GITWEB_CONFIG as necessary.
 276our %feature = (
 277        # feature => {
 278        #       'sub' => feature-sub (subroutine),
 279        #       'override' => allow-override (boolean),
 280        #       'default' => [ default options...] (array reference)}
 281        #
 282        # if feature is overridable (it means that allow-override has true value),
 283        # then feature-sub will be called with default options as parameters;
 284        # the list returned by feature-sub is then used instead of the defaults
 285        #
 286        # if there is no 'sub' key (no feature-sub), then feature cannot be
 287        # overridden
 288        #
 289        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 290        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 291        # is enabled
 292
 293        # Enable the 'blame' blob view, showing the last commit that modified
 294        # each line in the file. This can be very CPU-intensive.
 295
 296        # To enable system wide have in $GITWEB_CONFIG
 297        # $feature{'blame'}{'default'} = [1];
 298        # To have project specific config enable override in $GITWEB_CONFIG
 299        # $feature{'blame'}{'override'} = 1;
 300        # and in project config gitweb.blame = 0|1;
 301        'blame' => {
 302                'sub' => sub { feature_bool('blame', @_) },
 303                'override' => 0,
 304                'default' => [0]},
 305
 306        # Enable the 'snapshot' link, providing a compressed archive of any
 307        # tree. This can potentially generate high traffic if you have large
 308        # projects.
 309
 310        # Value is a list of formats defined in %known_snapshot_formats that
 311        # you wish to offer.
 312        # To disable system wide have in $GITWEB_CONFIG
 313        # $feature{'snapshot'}{'default'} = [];
 314        # To have project specific config enable override in $GITWEB_CONFIG
 315        # $feature{'snapshot'}{'override'} = 1;
 316        # and in project config, a comma-separated list of formats or "none"
 317        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 318        'snapshot' => {
 319                'sub' => \&feature_snapshot,
 320                'override' => 0,
 321                'default' => ['tgz']},
 322
 323        # Enable text search, which will list the commits which match author,
 324        # committer or commit text to a given string.  Enabled by default.
 325        # Project specific override is not supported.
 326        #
 327        # Note that this controls all search features, which means that if
 328        # it is disabled, then 'grep' and 'pickaxe' search would also be
 329        # disabled.
 330        'search' => {
 331                'override' => 0,
 332                'default' => [1]},
 333
 334        # Enable grep search, which will list the files in currently selected
 335        # tree containing the given string. Enabled by default. This can be
 336        # potentially CPU-intensive, of course.
 337        # Note that you need to have 'search' feature enabled too.
 338
 339        # To enable system wide have in $GITWEB_CONFIG
 340        # $feature{'grep'}{'default'} = [1];
 341        # To have project specific config enable override in $GITWEB_CONFIG
 342        # $feature{'grep'}{'override'} = 1;
 343        # and in project config gitweb.grep = 0|1;
 344        'grep' => {
 345                'sub' => sub { feature_bool('grep', @_) },
 346                'override' => 0,
 347                'default' => [1]},
 348
 349        # Enable the pickaxe search, which will list the commits that modified
 350        # a given string in a file. This can be a practical and much faster
 351        # alternative to 'blame', but still potentially CPU-intensive.
 352        # Note that you need to have 'search' feature enabled too.
 353
 354        # To enable system wide have in $GITWEB_CONFIG
 355        # $feature{'pickaxe'}{'default'} = [1];
 356        # To have project specific config enable override in $GITWEB_CONFIG
 357        # $feature{'pickaxe'}{'override'} = 1;
 358        # and in project config gitweb.pickaxe = 0|1;
 359        'pickaxe' => {
 360                'sub' => sub { feature_bool('pickaxe', @_) },
 361                'override' => 0,
 362                'default' => [1]},
 363
 364        # Enable showing size of blobs in a 'tree' view, in a separate
 365        # column, similar to what 'ls -l' does.  This costs a bit of IO.
 366
 367        # To disable system wide have in $GITWEB_CONFIG
 368        # $feature{'show-sizes'}{'default'} = [0];
 369        # To have project specific config enable override in $GITWEB_CONFIG
 370        # $feature{'show-sizes'}{'override'} = 1;
 371        # and in project config gitweb.showsizes = 0|1;
 372        'show-sizes' => {
 373                'sub' => sub { feature_bool('showsizes', @_) },
 374                'override' => 0,
 375                'default' => [1]},
 376
 377        # Make gitweb use an alternative format of the URLs which can be
 378        # more readable and natural-looking: project name is embedded
 379        # directly in the path and the query string contains other
 380        # auxiliary information. All gitweb installations recognize
 381        # URL in either format; this configures in which formats gitweb
 382        # generates links.
 383
 384        # To enable system wide have in $GITWEB_CONFIG
 385        # $feature{'pathinfo'}{'default'} = [1];
 386        # Project specific override is not supported.
 387
 388        # Note that you will need to change the default location of CSS,
 389        # favicon, logo and possibly other files to an absolute URL. Also,
 390        # if gitweb.cgi serves as your indexfile, you will need to force
 391        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 392        'pathinfo' => {
 393                'override' => 0,
 394                'default' => [0]},
 395
 396        # Make gitweb consider projects in project root subdirectories
 397        # to be forks of existing projects. Given project $projname.git,
 398        # projects matching $projname/*.git will not be shown in the main
 399        # projects list, instead a '+' mark will be added to $projname
 400        # there and a 'forks' view will be enabled for the project, listing
 401        # all the forks. If project list is taken from a file, forks have
 402        # to be listed after the main project.
 403
 404        # To enable system wide have in $GITWEB_CONFIG
 405        # $feature{'forks'}{'default'} = [1];
 406        # Project specific override is not supported.
 407        'forks' => {
 408                'override' => 0,
 409                'default' => [0]},
 410
 411        # Insert custom links to the action bar of all project pages.
 412        # This enables you mainly to link to third-party scripts integrating
 413        # into gitweb; e.g. git-browser for graphical history representation
 414        # or custom web-based repository administration interface.
 415
 416        # The 'default' value consists of a list of triplets in the form
 417        # (label, link, position) where position is the label after which
 418        # to insert the link and link is a format string where %n expands
 419        # to the project name, %f to the project path within the filesystem,
 420        # %h to the current hash (h gitweb parameter) and %b to the current
 421        # hash base (hb gitweb parameter); %% expands to %.
 422
 423        # To enable system wide have in $GITWEB_CONFIG e.g.
 424        # $feature{'actions'}{'default'} = [('graphiclog',
 425        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 426        # Project specific override is not supported.
 427        'actions' => {
 428                'override' => 0,
 429                'default' => []},
 430
 431        # Allow gitweb to scan project content tags of project repository,
 432        # and display the popular Web 2.0-ish "tag cloud" near the projects
 433        # list.  Note that this is something COMPLETELY different from the
 434        # normal Git tags.
 435
 436        # gitweb by itself can show existing tags, but it does not handle
 437        # tagging itself; you need to do it externally, outside gitweb.
 438        # The format is described in git_get_project_ctags() subroutine.
 439        # You may want to install the HTML::TagCloud Perl module to get
 440        # a pretty tag cloud instead of just a list of tags.
 441
 442        # To enable system wide have in $GITWEB_CONFIG
 443        # $feature{'ctags'}{'default'} = [1];
 444        # Project specific override is not supported.
 445
 446        # In the future whether ctags editing is enabled might depend
 447        # on the value, but using 1 should always mean no editing of ctags.
 448        'ctags' => {
 449                'override' => 0,
 450                'default' => [0]},
 451
 452        # The maximum number of patches in a patchset generated in patch
 453        # view. Set this to 0 or undef to disable patch view, or to a
 454        # negative number to remove any limit.
 455
 456        # To disable system wide have in $GITWEB_CONFIG
 457        # $feature{'patches'}{'default'} = [0];
 458        # To have project specific config enable override in $GITWEB_CONFIG
 459        # $feature{'patches'}{'override'} = 1;
 460        # and in project config gitweb.patches = 0|n;
 461        # where n is the maximum number of patches allowed in a patchset.
 462        'patches' => {
 463                'sub' => \&feature_patches,
 464                'override' => 0,
 465                'default' => [16]},
 466
 467        # Avatar support. When this feature is enabled, views such as
 468        # shortlog or commit will display an avatar associated with
 469        # the email of the committer(s) and/or author(s).
 470
 471        # Currently available providers are gravatar and picon.
 472        # If an unknown provider is specified, the feature is disabled.
 473
 474        # Gravatar depends on Digest::MD5.
 475        # Picon currently relies on the indiana.edu database.
 476
 477        # To enable system wide have in $GITWEB_CONFIG
 478        # $feature{'avatar'}{'default'} = ['<provider>'];
 479        # where <provider> is either gravatar or picon.
 480        # To have project specific config enable override in $GITWEB_CONFIG
 481        # $feature{'avatar'}{'override'} = 1;
 482        # and in project config gitweb.avatar = <provider>;
 483        'avatar' => {
 484                'sub' => \&feature_avatar,
 485                'override' => 0,
 486                'default' => ['']},
 487
 488        # Enable displaying how much time and how many git commands
 489        # it took to generate and display the page.  Disabled by default.
 490        # Project specific override is not supported.
 491        'timed' => {
 492                'override' => 0,
 493                'default' => [0]},
 494
 495        # Enable turning some links into links to actions which require
 496        # JavaScript to run (like 'blame_incremental').  Not enabled by
 497        # default.  Project specific override is currently not supported.
 498        'javascript-actions' => {
 499                'override' => 0,
 500                'default' => [0]},
 501
 502        # Enable and configure ability to change common timezone for dates
 503        # in gitweb output via JavaScript.  Enabled by default.
 504        # Project specific override is not supported.
 505        'javascript-timezone' => {
 506                'override' => 0,
 507                'default' => [
 508                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 509                                     # or undef to turn off this feature
 510                        'gitweb_tz', # name of cookie where to store selected timezone
 511                        'datetime',  # CSS class used to mark up dates for manipulation
 512                ]},
 513
 514        # Syntax highlighting support. This is based on Daniel Svensson's
 515        # and Sham Chukoury's work in gitweb-xmms2.git.
 516        # It requires the 'highlight' program present in $PATH,
 517        # and therefore is disabled by default.
 518
 519        # To enable system wide have in $GITWEB_CONFIG
 520        # $feature{'highlight'}{'default'} = [1];
 521
 522        'highlight' => {
 523                'sub' => sub { feature_bool('highlight', @_) },
 524                'override' => 0,
 525                'default' => [0]},
 526
 527        # Enable displaying of remote heads in the heads list
 528
 529        # To enable system wide have in $GITWEB_CONFIG
 530        # $feature{'remote_heads'}{'default'} = [1];
 531        # To have project specific config enable override in $GITWEB_CONFIG
 532        # $feature{'remote_heads'}{'override'} = 1;
 533        # and in project config gitweb.remote_heads = 0|1;
 534        'remote_heads' => {
 535                'sub' => sub { feature_bool('remote_heads', @_) },
 536                'override' => 0,
 537                'default' => [0]},
 538);
 539
 # Return the list of option values for feature $name.
 #
 # Returns nothing for a name that is not a key of %feature.  The site-wide
 # 'default' list is returned unless the feature has 'override' set and a
 # project is selected ($git_dir defined); in that case the feature-sub is
 # called with the defaults and its result is returned.  An overridable
 # feature without a feature-sub triggers a warning and yields the defaults.
 sub gitweb_get_feature {
         my ($name) = @_;
         return unless exists $feature{$name};

         my $entry    = $feature{$name};
         my $handler  = $entry->{'sub'};
         my @defaults = @{ $entry->{'default'} };

         # project specific override is possible only if we have project
         our $git_dir; # global variable, declared later
         return @defaults
                 unless $entry->{'override'} && defined $git_dir;

         unless (defined $handler) {
                 warn "feature $name is not overridable";
                 return @defaults;
         }
         return $handler->(@defaults);
 }
 558
 # Convenience wrapper returning only the first value of a feature, which
 # for boolean features tells whether the feature is enabled.
 # It lets callers write
 #
 #   my $bool_feat = gitweb_check_feature('bool_feat');
 #   gitweb_check_feature('bool_feat') or somecode;
 #
 # where they would otherwise need
 #
 #   my ($bool_feat) = gitweb_get_feature('bool_feat');
 #   (gitweb_get_feature('bool_feat'))[0] or somecode;
 #
 sub gitweb_check_feature {
         my @values = gitweb_get_feature(@_);
         # list slice (not an array slice): stays empty when @values is empty
         return (@values)[0];
 }
 573
 574
 # Feature-sub for boolean features: look up project config key $key with
 # the '--bool' type.  When the key is not set the site-wide default (first
 # remaining argument) is returned; 'true' gives (1) and 'false' gives (0).
 # Any other value falls off the end without an explicit return.
 sub feature_bool {
         my ($key, $default) = @_;
         my ($configured) = git_get_project_config($key, '--bool');

         return ($default) unless defined $configured;
         return (1) if $configured eq 'true';
         return (0) if $configured eq 'false';
 }
 587
 # Feature-sub for 'snapshot': the arguments are the default formats.
 # A true 'snapshot' value in the project config replaces them: 'none'
 # gives an empty list, anything else is split on commas and/or whitespace.
 sub feature_snapshot {
         my @formats = @_;

         my ($configured) = git_get_project_config('snapshot');
         return @formats unless $configured;

         @formats = $configured eq 'none'
                  ? ()
                  : split(/\s*[,\s]\s*/, $configured);
         return @formats;
 }
 599
 # Feature-sub for 'patches': return whatever the project config holds for
 # 'patches' (read with the '--int' type) if it yields anything, otherwise
 # the first default value.
 sub feature_patches {
         my ($default) = @_;
         my @configured = (git_get_project_config('patches', '--int'));

         return @configured ? @configured : ($default);
 }
 609
 # Feature-sub for 'avatar': return the project config value(s) for 'avatar'
 # when there are any, otherwise the defaults passed in as arguments.
 sub feature_avatar {
         my @defaults   = @_;
         my @configured = (git_get_project_config('avatar'));

         return @configured if @configured;
         return @defaults;
 }
 615
 # Tell whether $dir has a usable HEAD.
 # Testing the HEAD file with -e alone is fragile: in a repository that was
 # initialized long ago (symlink HEAD), then pack-ref'ed and pruned, the
 # symlink may dangle.  Such a HEAD is still accepted when it is a symlink
 # whose target starts with "refs/heads/".
 sub check_head_link {
         my ($dir) = @_;
         my $head_path = "$dir/HEAD";

         return 1 if -e $head_path;
         return (-l $head_path && readlink($head_path) =~ /^refs\/heads\//);
 }
 625
 # Tell whether the repository at $dir may be shown.  All of these must hold:
 #  - check_head_link($dir) is true,
 #  - $export_ok is false, or the file "$dir/$export_ok" exists,
 #  - $export_auth_hook is false, or calling it with $dir returns true.
 sub check_export_ok {
         my ($dir) = @_;
         return (check_head_link($dir)
                 and (not $export_ok or -e "$dir/$export_ok")
                 and (not $export_auth_hook or $export_auth_hook->($dir)));
 }
 632
 # Normalize a list of snapshot format names:
 # first translate alternate names through %known_snapshot_format_aliases
 # (backward compatibility), then keep only the names that are keys of
 # %known_snapshot_formats and are not marked 'disabled'.
 sub filter_snapshot_fmts {
         my @resolved = map {
                 my $name = $_;
                 exists $known_snapshot_format_aliases{$name}
                         ? $known_snapshot_format_aliases{$name}
                         : $name;
         } @_;

         return grep {
                 exists $known_snapshot_formats{$_} &&
                 !$known_snapshot_formats{$_}{'disabled'}
         } @resolved;
 }
 645
 646# If this is set to a code reference, that code is run once per request,
 647# allowing configuration that changes with each request to be updated
 648# while the other code in the config file is run only once.
 649#
 650# Otherwise, if it is false then gitweb would process config file only once;
 651# if it is true then gitweb config would be run for each request.
 652our $per_request_config = 1;
 653
 # Read and run the gitweb config file named by the only parameter.
 #
 # Returns true when the file exists and was processed, and false (empty
 # list / undef) when the name is undefined or no such file exists, which
 # allows chaining calls and using the first file that exists.
 # Dies on errors during parsing of the config file, as those are
 # unrecoverable.
 sub read_config_file {
         my $filename = shift;
         return unless defined $filename;
         return unless -e $filename;

         # "do FILE" searches @INC for a relative name unless it starts with
         # "/", "./" or "../".  The -e test above is relative to the current
         # directory, so anchor the name there as well; otherwise a relative
         # config file is silently skipped when "." is not in @INC (the
         # default since Perl 5.26), or a same-named file found earlier in
         # @INC is run instead.
         require File::Spec;
         my $path = $filename;
         $path = "./$path"
                 unless File::Spec->file_name_is_absolute($path)
                     || $path =~ m{^\.\.?/};

         do $path;
         # die if there are errors parsing config file
         die $@ if $@;
         return 1;
 }
 669
 our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);

 # Determine the config file names (environment variable first, built-in
 # value otherwise) and read them: the common file first, then the
 # per-instance file, or the system-wide file when the per-instance file
 # could not be read.
 sub evaluate_gitweb_config {
         our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
         our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
         our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

         # Protect against duplicated file names, so that no config is read
         # twice.  Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is
         # used, so a duplicate between those two does not matter.
         for my $config_name ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                 $config_name = "" if $config_name eq $GITWEB_CONFIG_COMMON;
         }

         # Common system-wide settings for convenience.
         # Those settings can be overridden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
         read_config_file($GITWEB_CONFIG_COMMON);

         # Use first config file that exists.  This means use the per-instance
         # GITWEB_CONFIG if exists, otherwise use GITWEB_CONFIG_SYSTEM.
         return if read_config_file($GITWEB_CONFIG);
         read_config_file($GITWEB_CONFIG_SYSTEM);
 }
 691
 # Get loadavg of system, to compare against $maxload.
 # Currently it requires '/proc/loadavg' to get the load average.
 # Returns the first field of that file (the 1-minute load average), or 0
 # when the file cannot be opened, is empty, or does not start with a plain
 # non-negative number; 0 means no load checking.
 sub get_loadavg {
         # additional checks for load average should go here for things that
         # don't export /proc/loadavg
         open my $fd, '<', '/proc/loadavg'
                 or return 0;
         my $line = <$fd>;
         close $fd;

         # an empty read would otherwise hand undef to split
         return 0 unless defined $line;

         # The first three columns are the load averages over the last one,
         # five, and 15 minute periods.  The fourth column shows the number of
         # currently running processes and the total number of processes in the
         # m/n format.  The last column displays the last process ID used.
         my ($one_minute) = split(/\s+/, $line);

         # never hand a non-numeric value to the numeric comparison in the caller
         return 0 unless defined $one_minute && $one_minute =~ /^\d+(?:\.\d+)?$/;
         return $one_minute || 0;
 }
 713
 # version of the core git binary
 our $git_version;

 # Run "$GIT --version" and store the reported version in $git_version
 # ("unknown" when the output does not contain "git version ...");
 # the run is counted in $number_of_git_cmds.
 sub evaluate_git_version {
         my $output = qx("$GIT" --version);
         our $git_version = ($output =~ m/git version (.*)$/) ? $1 : "unknown";
         $number_of_git_cmds++;
 }
 720
 # Report a 503 error through die_error() when load checking is enabled
 # ($maxload defined) and the current load average is above $maxload.
 sub check_loadavg {
         die_error(503, "The load average on the server is too high")
                 if defined $maxload and get_loadavg() > $maxload;
 }
 726
 727# ======================================================================
 728# input validation and dispatch
 729
 730# input parameters can be collected from a variety of sources (presently, CGI
 731# and PATH_INFO), so we define an %input_params hash that collects them all
 732# together during validation: this allows subsequent uses (e.g. href()) to be
 733# agnostic of the parameter origin
 734
 735our %input_params = ();
 736
 737# input parameters are stored with the long parameter name as key. This will
 738# also be used in the href subroutine to convert parameters to their CGI
 739# equivalent, and since the href() usage is the most frequent one, we store
 740# the name -> CGI key mapping here, instead of the reverse.
 741#
 742# XXX: Warning: If you touch this, check whether the search form needs
 743# updating, too.
 744
 745our @cgi_param_mapping = (
 746        project => "p",
 747        action => "a",
 748        file_name => "f",
 749        file_parent => "fp",
 750        hash => "h",
 751        hash_parent => "hp",
 752        hash_base => "hb",
 753        hash_parent_base => "hpb",
 754        page => "pg",
 755        order => "o",
 756        searchtext => "s",
 757        searchtype => "st",
 758        snapshot_format => "sf",
 759        extra_options => "opt",
 760        search_use_regexp => "sr",
 761        ctag => "by_tag",
 762        diff_style => "ds",
 763        project_filter => "pf",
 764        # this must be last entry (for manipulation from JavaScript)
 765        javascript => "js"
 766);
 767our %cgi_param_mapping = @cgi_param_mapping; # hash built from the same list, for lookup by long name
 768
 769# we will also need to know the possible actions, for validation
 770our %actions = (
 771        "blame" => \&git_blame,
 772        "blame_incremental" => \&git_blame_incremental,
 773        "blame_data" => \&git_blame_data,
 774        "blobdiff" => \&git_blobdiff,
 775        "blobdiff_plain" => \&git_blobdiff_plain,
 776        "blob" => \&git_blob,
 777        "blob_plain" => \&git_blob_plain,
 778        "commitdiff" => \&git_commitdiff,
 779        "commitdiff_plain" => \&git_commitdiff_plain,
 780        "commit" => \&git_commit,
 781        "forks" => \&git_forks,
 782        "heads" => \&git_heads,
 783        "history" => \&git_history,
 784        "log" => \&git_log,
 785        "patch" => \&git_patch,
 786        "patches" => \&git_patches,
 787        "remotes" => \&git_remotes,
 788        "rss" => \&git_rss,
 789        "atom" => \&git_atom,
 790        "search" => \&git_search,
 791        "search_help" => \&git_search_help,
 792        "shortlog" => \&git_shortlog,
 793        "summary" => \&git_summary,
 794        "tag" => \&git_tag,
 795        "tags" => \&git_tags,
 796        "tree" => \&git_tree,
 797        "snapshot" => \&git_snapshot,
 798        "object" => \&git_object,
 799        # those below don't need $project
 800        "opml" => \&git_opml,
 801        "project_list" => \&git_project_list,
 802        "project_index" => \&git_project_index,
 803);
 804
 805# finally, we have the hash of allowed extra_options for the commands that
 806# allow them
 807our %allowed_options = (
 808        "--no-merges" => [ qw(rss atom log shortlog history) ],
 809);
 810
 811# fill %input_params with the CGI parameters. All values except for 'opt'
 812# should be single values, but opt can be an array. We should probably
 813# build an array of parameters that can be multi-valued, but since for the time
 814# being it's only this one, we just single it out
 815sub evaluate_query_params {
 816        our $cgi;
 817
 818        while (my ($name, $symbol) = each %cgi_param_mapping) {
 819                if ($symbol eq 'opt') {
 820                        $input_params{$name} = [ $cgi->param($symbol) ];
 821                } else {
 822                        $input_params{$name} = $cgi->param($symbol);
 823                }
 824        }
 825}
 826
 827# now read PATH_INFO and update the parameter list for missing parameters
 828sub evaluate_path_info {
 829        return if defined $input_params{'project'};
 830        return if !$path_info;
 831        $path_info =~ s,^/+,,;
 832        return if !$path_info;
 833
 834        # find which part of PATH_INFO is project
 835        my $project = $path_info;
 836        $project =~ s,/+$,,;
 837        while ($project && !check_head_link("$projectroot/$project")) {
 838                $project =~ s,/*[^/]*$,,;
 839        }
 840        return unless $project;
 841        $input_params{'project'} = $project;
 842
 843        # do not change any parameters if an action is given using the query string
 844        return if $input_params{'action'};
 845        $path_info =~ s,^\Q$project\E/*,,;
 846
 847        # next, check if we have an action
 848        my $action = $path_info;
 849        $action =~ s,/.*$,,;
 850        if (exists $actions{$action}) {
 851                $path_info =~ s,^$action/*,,;
 852                $input_params{'action'} = $action;
 853        }
 854
 855        # list of actions that want hash_base instead of hash, but can have no
 856        # pathname (f) parameter
 857        my @wants_base = (
 858                'tree',
 859                'history',
 860        );
 861
 862        # we want to catch, among others
 863        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 864        my ($parentrefname, $parentpathname, $refname, $pathname) =
 865                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 866
 867        # first, analyze the 'current' part
 868        if (defined $pathname) {
 869                # we got "branch:filename" or "branch:dir/"
 870                # we could use git_get_type(branch:pathname), but:
 871                # - it needs $git_dir
 872                # - it does a git() call
 873                # - the convention of terminating directories with a slash
 874                #   makes it superfluous
 875                # - embedding the action in the PATH_INFO would make it even
 876                #   more superfluous
 877                $pathname =~ s,^/+,,;
 878                if (!$pathname || substr($pathname, -1) eq "/") {
 879                        $input_params{'action'} ||= "tree";
 880                        $pathname =~ s,/$,,;
 881                } else {
 882                        # the default action depends on whether we had parent info
 883                        # or not
 884                        if ($parentrefname) {
 885                                $input_params{'action'} ||= "blobdiff_plain";
 886                        } else {
 887                                $input_params{'action'} ||= "blob_plain";
 888                        }
 889                }
 890                $input_params{'hash_base'} ||= $refname;
 891                $input_params{'file_name'} ||= $pathname;
 892        } elsif (defined $refname) {
 893                # we got "branch". In this case we have to choose if we have to
 894                # set hash or hash_base.
 895                #
 896                # Most of the actions without a pathname only want hash to be
 897                # set, except for the ones specified in @wants_base that want
 898                # hash_base instead. It should also be noted that hand-crafted
 899                # links having 'history' as an action and no pathname or hash
 900                # set will fail, but that happens regardless of PATH_INFO.
 901                if (defined $parentrefname) {
 902                        # if there is parent let the default be 'shortlog' action
 903                        # (for http://git.example.com/repo.git/A..B links); if there
 904                        # is no parent, dispatch will detect type of object and set
 905                        # action appropriately if required (if action is not set)
 906                        $input_params{'action'} ||= "shortlog";
 907                }
 908                if ($input_params{'action'} &&
 909                    grep { $_ eq $input_params{'action'} } @wants_base) {
 910                        $input_params{'hash_base'} ||= $refname;
 911                } else {
 912                        $input_params{'hash'} ||= $refname;
 913                }
 914        }
 915
 916        # next, handle the 'parent' part, if present
 917        if (defined $parentrefname) {
 918                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 919                # someproject/blobdiff/oldrev..newrev:/filename
 920                if ($parentpathname) {
 921                        $parentpathname =~ s,^/+,,;
 922                        $parentpathname =~ s,/$,,;
 923                        $input_params{'file_parent'} ||= $parentpathname;
 924                } else {
 925                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 926                }
 927                # we assume that hash_parent_base is wanted if a path was specified,
 928                # or if the action wants hash_base instead of hash
 929                if (defined $input_params{'file_parent'} ||
 930                        grep { $_ eq $input_params{'action'} } @wants_base) {
 931                        $input_params{'hash_parent_base'} ||= $parentrefname;
 932                } else {
 933                        $input_params{'hash_parent'} ||= $parentrefname;
 934                }
 935        }
 936
 937        # for the snapshot action, we allow URLs in the form
 938        # $project/snapshot/$hash.ext
 939        # where .ext determines the snapshot and gets removed from the
 940        # passed $refname to provide the $hash.
 941        #
 942        # To be able to tell that $refname includes the format extension, we
 943        # require the following two conditions to be satisfied:
 944        # - the hash input parameter MUST have been set from the $refname part
 945        #   of the URL (i.e. they must be equal)
 946        # - the snapshot format MUST NOT have been defined already (e.g. from
 947        #   CGI parameter sf)
 948        # It's also useless to try any matching unless $refname has a dot,
 949        # so we check for that too
 950        if (defined $input_params{'action'} &&
 951                $input_params{'action'} eq 'snapshot' &&
 952                defined $refname && index($refname, '.') != -1 &&
 953                $refname eq $input_params{'hash'} &&
 954                !defined $input_params{'snapshot_format'}) {
 955                # We loop over the known snapshot formats, checking for
 956                # extensions. Allowed extensions are both the defined suffix
 957                # (which includes the initial dot already) and the snapshot
 958                # format key itself, with a prepended dot
 959                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 960                        my $hash = $refname;
 961                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 962                                next;
 963                        }
 964                        my $sfx = $1;
 965                        # a valid suffix was found, so set the snapshot format
 966                        # and reset the hash parameter
 967                        $input_params{'snapshot_format'} = $fmt;
 968                        $input_params{'hash'} = $hash;
 969                        # we also set the format suffix to the one requested
 970                        # in the URL: this way a request for e.g. .tgz returns
 971                        # a .tgz instead of a .tar.gz
 972                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 973                        last;
 974                }
 975        }
 976}
 977
 978our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 979     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 980     $searchtext, $search_regexp, $project_filter);
 981sub evaluate_and_validate_params {
 982        our $action = $input_params{'action'};
 983        if (defined $action) {
 984                if (!validate_action($action)) {
 985                        die_error(400, "Invalid action parameter");
 986                }
 987        }
 988
 989        # parameters which are pathnames
 990        our $project = $input_params{'project'};
 991        if (defined $project) {
 992                if (!validate_project($project)) {
 993                        undef $project;
 994                        die_error(404, "No such project");
 995                }
 996        }
 997
 998        our $project_filter = $input_params{'project_filter'};
 999        if (defined $project_filter) {
1000                if (!validate_pathname($project_filter)) {
1001                        die_error(404, "Invalid project_filter parameter");
1002                }
1003        }
1004
1005        our $file_name = $input_params{'file_name'};
1006        if (defined $file_name) {
1007                if (!validate_pathname($file_name)) {
1008                        die_error(400, "Invalid file parameter");
1009                }
1010        }
1011
1012        our $file_parent = $input_params{'file_parent'};
1013        if (defined $file_parent) {
1014                if (!validate_pathname($file_parent)) {
1015                        die_error(400, "Invalid file parent parameter");
1016                }
1017        }
1018
1019        # parameters which are refnames
1020        our $hash = $input_params{'hash'};
1021        if (defined $hash) {
1022                if (!validate_refname($hash)) {
1023                        die_error(400, "Invalid hash parameter");
1024                }
1025        }
1026
1027        our $hash_parent = $input_params{'hash_parent'};
1028        if (defined $hash_parent) {
1029                if (!validate_refname($hash_parent)) {
1030                        die_error(400, "Invalid hash parent parameter");
1031                }
1032        }
1033
1034        our $hash_base = $input_params{'hash_base'};
1035        if (defined $hash_base) {
1036                if (!validate_refname($hash_base)) {
1037                        die_error(400, "Invalid hash base parameter");
1038                }
1039        }
1040
1041        our @extra_options = @{$input_params{'extra_options'}};
1042        # @extra_options is always defined, since it can only be (currently) set from
1043        # CGI, and $cgi->param() returns the empty array in array context if the param
1044        # is not set
1045        foreach my $opt (@extra_options) {
1046                if (not exists $allowed_options{$opt}) {
1047                        die_error(400, "Invalid option parameter");
1048                }
1049                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1050                        die_error(400, "Invalid option parameter for this action");
1051                }
1052        }
1053
1054        our $hash_parent_base = $input_params{'hash_parent_base'};
1055        if (defined $hash_parent_base) {
1056                if (!validate_refname($hash_parent_base)) {
1057                        die_error(400, "Invalid hash parent base parameter");
1058                }
1059        }
1060
1061        # other parameters
1062        our $page = $input_params{'page'};
1063        if (defined $page) {
1064                if ($page =~ m/[^0-9]/) {
1065                        die_error(400, "Invalid page parameter");
1066                }
1067        }
1068
1069        our $searchtype = $input_params{'searchtype'};
1070        if (defined $searchtype) {
1071                if ($searchtype =~ m/[^a-z]/) {
1072                        die_error(400, "Invalid searchtype parameter");
1073                }
1074        }
1075
1076        our $search_use_regexp = $input_params{'search_use_regexp'};
1077
1078        our $searchtext = $input_params{'searchtext'};
1079        our $search_regexp;
1080        if (defined $searchtext) {
1081                if (length($searchtext) < 2) {
1082                        die_error(403, "At least two characters are required for search parameter");
1083                }
1084                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
1085        }
1086}
1087
# path to the current git repository
our $git_dir;

# Point $git_dir at "$projectroot/$project" when a project is selected;
# without a project $git_dir is left untouched.
sub evaluate_git_dir {
        our $git_dir;

        if ($project) {
                $git_dir = "$projectroot/$project";
        }
}
1093
our (@snapshot_fmts, $git_avatar);

# Cache the per-request settings of the 'snapshot' and 'avatar' features
# in @snapshot_fmts and $git_avatar.
sub configure_gitweb_features {
        our (@snapshot_fmts, $git_avatar);

        # list of supported snapshot formats
        @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # are satisfied; in every other case $git_avatar is reset to the
        # empty string.
        ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'picon') {
                # no dependencies
        } elsif ($git_avatar eq 'gravatar') {
                # gravatar needs Digest::MD5 to be loadable
                eval { require Digest::MD5; 1; }
                        or $git_avatar = '';
        } else {
                # unknown provider name
                $git_avatar = '';
        }
}
1113
# custom error handler: 'die <message>' is Internal Server Error
#
# Installed through CGI::Carp's set_message(); it receives the error
# message, which is already HTML escaped, and hands it to die_error().
sub handle_errors_html {
        my ($escaped_msg) = @_;

        # Switch back to the default handler first (this disables
        # handle_errors_html), so that an error occurring inside die_error
        # cannot lead to an infinite loop.
        set_message("Error occured when inside die_error:\n$escaped_msg");

        # You cannot jump out of die_error when it is called as error handler.
        # The subroutine set via CGI::Carp::set_message is called _after_
        # HTTP headers are already written, so die_error must not write them.
        my @handler_opts = (-error_handler => 1, -no_http_header => 1);
        die_error(undef, undef, $escaped_msg, @handler_opts);
}
set_message(\&handle_errors_html);
1128
# dispatch
#
# Run the subroutine registered in %actions for $action.  When no action
# was requested, one is chosen first: the type reported by git_get_type()
# for the requested object, else 'summary' if a project is selected, else
# 'project_list'.  Ends the request with an error if the object cannot be
# typed, the action is unknown, or the action needs a project and none is
# set.
sub dispatch {
        if (!defined $action) {
                if (defined $hash) {
                        $action = git_get_type($hash);
                        # no type means there is nothing to show: report that,
                        # instead of falling through to "Unknown action" with
                        # an undefined hash key
                        $action or die_error(404, "Object does not exist");
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name");
                        $action or die_error(404, "File or directory does not exist");
                } elsif (defined $project) {
                        $action = 'summary';
                } else {
                        $action = 'project_list';
                }
        }
        if (!defined($actions{$action})) {
                die_error(400, "Unknown action");
        }
        # every action except these three operates on a project
        if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
            !$project) {
                die_error(400, "Project needed");
        }
        $actions{$action}->();
}
1151
# Start the per-request bookkeeping afresh: restart the $t0 timestamp
# (only if it is defined) and zero the count of git commands run.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        $t0 = [ gettimeofday() ]
                if defined $t0;
        $number_of_git_cmds = 0;
}
1157
our $first_request = 1;

# Handle a single request: set up per-request state, read the
# configuration where needed, collect and validate the parameters, and
# finally dispatch to the requested action.
sub run_request {
        reset_timer();

        evaluate_uri();

        # configuration and git version are always evaluated for the first
        # request
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }

        # $per_request_config is either a code reference, which is called for
        # every request, or a plain true value, which makes the configuration
        # be evaluated again for every request after the first one
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }

        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1188
# Hooks and settings of the request loop in run().  By default gitweb acts
# as a plain CGI script: requests are created with the CGI class and every
# request is the last one.
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: requests are created with CGI::Fast, and
# $is_last_request ends the request loop once the process has handled its
# quota of requests.
sub configure_as_fcgi {
        require CGI::Fast;
        our $CGI = 'CGI::Fast';

        my $request_number = 0;
        # let each child service 100 requests; the check is made after a
        # request has been handled, so the counter reaches 100 right after
        # the hundredth request ('>' here would let a 101st one through)
        our $is_last_request = sub { ++$request_number >= 100 };
}
# Work out from the script name and the command line how gitweb is run.
# A script name ending in ".fcgi" selects FastCGI mode.  When there are
# command line arguments, these options are recognized:
#   --fastcgi, --fcgi, -f   select FastCGI mode
#   --nproc=N, -n N         manage N processes through FCGI::ProcManager
#                           (silently ignored if that module cannot be loaded)
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # hook the process manager into the request loop
        my $use_proc_manager = sub {
                my (undef, $nproc) = @_;
                eval { require FCGI::ProcManager; 1; }
                        or return;
                my $manager = FCGI::ProcManager->new({
                        n_processes => $nproc,
                });
                our ($pre_listen_hook, $pre_dispatch_hook, $post_dispatch_hook);
                $pre_listen_hook    = sub { $manager->pm_manage()        };
                $pre_dispatch_hook  = sub { $manager->pm_pre_dispatch()  };
                $post_dispatch_hook = sub { $manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1223
# Main loop: evaluate the command line, then create request objects of
# class $CGI and serve them one by one until no more are available or
# $is_last_request says the one just served was the last.  The optional
# hooks are called before listening starts and around each request.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                if ($is_last_request->()) {
                        last REQUEST;
                }
        }

 DONE_GITWEB:
        1;
}
1248
run();

# When there is a caller, gitweb is wrapped in a subroutine processing
# requests (e.g. mod_perl with ModPerl::Registry, or PSGI with
# Plack::App::WrapCGI), so simply return to it.  Otherwise this is a pure
# CGI script, serving a single request, and we exit.
return if defined caller;
exit;
1259
1260## ======================================================================
1261## action links
1262
# Build a gitweb URL from named parameters (the long names listed in
# @cgi_param_mapping).  'project' defaults to the current $project.
# Depending on the 'pathinfo' feature (or the -path_info option) as many
# parameters as possible are put into the path part of the URL; the
# remaining ones are appended as a query string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over every input parameter that was not given explicitly
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot;
                # the action is optional, so only compare it when it is set
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing '..' cannot go into
                                                # the path, where '..' is the separator;
                                                # it stays a query parameter
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly
        # (walking the ordered list, so that the query string has a fixed
        # parameter order)
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1392
1393
1394## ======================================================================
1395## validation, quoting/unquoting and escaping
1396
# Return the action name if it is a key of %actions, undef otherwise
# (also for an empty or otherwise false argument).
sub validate_action {
        my ($name) = @_;
        return undef unless $name;
        return exists $actions{$name} ? $name : undef;
}
1402
# Return the project name if it denotes a project that may be shown:
# a valid pathname, an existing directory below $projectroot, passing
# check_export_ok(), and, under $strict_export, present in the projects
# list.  Returns undef otherwise.
sub validate_project {
        my ($name) = @_;
        return undef unless $name;

        return undef unless validate_pathname($name);

        my $dir = "$projectroot/$name";
        return undef unless -d $dir;
        return undef unless check_export_ok($dir);
        return undef if $strict_export && !project_in_list($name);

        return $name;
}
1414
# Return the pathname if it is acceptable, undef otherwise.
# Rejected are: false values (undef, "", "0"); an empty, '.' or '..'
# path element anywhere (which covers a leading or trailing slash and
# doubled slashes); and names containing a null character.
sub validate_pathname {
        my ($path) = @_;
        return undef unless $path;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # also this catches doubled slashes
        return undef if $path =~ m!(^|/)(|\.|\.\.)(/|$)!;

        # no null characters
        return undef if $path =~ m!\0!;

        return $path;
}
1430
# Return the ref name if it is acceptable, undef otherwise.
# Accepted are a full textual hash (exactly 40 hexadecimal digits) and
# names that are valid pathnames and also pass the ref name restrictions
# below.
sub validate_refname {
        my $input = shift || return undef;

        # textual hashes are O.K.
        # (\z rather than $: '$' would also match before a trailing newline,
        # letting "hash\n" through without any of the checks below)
        if ($input =~ m/\A[0-9a-fA-F]{40}\z/) {
                return $input;
        }
        # it must be correct pathname
        $input = validate_pathname($input)
                or return undef;
        # restrictions on ref name according to git-check-ref-format
        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
                return undef;
        }
        return $input;
}
1447
# Turn a sequence of octets into Perl's internal string form (utf-8 with
# the utf8 flag set if needed); gitweb writes out in utf-8 thanks to
# "binmode STDOUT, ':utf8'" at beginning.  Input that is not valid utf-8
# is decoded using $fallback_encoding instead.  undef is passed through.
sub to_utf8 {
        my ($octets) = @_;
        return undef unless defined $octets;

        # either it is flagged as utf8 already, or it is valid utf-8 and
        # utf8::decode() has just converted our copy in place
        return $octets
                if utf8::is_utf8($octets) || utf8::decode($octets);

        return decode($fallback_encoding, $octets, Encode::FB_DEFAULT);
}
1461
# Quote a value for use as a CGI parameter: runs of characters outside
# the safe set go through CGI::escape(), spaces become '+'.
# The slash is kept unquoted even though that is not strictly correct,
# because quoted slashes look too horrible in bookmarks.
# undef is passed through.
sub esc_param {
        my ($text) = @_;
        defined $text
                or return undef;

        # the space is part of the safe set here and is translated below
        $text =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $text =~ tr/ /+/;
        return $text;
}
1471
# Quote a value for use in the path_info part of a URL.  The rules differ
# slightly from esc_param(): path_info doesn't treat '+' as space
# (specially), so space and '+' are both left as they are, but '?' must
# be escaped.  undef is passed through.
sub esc_path_info {
        my ($text) = @_;
        defined $text
                or return undef;

        $text =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

        return $text;
}
1482
# Escape unsafe characters in a complete URL.  Because the whole URL is
# processed, characters that carry URL structure (such as '/', '?', ':',
# '&', '=' and ';') cannot be quoted; spaces become '+'.
# Returns undef for undefined input.
sub esc_url {
        my ($url) = @_;
        return undef unless defined $url;

        $url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $url =~ tr/ /+/;
        return $url;
}
1491
# Escape a string for use as an HTML attribute value.  For XHTML
# conformance turning '"' into '&quot;' is not enough, so the work is
# handed to esc_html() with the arguments passed through unchanged.
sub esc_attr {
        my @args = @_;
        return esc_html(@args);
}
1498
# Escape a string for inclusion in HTML.  The text is converted with
# to_utf8(), HTML-escaped, and every control character except TAB is
# replaced by its quot_cec() representation.
# Options: -nbsp => true turns each space into '&nbsp;'.
# Returns undef for undefined input.
sub esc_html {
        my ($text, %opts) = @_;
        return undef unless defined $text;

        $text = to_utf8($text);
        $text = $cgi->escapeHTML($text);
        $text =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        # TAB is the one control character that is passed through untouched
        $text =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
        return $text;
}
1514
# Escape a filename for inclusion in HTML.  Works like esc_html(), except
# that all control characters, TAB included, are replaced by their
# quot_cec() representation.
# Options: -nbsp => true turns each space into '&nbsp;'.
# Returns undef for undefined input.
sub esc_path {
        my ($path, %opts) = @_;
        return undef unless defined $path;

        $path = to_utf8($path);
        $path = $cgi->escapeHTML($path);
        $path =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $path =~ s|([[:cntrl:]])|quot_cec($1)|eg;
        return $path;
}
1530
# Sanitize a string for use in XHTML served as application/xhtml+xml
# (valid XML 1.0): control characters other than TAB, LF and CR are
# replaced by their quot_cec() representation.  No HTML escaping is done.
# Returns undef for undefined input.
sub sanitize {
        my ($text) = @_;
        return undef unless defined $text;

        $text = to_utf8($text);
        $text =~ s|([[:cntrl:]])|($1 =~ /[\t\n\r]/ ? $1 : quot_cec($1))|eg;
        return $text;
}
1541
# Make a control character "printable" using character escape codes (CEC).
# Characters with a well-known C-style escape get that escape; any other
# character is shown as a backslash followed by its code in hex (width 2,
# space padded).
# Options: -nohtml => true returns the bare escape text; otherwise it is
# wrapped in <span class="cntrl">.
sub quot_cec {
        my ($cntrl, %opts) = @_;
        my %escape_for = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );

        my $printable;
        if (exists $escape_for{$cntrl}) {
                $printable = $escape_for{$cntrl};
        } else {
                $printable = sprintf('\%2x', ord($cntrl));
        }

        return $printable if $opts{-nohtml};
        return "<span class=\"cntrl\">$printable</span>";
}
1566
# Alternative to quot_cec(): represent a control character by its Unicode
# "Control Pictures" codepoint, i.e. its Unicode "printable representation"
# (PR), emitted as a decimal numeric character reference.
#
# Characters 0x00..0x20 map to U+2400..U+2420.  DEL (0x7F) is not at that
# offset: its picture is U+2421, so it is handled explicitly.
# NOTE(review): other codepoints have no control picture; they still go
# through the plain offset computation, as they always did.
#
# Options: -nohtml => true returns the bare character reference; otherwise
# it is wrapped in <span class="cntrl">.
sub quot_upr {
        my $cntrl = shift;
        my %opts = @_;

        my $code = ord($cntrl);
        # SYMBOL FOR DELETE lives at U+2421, not at U+2400 + 0x7F
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1580
# git may return quoted and escaped filenames

# Decode the body of a single backslash escape, i.e. the text that follows
# the backslash: one to three octal digits, a C escape letter, or an
# ordinary character that was merely quoted.
sub unq {
        my ($seq) = @_;
        my %char_for = ( # character escape codes, aka escape sequences
                't' => "\t",   # tab            (HT, TAB)
                'n' => "\n",   # newline        (NL)
                'r' => "\r",   # return         (CR)
                'f' => "\f",   # form feed      (FF)
                'b' => "\b",   # backspace      (BS)
                'a' => "\a",   # alarm (bell)   (BEL)
                'e' => "\e",   # escape         (ESC)
                'v' => "\013", # vertical tab   (VT)
        );

        # octal char sequence
        return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

        # C escape sequence if known, otherwise a quoted ordinary character
        return exists $char_for{$seq} ? $char_for{$seq} : $seq;
}

# Undo git's filename quoting: when the string is wrapped in double quotes,
# strip them and expand the backslash escapes inside.  Anything else is
# returned unchanged.
sub unquote {
        my ($name) = @_;

        if ($name =~ m/^"(.*)"$/) {
                # needs unquoting
                $name = $1;
                $name =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        }
        return $name;
}
1616
# Expand tabs: replace each tab with the number of spaces needed to reach
# the next multiple-of-8 column.
sub untabify {
        my ($text) = @_;

        for (my $tab = index($text, "\t");
             $tab != -1;
             $tab = index($text, "\t")) {
                # distance to the next tab stop is always between 1 and 8
                my $pad = 8 - ($tab % 8);
                substr($text, $tab, 1, ' ' x $pad);
        }

        return $text;
}
1630
# Tell whether $project is among the projects returned by
# git_get_projects_list(): returns the number of entries whose 'path'
# equals $project, or 0 when the list is empty.
sub project_in_list {
        my ($project) = @_;
        my @projects = git_get_projects_list();

        return 0 unless @projects;

        my $matches = grep { $_->{'path'} eq $project } @projects;
        return $matches;
}
1636
1637## ----------------------------------------------------------------------
1638## HTML aware string manipulation
1639
# Shorten a string to about $len characters, preferring to cut on a word
# boundary between positions $len and $len+$add_len; when there is no word
# boundary in that range the cut is made at $len+$add_len.  The string is
# returned unchanged if the chopped text plus the ellipsis marking the cut
# would not be shorter than the original.
#
# Arguments: $str, $len, $add_len (default 10) and $where, one of
# 'left' | 'center' | 'right' (default 'right'), saying which part is cut.
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right';

        # Make sure perl treats the string as characters, so that we never
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # Return early if chopping would not make the string shorter.  The
        # filler is " ... " (length 5) for 'center', length 4 otherwise.
        my $in_center  = ($where eq 'center');
        my $filler_len = $in_center ? 5 : 4;
        return $str if ($len + $filler_len >= length($str));

        # when chopping in the middle, $len is split between both sides
        $len = int($len/2) if $in_center;

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                $str =~ m/^(.*?)($begre)$/;
                my ($lead, $body) = ($1, $2);
                # only replace the lead if the marker is actually shorter
                $lead = " ..." if length($lead) > 4;
                return "$lead$body";
        }

        if ($in_center) {
                $str =~ m/^($endre)(.*)$/;
                my ($left, $rest) = ($1, $2);
                $rest =~ m/^(.*?)($begre)$/;
                my ($mid, $right) = ($1, $2);
                $mid = " ... " if length($mid) > 5;
                return "$left$mid$right";
        }

        # default: chop on the right
        $str =~ m/^($endre)(.*)$/;
        my ($body, $tail) = ($1, $2);
        $tail = "... " if length($tail) > 4;
        return "$body$tail";
}
1699
# Same arguments as chop_str().  The result is HTML-escaped, and when the
# string really was shortened it is wrapped in a <span> whose title
# attribute carries the full text (control characters replaced by '?').
sub chop_and_escape_str {
        my ($full) = @_;

        my $short = chop_str(@_);
        $full = to_utf8($full);

        # nothing was cut off: no tooltip needed
        return esc_html($short) if $short eq $full;

        $full =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$full}, esc_html($short));
}
1715
1716## ----------------------------------------------------------------------
1717## functions returning short strings
1718
# CSS class for a given age (in seconds): "noage" when the age is
# undefined, "age0" below two hours, "age1" below two days, "age2" beyond.
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1733
# Convert an age in seconds to a short "nn units ago" string.
#
# The largest unit of which the age spans more than two is used (years,
# months, weeks, days, hours, min, sec); the count is truncated to an
# integer.  Ages of two seconds or less give "right now".
sub age_string {
        my $age = shift;
        my $age_str;

        if ($age > 60*60*24*365*2) {
                $age_str = int($age/60/60/24/365) . " years ago";
        } elsif ($age > 60*60*24*(365/12)*2) {
                # a month is taken to be a twelfth of a 365-day year
                $age_str = int($age/60/60/24/(365/12)) . " months ago";
        } elsif ($age > 60*60*24*7*2) {
                $age_str = int($age/60/60/24/7) . " weeks ago";
        } elsif ($age > 60*60*24*2) {
                $age_str = int($age/60/60/24) . " days ago";
        } elsif ($age > 60*60*2) {
                $age_str = int($age/60/60) . " hours ago";
        } elsif ($age > 60*2) {
                $age_str = int($age/60) . " min ago";
        } elsif ($age > 2) {
                $age_str = int($age) . " sec ago";
        } else {
                # plain assignment: appending to the still-empty variable
                # used to produce a stray leading space (" right now")
                $age_str = "right now";
        }
        return $age_str;
}
1765
# File type bits used in addition to the ones imported from Fcntl.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1770
# True when the file type bits of $mode equal S_IFGITLINK, i.e. the entry
# is a submodule/subproject (a commit object reference).
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = ($mode & S_IFMT);
        return ($type_bits == S_IFGITLINK);
}
1777
# Convert a file mode given as an octal string into an "ls -l" style
# symbolic mode string.  Only a few fixed strings are produced: one each
# for submodule, directory and symlink, two for regular files (with or
# without the user executable bit), and all dashes for anything else.
sub mode_str {
        my $mode = oct shift;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($mode);

        if (S_ISREG($mode)) {
                # git cares only about the executable bit
                return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
        }

        return '----------';
}
1799
# Convert a file mode given as an octal string into a file type name:
# "submodule", "directory", "symlink", "file" or "unknown".  An argument
# that does not consist solely of octal digits is returned unchanged.
sub file_type {
        my ($mode) = @_;

        # not an octal number: hand it back as is
        return $mode unless $mode =~ m/^[0-7]+$/;

        my $bits = oct $mode;

        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "file"      if S_ISREG($bits);
        return "unknown";
}
1822
# Convert a file mode given as an octal string into a file type
# description.  Like file_type(), but a regular file with the user
# executable bit set is reported as "executable".  An argument that does
# not consist solely of octal digits is returned unchanged.
sub file_type_long {
        my ($mode) = @_;

        # not an octal number: hand it back as is
        return $mode unless $mode =~ m/^[0-7]+$/;

        my $bits = oct $mode;

        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);

        if (S_ISREG($bits)) {
                return ($bits & S_IXUSR) ? "executable" : "file";
        }

        return "unknown";
}
1849
1850
1851## ----------------------------------------------------------------------
1852## functions returning short HTML fragments, or transforming HTML fragments
1853## which don't belong to other sections
1854
# Format one line of a commit message: HTML-escape it (spaces become
# &nbsp;) and turn every standalone run of 8 to 40 hex digits into a link
# to the "object" action for that id.
sub format_log_line_html {
        my ($line) = @_;

        # build the hyperlink for one (possibly abbreviated) object name
        my $object_link = sub {
                my ($sha) = @_;
                return $cgi->a({-href => href(action=>"object", hash=>$sha),
                                -class => "text"}, $sha);
        };

        $line = esc_html($line, -nbsp=>1);
        $line =~ s{\b([0-9a-fA-F]{8,40})\b}{$object_link->($1)}eg;

        return $line;
}
1867
# Format the markers for the refs pointing to a given object.
#
# $refs is a hash reference mapping object ids to array references of ref
# names (e.g. "tags/v2.6.11", "heads/next", with a "^{}" suffix on
# dereferenced tags); $id is the object to produce markers for.  Returns an
# HTML fragment (<span class="refs"> holding one <span> per ref), or the
# empty string when no ref points to $id.
#
# The destination action of each link is chosen based on the object type
# and the current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog
#   or log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $ref (@{$refs->{$id}}) {
                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name) = qw();
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        # Only attribute values are escaped by the CGI tag
                        # helpers; the element content is emitted verbatim.
                        # Ref names may contain '<', '>', '&' or '"', so the
                        # visible name must be escaped explicitly.
                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, esc_html($name));

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1927
# Format a title line as a link to $href.  When $short is shorter than
# $long, the short text is shown and the long one (control characters
# replaced by '?') goes into the title attribute; otherwise the long text
# is shown.  $extra, if defined, is appended after the link as is.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my %attr = (-href => $href, -class => "list subject");
        my $shown = $long;

        if (length($short) < length($long)) {
                # shortened: show the short form, keep the full one as tooltip
                $long =~ s/[[:cntrl:]]/?/g;
                $attr{-title} = to_utf8($long);
                $shown = $short;
        }

        return $cgi->a(\%attr, esc_html($shown)) . $extra;
}
1943
1944# Rather than recomputing the url for an email multiple times, we cache it
1945# after the first hit. This gives a visible benefit in views where the avatar
1946# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines (currently gravatar and picon), which
1948# are free to use it as preferred. Since only one avatar engine is used for any
1949# given page, there's no risk for cache conflicts.
1950our %avatar_cache = ();
1951
# Compute the picon url for a given email, using the picon search service
# at http://www.cs.indiana.edu/picons/search.html
# The email is lowercased and the complete url is kept in %avatar_cache.
sub picon_url {
        my $email = lc $_[0];

        # served from the cache after the first request
        return $avatar_cache{$email} if $avatar_cache{$email};

        my ($user, $domain) = split('@', $email);
        $avatar_cache{$email} =
                "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                "$domain/$user/" .
                "users+domains+unknown/up/single";

        return $avatar_cache{$email};
}
1965
# Compute the gravatar url for a given email and size.  Only the part of
# the url before the size is cached in %avatar_cache, since that is the
# computationally more expensive part; this also lets the cached entry be
# reused for different sizes (for this particular engine).
sub gravatar_url {
        my ($email, $size) = @_;
        $email = lc $email;

        unless ($avatar_cache{$email}) {
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" .
                        Digest::MD5::md5_hex($email) . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1978
# Return the <img> markup for the avatar of $email, or the empty string
# when no avatar provider applies.
# Options:
#   -size       key into %avatar_size (falls back to 'default')
#   -pad_before put '&nbsp;' in front of the image
#   -pad_after  put '&nbsp;' after the image
sub git_get_avatar {
        my ($email, %opts) = @_;

        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

        # Other providers can be added by extending this chain, defining
        # $url as needed.  If no variant puts something in $url, we assume
        # avatars are completely disabled/unavailable.
        my $url = "";
        if ($git_avatar eq 'gravatar') {
                $url = gravatar_url($email, $size);
        } elsif ($git_avatar eq 'picon') {
                $url = picon_url($email);
        }
        return "" unless $url;

        my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
        my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

        my $img = "<img width=\"$size\" " .
                       "class=\"avatar\" " .
                       "src=\"".esc_url($url)."\" " .
                       "alt=\"\" " .
                  "/>";
        return $pre_white . $img . $post_white;
}
2007
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype ('author' or 'committer') selects the kind of search and the
# wording of the link title.  When the 'search' feature is disabled,
# $displaytext is returned as is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        return $displaytext unless gitweb_check_feature('search');

        my $performed = $searchtype eq 'author'    ? "authored"
                      : $searchtype eq 'committer' ? "committed"
                      :                              "";

        my $search_href = href(action=>"search", hash=>$hash,
                               searchtext=>$author,
                               searchtype=>$searchtype);

        return $cgi->a({-href => $search_href, class=>"list",
                        title=>"Search for commits $performed by $author"},
                       $displaytext);
}
2030
# Format the author of commit $co inside an element named $tag (with class
# "author").  The author name is chopped and escaped according to the
# remaining optional arguments (see chop_str), prefixed with the avatar,
# and made into an author-search link.
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $author = chop_and_escape_str($co->{'author_name'}, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $link   = format_search_author($co->{'author_name'}, "author",
                                          $avatar . $author);

        return "<$tag class=\"author\">" . $link . "</$tag>";
}
2044
# Format the git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names in $line are dropped and replaced by the escaped names
# from $from / $to, hyperlinked whenever the respective 'href' is set.
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff: a single path, taken from $to
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                  esc_path($to->{'file'}))
                        : esc_path($to->{'file'}); # file was deleted (no href)
        } else {
                # "ordinary" diff: "a/<from> b/<to>"
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $from->{'href'}
                        ? $cgi->a({-href => $from->{'href'}, -class => "path"},
                                  'a/' . esc_path($from->{'file'}))
                        : 'a/' . esc_path($from->{'file'}); # file was added (no href)
                $line .= ' ';
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                  'b/' . esc_path($to->{'file'}))
                        : 'b/' . esc_path($to->{'file'}); # file was deleted
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2080
# Format one extended diff header line (the lines between the "diff ..."
# line and the patch itself).
#
# - "copy|rename from|to <path>": the path is replaced by a link to the
#   file when the respective 'href' is set
# - a line ending in a six-digit mode gets the file type appended
# - "index <hash>,<hash>..<hash>" (combined diff) and
#   "index <hash>..<hash>" (ordinary diff): hashes are abbreviated to seven
#   characters and hyperlinked; a side without href is shown as 0000000
#
# Returns the formatted line followed by "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                       esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                $line = 'index ';
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff; the dots are escaped so
                # that only the literal ".." separator is accepted
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2146
# Format the from-file/to-file diff header ("--- ..." / "+++ ..." lines).
#
# For an ordinary diff one from-file line is produced; for a combined diff
# (merge commit) there is one from-file line per parent, each with a
# numbered link to the blobdiff against that parent.  A single to-file
# line follows in both cases.  File names are escaped and hyperlinked when
# an href is available; "/dev/null" lines get no extra formatting.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my $result = '';
        my $line;

        #assert($from_line =~ m/^---/) if DEBUG;
        if ($diffinfo->{'nparents'}) {
                # combined diff (merge commit)
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        if ($from->{'href'}[$i]) {
                                my $blobdiff_href =
                                        href(action=>"blobdiff",
                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                             hash_parent_base=>$parents[$i],
                                             file_parent=>$from->{'file'}[$i],
                                             hash=>$diffinfo->{'to_id'},
                                             hash_base=>$hash,
                                             file_name=>$to->{'file'});
                                $line = '--- ' .
                                        $cgi->a({-href=>$blobdiff_href,
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1) .
                                        '/' .
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                        } else {
                                $line = '--- /dev/null';
                        }
                        $result .= qq!<div class="diff from_file">$line</div>\n!;
                }
        } else {
                # ordinary (single parent) diff
                $line = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($line =~ m!^--- "?a/!) {
                        $line = '--- a/' .
                                ($from->{'href'}
                                 ? $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                           esc_path($from->{'file'}))
                                 : esc_path($from->{'file'}));
                }
                $result .= qq!<div class="diff from_file">$line</div>\n!;
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        $line = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($line =~ m!^\+\+\+ "?b/!) {
                $line = '+++ b/' .
                        ($to->{'href'}
                         ? $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                   esc_path($to->{'file'}))
                         : esc_path($to->{'file'}));
        }
        $result .= qq!<div class="diff to_file">$line</div>\n!;

        return $result;
}
2212
# Create the note shown for a patch that combined diff simplified away:
# a "diff --cc <file>" header (the file name is linked to its blob unless
# the file was deleted) followed by a "Simple merge" notice.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $file;
        if (is_deleted($diffinfo)) {
                $file = esc_path($diffinfo->{'to_file'});
        } else {
                $file = $cgi->a({-href => href(action=>"blob",
                                               hash_base=>$hash,
                                               hash=>$diffinfo->{'to_id'},
                                               file_name=>$diffinfo->{'to_file'}),
                                 -class => "path"},
                                esc_path($diffinfo->{'to_file'}));
        }

        return "<div class=\"diff header\">" .
               "diff --cc " .
               $file .
               "</div>\n" . # class="diff header"
               "<div class=\"diff nodifferences\">" .
               "Simple merge" .
               "</div>\n"; # class="diff nodifferences"
}
2237
# Classify one line of diff output and return its CSS class:
# "chunk_header", "incomplete", "ctx", "add" or "rem"; the empty string
# when nothing matches.
#
# For an ordinary diff each line has one sign column.  For a combined diff
# ($from->{'href'} is an array reference) there is one sign column per
# entry of that array.
sub diff_line_class {
        my ($line, $from, $to) = @_;

        my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
                ? scalar @{$from->{'href'}}   # combined diff
                : 1;                          # ordinary diff

        # Order matters: the context rule must come before add/rem, or we
        # would have to use a more complicated regexp, for example
        # qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
        my @rules = (
                [ qr/^\@\@{$num_sign} /,  "chunk_header" ],
                [ qr/^\\/,                "incomplete"   ],
                [ qr/^ {$num_sign}/,      "ctx"          ],
                [ qr/^[+ ]{$num_sign}/,   "add"          ],
                [ qr/^[- ]{$num_sign}/,   "rem"          ],
        );

        foreach my $rule (@rules) {
                my ($regexp, $class) = @$rule;
                return $class if $line =~ $regexp;
        }

        # fallback
        return "";
}
2266
# Format a chunk header line of a unified diff ("@@ -a,b +c,d @@ section").
# Assumes that $from and $to are defined and correctly filled, and that
# $line really is such a chunk header.  Each range is linked to the
# matching line anchor ("#l<start>") of the respective file when an href
# is available; the trailing section text is HTML-escaped.
sub format_unidiff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($from_text, $from_start, $from_lines,
            $to_text,   $to_start,   $to_lines,
            $section) =
                $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

        # a missing line count is treated as 0
        $from_lines = 0 unless defined $from_lines;
        $to_lines   = 0 unless defined $to_lines;

        $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
                              -class=>"list"}, $from_text)
                if $from->{'href'};
        $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                              -class=>"list"}, $to_text)
                if $to->{'href'};

        return "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2290
# Render the chunk header line of a combined diff as HTML.
# Assumes that $from and $to are defined and correctly filled, and that
# $line holds a chunk header line for combined diff, i.e. a run of "@",
# the whitespace separated ranges (the last one being the 'to' range),
# another run of "@" and the optional section text.
# $from->{'href'} is indexed per 'from' range; ranges whose href is set
# become links to "<href>#l<start>".
sub format_cc_diff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

        # every range looks like "<sign><start>[,<count>]";
        # only the start is needed, and it defaults to 0
        my @range_text  = split(' ', $ranges);
        my @range_start = map { (split(',', substr($_, 1)), 0)[0] } @range_text;

        # the last range describes the result ('to') side
        my $to_text  = pop @range_text;
        my $to_start = pop @range_start;

        my @cells;
        foreach my $i (0 .. $#range_text) {
                my $cell = $range_text[$i];
                if ($from->{'href'}[$i]) {
                        $cell = $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
                                         -class=>"list"}, $range_text[$i]);
                }
                push @cells, $cell;
        }
        my $to_cell = $to_text;
        if ($to->{'href'}) {
                $to_cell = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                    -class=>"list"}, $to_text);
        }
        push @cells, $to_cell;

        my $section_html = esc_html($section, -nbsp=>1);
        return "<span class=\"chunk_info\">$prefix " . join(' ', @cells) . " $prefix</span>" .
               "<span class=\"section\">" . $section_html . "</span>";
}
2329
# Process one patch (diff) line; not to be used for diff headers.
# Returns a two element list: the CSS class of the line, and the line
# formatted as HTML (but not wrapped in any element).
# Chunk headers are given special formatting only when both $from and
# $to are supplied.
sub process_diff_line {
        my ($line, $from, $to) = @_;

        # classify the raw line, before it gets rewritten below
        my $diff_class = diff_line_class($line, $from, $to);

        chomp $line;
        $line = untabify($line);

        if ($from && $to) {
                if ($line =~ m/^\@{2} /) {
                        $line = format_unidiff_chunk_header($line, $from, $to);
                        return $diff_class, $line;
                }
                if ($line =~ m/^\@{3}/) {
                        $line = format_cc_diff_chunk_header($line, $from, $to);
                        return $diff_class, $line;
                }
        }

        # everything else is escaped verbatim
        return $diff_class, esc_html($line, -nbsp=>1);
}
2352
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# Which form is produced depends on how many formats @snapshot_fmts holds.
sub format_snapshot_links {
        my ($hash) = @_;
        my $num_fmts = @snapshot_fmts;

        # no snapshot formats: nothing to link to
        return undef if $num_fmts == 0;

        if ($num_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                # i.e. "_snapshot_"
                my ($fmt) = @snapshot_fmts;
                my $tooltip = "in format: $known_snapshot_formats{$fmt}{'display'}";
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => $tooltip
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links = map {
                $cgi->a({
                        -href => href(
                                action=>"snapshot",
                                hash=>$hash,
                                snapshot_format=>$_
                        )
                }, $known_snapshot_formats{$_}{'display'})
        } @snapshot_fmts;
        return "snapshot (" . join(' ', @links) . ")";
}
2387
2388## ......................................................................
2389## functions returning values to be passed, perhaps after some
2390## transformation, to other functions; e.g. returning arguments to href()
2391
# Returns hash to be passed to href() to generate gitweb feed URL;
# the -title key holds a description of the link.
# The optional argument is the feed format name (default 'Atom'); its
# lowercased form becomes the 'action'.
# Returns nothing when no project is selected, or for the views that
# have no specific feed (tags, heads, forks, tag, search).
sub get_feed_info {
        my $format = shift || 'Atom';

        # feed links are possible only for project views
        return unless defined $project;
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if $action =~ /^(?:tags|heads|forks|tag|search)$/x;

        # branch refs use the 'refs/heads/' prefix (fullname) to differ
        # from tag links; $hash_base is consulted before $hash
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                next unless defined $ref && $ref =~ m!^refs/heads/(.*)$!;
                $branch = $1;
                last;
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type = "history of $file_name"
                      . ($action eq 'tree' ? "/" : "")
                      . (defined $branch ? " on '$branch'" : "");
        } elsif (defined $branch) {
                $type = "log of $branch";
        } else {
                $type = 'log';
        }

        my %res = (
                action      => lc($format),
                -title      => $type,
                'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
                'file_name' => $file_name,
        );
        return %res;
}
2427
2428## ----------------------------------------------------------------------
2429## git utility subroutines, invoking git commands
2430
# Returns, as a list, the path to the core git executable followed by the
# --git-dir parameter built from the current $git_dir.
# Every call also bumps the $number_of_git_cmds counter.
sub git_cmd {
        ++$number_of_git_cmds;
        return ($GIT, "--git-dir=$git_dir");
}
2436
# Quote the given arguments for passing them to the shell:
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Each argument is wrapped in single quotes; embedded ' and ! characters
# are closed out, backslash-escaped and reopened.
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $word (@_) {
                # work on a copy, the caller's arguments stay untouched
                (my $escaped = $word) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }
        return join(' ', @quoted);
}
2445
# Get the full hash that HEAD of the given project resolves to;
# the project name is the only argument.
sub git_get_head_hash {
        my $project = shift;
        return git_get_full_hash($project, 'HEAD');
}
2450
# Resolve a revision to its hash; all arguments are handed over
# unchanged to git_get_hash().
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2454
# Resolve a revision to an abbreviated hash: same as git_get_hash(),
# with the '--short=7' option appended to the given arguments.
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2458
# Run 'git rev-parse --verify -q [options] <hash>' in the repository of
# $project (located under $projectroot) and return the first line of its
# output without the trailing newline, or undef when the command could
# not be started or printed nothing.
#
# The global $git_dir is pointed at the project for the duration of the
# call; the previous value is put back afterwards, but only if it was
# defined.
sub git_get_hash {
        my ($project, $hash, @options) = @_;

        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        my $retval;
        my $opened = open(my $fd, '-|', git_cmd(), 'rev-parse',
                          '--verify', '-q', @options, $hash);
        if ($opened) {
                $retval = <$fd>;
                chomp $retval if defined $retval;
                close $fd;
        }

        $git_dir = $saved_git_dir if defined $saved_git_dir;
        return $retval;
}
2475
# Get type of given object, as printed by 'git cat-file -t <hash>'.
# Returns nothing when the command cannot be started or when closing
# the pipe reports failure.
sub git_get_type {
        my ($hash) = @_;

        my $fd;
        unless (open($fd, "-|", git_cmd(), "cat-file", '-t', $hash)) {
                return;
        }
        my $type = <$fd>;
        unless (close $fd) {
                return;
        }

        chomp $type;
        return $type;
}
2486
# repository configuration
# $config_file records which "$git_dir/config" the cached %config was
# parsed for (empty string: nothing parsed yet); %config holds the parsed
# configuration entries.  Both are maintained by git_get_project_config().
our $config_file = '';
our %config;
2490
# Add $value under $key in the hash referenced by $hash.
# Multiple values for a single key are stored as an anonymous array
# reference; a single value is stored directly in the hash, not as
# [ <value> ].
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                if (ref $hash->{$key}) {
                        # third and later values: extend the existing array
                        push @{$hash->{$key}}, $value;
                } else {
                        # second value: promote the plain scalar to an array
                        $hash->{$key} = [ $hash->{$key}, $value ];
                }
        } else {
                # first value for this key
                $hash->{$key} = $value;
        }
}
2504
# Return hash of git project configuration, as listed by
# 'git config -z -l' for the current $git_dir.
# Optionally limited to some section, e.g. 'gitweb': when
# $section_regexp is given, only keys matching "<section_regexp>." at
# their start are kept.
# Keys occurring more than once get an array reference as value (see
# hash_set_multi); keys listed without a value map to undef.
# Returns nothing when the git command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the filter anew on every call.  (A match using the /o
        # modifier would keep the first section it ever saw for the rest
        # of the process lifetime, e.g. under mod_perl.)
        my $key_filter = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # 'git config -z' terminates every entry with NUL
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # within an entry, key and value are separated by a newline
                my ($key, $value) = split(/\n/, $keyval, 2);

                next if (defined $key_filter && $key !~ $key_filter);
                hash_set_multi(\%config, $key, $value);
        }
        close $fh;

        return %config;
}
2527
# Convert config value to boolean: returns 1 for true, 0 for false.
# No value (undef), a number > 0, and the words 'true', 'yes' and 'on'
# (in any letter case) are true; the rest of values are treated as
# false (never as error).
# Surrounding whitespace is ignored.
sub config_to_bool {
        my $val = shift;

        return 1 if !defined $val;             # section.key

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        # compare numerically, so that e.g. '00' counts as zero
        return 1 if ($val =~ /^\d+$/ && $val != 0);    # section.key = 1
        return 1 if ($val =~ /^(?:true|yes|on)$/i);    # section.key = true
        return 0;
}
2543
# Convert config value to simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (in any letter case) will
# cause the value to be multiplied by 1024, 1048576, or 1073741824.
# Surrounding whitespace is ignored.  A value without a recognized
# suffix is returned as is (after trimming); an undefined value is
# returned as undef, and a bare suffix without digits counts as 0.
sub config_to_int {
        my $val = shift;

        # key without a value: nothing to convert
        return $val unless defined $val;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier = (
                'k' =>       1024,
                'm' =>    1048576,
                'g' => 1073741824,
        );
        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
                # no digits before the suffix: treat as zero
                $num = 0 if $num eq '';
                return $num * $multiplier{lc($unit)};
        }
        return $val;
}
2563
# Convert config value to array reference, if needed: a reference is
# returned unchanged, a defined plain value is wrapped into a one
# element array, and undef yields a reference to an empty array.
sub config_to_multi {
        my $val = shift;

        return $val     if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2570
# Look up a 'gitweb.<key>' variable in the configuration of the current
# repository ($git_dir).
#
# $key may be given with or without the leading 'gitweb.'; $type is
# optional and may be 'bool' or 'int' (a leading '--' is accepted), any
# other type is ignored.
# Returns nothing when $git_dir is not set, the key is empty or contains
# non-word characters, or the variable does not exist.  Otherwise returns
# the stored value: 'true'/'false' for type 'bool', the result of
# config_to_int() for type 'int', and the raw value without a type.
#
# The parsed configuration is cached in %config, keyed on $config_file.
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless $key;
        # only subsection, if exists, is case sensitive,
        # and not lowercased by 'git config -z -l'
        if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
                $key = join(".", lc($1), $2, lc($3));
        } else {
                $key = lc($key);
        }
        $key =~ s/^gitweb\.//;
        return if $key =~ m/\W/;

        # type sanity check: anything but 'bool' and 'int' means "no type"
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # (re)read the config if the cache belongs to another repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        return unless exists $config{$full_key};

        # ensure given type
        if (defined $type && $type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return config_to_bool($config{$full_key}) ? 'true' : 'false';
        }
        if (defined $type && $type eq 'int') {
                return config_to_int($config{$full_key});
        }
        return $config{$full_key};
}
2616
# Get hash of given path at given ref, using 'git ls-tree'.
# $base is the tree-ish, $path the path below it (trailing slashes are
# ignored), and the optional $type restricts the result to entries of
# that object type.
# Returns undef when $path is empty, when there is no entry for $path at
# $base, when the ls-tree output cannot be parsed, when the entry is of
# a different type than requested, or when closing the pipe fails.
# Reports a 500 error through die_error() if git cannot be started.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # bail out on unparsable output rather than trusting capture
        # variables left over from some earlier, unrelated match
        unless ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                return undef;
        }
        my ($entry_type, $entry_hash) = ($2, $3);

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2643
# Get path of entry with given hash at given tree-ish (ref);
# used to get 'from' filename for combined diff (merge commit) for renames.
# Walks the output of 'git ls-tree -r -t -z <base>' and returns the path
# of the first entry whose object id equals $hash.
# Returns nothing when $base or $hash is empty, and undef when git cannot
# be started or no entry matches.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # with -z every entry is terminated by NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # $hash is matched literally (\Q..\E) against the id field
                # only; /s lets the path part contain newlines, which -z
                # output leaves unquoted
                if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
                        close $fd;
                        return $1;
                }
        }
        close $fd;
        return undef;
}
2667
2668## ......................................................................
2669## git utility functions, directly accessing git repository
2670
# Get the value of a config variable either from the file named as the
# variable itself in the repository ($GIT_DIR/$name file), or, when that
# file cannot be opened, from the gitweb.$name configuration variable in
# the repository config file.
# Only the first line of the file is used, without its line ending.
# Sets the global $git_dir to the repository at $projectroot/$path.
sub git_get_file_or_project_config {
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open($fd, '<', "$git_dir/$name")) {
                return git_get_project_config($name);
        }
        my $conf = <$fd>;
        close $fd;

        chomp $conf if defined $conf;
        return $conf;
}
2687
# Get the description of the project at $path: the 'description' file of
# the repository or the gitweb.description config variable
# (see git_get_file_or_project_config).
sub git_get_project_description {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'description');
}
2692
# Get the category of the project at $path: the 'category' file of the
# repository or the gitweb.category config variable
# (see git_get_file_or_project_config).
sub git_get_project_category {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'category');
}
2697
2698
# Return a hash reference mapping content tags of $project to weights.
# Sets the global $git_dir to the repository of the project.
#
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                # plain files only; this also drops '.' and '..'
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        my $val = <$ct>;
                        close $ct;
                        # $val is undef for an empty file
                        chomp $val if defined $val;

                        # the tag is named after the file
                        (my $ctag = $tagfile) =~ s#.*/##;
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2745
# Return hash reference, where keys are content tags ('ctags'), and
# values are sum of weights of given tag in every project.
# $projects is a reference to a list of project hashes; the tags of each
# project are read from its 'ctags' entry.
sub git_gather_all_ctags {
        my $projects = shift;
        my %total;

        foreach my $proj (@$projects) {
                $total{$_} += $proj->{'ctags'}->{$_}
                        for keys %{$proj->{'ctags'}};
        }

        return \%total;
}
2760
# Build a tag cloud out of a hash reference of content tags (tag => weight).
#
# Tags differing only in letter case are merged: their weights are added
# up, and the spelling with the largest weight is used for display.
# The tag named by the 'by_tag' CGI parameter gets its title wrapped in
# <span class="match">.
#
# Returns an HTML::TagCloud object when that module can be loaded;
# otherwise a hash reference keyed by lowercased tag, where each entry
# holds 'count' (summed weight) and 'ctag' (HTML link for the tag).
sub git_populate_project_tagcloud {
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %merged;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $entry  = ($merged{lc $tag} ||= {});
                $entry->{count} += $weight;
                if (!$entry->{topcount} || $entry->{topcount} < $weight) {
                        $entry->{topcount} = $weight;
                        $entry->{topname}  = $tag;
                }
        }

        my $cloud;
        my $matched = $cgi->param('by_tag');
        # mark the title of the currently selected tag, if any
        my $highlight = sub {
                my ($ctag, $title) = @_;
                return $title unless (defined $matched && $matched eq $ctag);
                return qq(<span class="match">$title</span>);
        };

        if (eval { require HTML::TagCloud; 1; }) {
                $cloud = HTML::TagCloud->new;
                foreach my $ctag (sort keys %merged) {
                        # Pad the title with spaces so that the cloud looks
                        # less crammed.
                        my $title = esc_html($merged{$ctag}->{topname});
                        $title =~ s/ /&nbsp;/g;
                        $title =~ s/^/&nbsp;/g;
                        $title =~ s/$/&nbsp;/g;
                        $title = $highlight->($ctag, $title);
                        $cloud->add($title, href(project=>undef, ctag=>$ctag),
                                    $merged{$ctag}->{count});
                }
        } else {
                # no HTML::TagCloud: plain hash of counts and links
                $cloud = {};
                foreach my $ctag (keys %merged) {
                        my $title = esc_html($merged{$ctag}->{topname}, -nbsp=>1);
                        $title = $highlight->($ctag, $title);
                        $cloud->{$ctag}{count} = $merged{$ctag}->{count};
                        $cloud->{$ctag}{ctag} =
                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                }
        }
        return $cloud;
}
2806
# Render a tag cloud built by git_populate_project_tagcloud() as HTML,
# limited to the $count most used tags.
#
# An HTML::TagCloud object renders itself via html_and_css($count).
# The fallback hash form is rendered as a comma separated list of tag
# links inside <div id="htmltagcloud">, most used tags first (ties are
# ordered by tag name); an undefined $count means no limit.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        }

        # heaviest tags first, so that truncating keeps the popular
        # ones, like the HTML::TagCloud limit does
        my @tags = sort {
                $cloud->{$b}->{'count'} <=> $cloud->{$a}->{'count'}
                        or $a cmp $b
        } keys %$cloud;
        if (defined $count && $count >= 0 && $count < @tags) {
                splice(@tags, $count);
        }

        return
                '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
                join (', ', map {
                        $cloud->{$_}->{'ctag'}
                } @tags) .
                '</div>';
}
2821
# Get the list of URLs of the project at $path: the lines of the
# 'cloneurl' file in the repository, or, when that file cannot be opened,
# the values of the multi-valued gitweb.url config variable.
# Returns a list in list context and an array reference otherwise.
# Sets the global $git_dir to the repository at $projectroot/$path.
sub git_get_project_url_list {
        my $path = shift;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open($fd, '<', "$git_dir/cloneurl")) {
                # no cloneurl file: fall back to the repository config
                my $configured = config_to_multi(git_get_project_config('url'));
                return wantarray ? @$configured : $configured;
        }
        my @git_project_url_list = <$fd>;
        close $fd;
        chomp @git_project_url_list;

        return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2835
# Return the list of exported projects, each a hash reference with a
# 'path' key (and an 'owner' key when read from an index file).
#
# If $projects_list is a directory it is scanned for repositories, down
# to $project_maxdepth levels; if it is a file, projects are read from
# it, one url-encoded "<path> <owner>" pair per line.  Only projects
# accepted by check_export_ok() are returned.
#
# $filter, when given, limits the result to projects below that path
# prefix.  When scanning a directory the search normally starts in the
# filtered subdirectory; with a true $paranoid the whole tree is scanned
# and the prefix is checked for each candidate instead.
sub git_get_projects_list {
        my $filter = shift || '';
        my $paranoid = shift;
        my @list;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter && !$paranoid) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # paranoidly only filter here
                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
                                        # leave the callback with 'return': there is no
                                        # loop of ours to continue here, and 'next' would
                                        # exit the subroutine through loop control
                                        return;
                                }
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        # a repository does not contain other projects
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next PROJECT;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next PROJECT;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
2917
# Remove forks from a list of projects, and return the remaining ones.
# $projects is a reference to a list of project hashes (with 'path' key).
# A project counts as a fork when its path lies below the directory
# named after another project without the '.git' suffix, provided that
# directory exists under $projectroot.
#
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
# as side effects it sets 'forks' field to list of forks for forked projects
sub filter_forks_from_projects_list {
        my $projects = shift;

        my %trie; # prefix tree of directories (path components)
        # generate trie out of those directories that might contain forks
        foreach my $pr (@$projects) {
                my $path = $pr->{'path'};
                $path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
                next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
                next unless ($path);      # skip '.git' repository: tests, git-instaweb
                next unless (-d "$projectroot/$path"); # containing directory exists
                $pr->{'forks'} = [];      # there can be 0 or more forks of project

                # add to trie
                my @dirs = split('/', $path);
                # walk the trie, until either runs out of components or out of trie
                my $ref = \%trie;
                while (scalar @dirs &&
                       exists($ref->{$dirs[0]})) {
                        $ref = $ref->{shift @dirs};
                }
                # create rest of trie structure from rest of components
                foreach my $dir (@dirs) {
                        $ref = $ref->{$dir} = {};
                }
                # create end marker, store $pr as a data
                # (the empty string key cannot clash with a path component;
                # the first project to claim a node keeps it)
                $ref->{''} = $pr if (!exists $ref->{''});
        }

        # filter out forks, by finding shortest prefix match for paths
        my @filtered;
 PROJECT:
        foreach my $pr (@$projects) {
                # trie lookup
                my $ref = \%trie;
        DIR:
                foreach my $dir (split('/', $pr->{'path'})) {
                        # the end marker is tested before descending, so only
                        # a proper prefix of the path can match here
                        if (exists $ref->{''}) {
                                # found [shortest] prefix, is a fork - skip it
                                push @{$ref->{''}{'forks'}}, $pr;
                                next PROJECT;
                        }
                        if (!exists $ref->{$dir}) {
                                # not in trie, cannot have prefix, not a fork
                                push @filtered, $pr;
                                next PROJECT;
                        }
                        # If the dir is there, we just walk one step down the trie.
                        $ref = $ref->{$dir};
                }
                # we ran out of trie
                # (shouldn't happen: it's either no match, or end marker)
                push @filtered, $pr;
        }

        return @filtered;
}
2977
# Return those projects from the list referenced by $projlist that match
# the given criteria, passed as options:
#   tagfilter  - keep only projects having this content tag
#                (compared case-insensitively against keys of 'ctags')
#   searchtext - keep only projects whose 'path' or 'descr_long'
#                matches this text, used as a regular expression
# Without any criteria the whole list is returned.
#
# note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my ($tagfilter, $searchtext) = @opts{'tagfilter', 'searchtext'};

        return @$projlist
                unless ($tagfilter || $searchtext);

        my @kept;
        foreach my $candidate (@$projlist) {

                if ($tagfilter) {
                        my $tags = $candidate->{'ctags'};
                        next if (ref($tags) ne 'HASH');
                        my $wanted = lc($tagfilter);
                        my $hits = grep { lc($_) eq $wanted } keys %$tags;
                        next if (!$hits);
                }

                if ($searchtext) {
                        my $found = $candidate->{'path'} =~ /$searchtext/
                                 || $candidate->{'descr_long'} =~ /$searchtext/;
                        next if (!$found);
                }

                push @kept, $candidate;
        }

        return @kept;
}
3009
# Cache of project owners read from the $projects_list file:
# undef until the first load attempt, afterwards a hash reference
# mapping project path to owner.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list file, at most once.
# After the first call the cache is defined (possibly empty), even if
# $projects_list is not a plain file or cannot be opened.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        return unless (-f $projects_list);

        # an unreadable file simply leaves the cache empty
        open(my $fd, '<', $projects_list)
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($pr, $ow) = split ' ', $line;
                # blank line: there is no project to record
                next unless (defined $pr);
                $pr = unescape($pr);
                $ow = unescape($ow);
                $gitweb_project_owner->{$pr} = to_utf8($ow);
        }
        close $fd;
        return;
}
3032
# Get the owner of the given project, trying in turn: the owner listed
# in the $projects_list file, the gitweb.owner config variable of the
# repository, and finally get_file_owner() on the repository directory.
# Returns undef when no project is given.
# Sets the global $git_dir to the repository of the project.
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # load the owners from the index file on first use
        git_get_project_list_from_file()
                unless (defined $gitweb_project_owner);

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if (exists $gitweb_project_owner->{$project});
        $owner = git_get_project_config('owner')
                unless (defined $owner);
        $owner = get_file_owner("$git_dir")
                unless (defined $owner);

        return $owner;
}
3056
# Find out when the project at $path was last changed, based on the
# committer line of the most recently committed ref under refs/heads.
# Returns the list (age in seconds, age as formatted by age_string());
# (undef, undef) when no timestamp could be extracted; and nothing at
# all when git cannot be started or closing the pipe fails.
# Sets the global $git_dir to the repository at $projectroot/$path.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        open(my $fd, "-|", git_cmd(), 'for-each-ref',
             '--format=%(committer)',
             '--sort=-committerdate',
             '--count=1',
             'refs/heads') or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the line is expected to end with "<epoch> <timezone>"
        unless (defined $most_recent &&
                $most_recent =~ / (\d+) [-+][01]\d\d\d$/) {
                return (undef, undef);
        }
        my $age = time() - $1;
        return ($age, age_string($age));
}
3077
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and pick
# out the entries we want.
#
# Returns a hash (or a reference to it in scalar context) keyed by remote
# name; each value is a hash holding a 'heads' placeholder plus one entry per
# "(<key>)" suffix printed by 'git remote -v', mapping that key to its URL.
# If $wanted is given, only that remote is included.
# Returns nothing if the git command cannot be run or exits with an error.
sub git_get_remotes_list {
	my $wanted = shift;
	my %remotes = ();

	# test open() itself: the lexical handle is autovivified even when
	# open() fails, so checking $fd afterwards would never catch a failure
	open my $fd, '-|' , git_cmd(), 'remote', '-v'
		or return;
	while (my $remote = <$fd>) {
		chomp $remote;
		# "<name>\t<url> (<key>)": strip everything after the name;
		# skip lines of any other shape rather than reuse stale captures
		$remote =~ s!\t(.*?)\s+\((\w+)\)$!!
			or next;
		my ($url, $key) = ($1, $2);
		next if $wanted and $remote ne $wanted;

		# 'heads' stays undefined until fill_remote_heads() sets it
		$remotes{$remote} ||= { 'heads' => undef };
		$remotes{$remote}{$key} = $url;
	}
	close $fd or return;
	return wantarray ? %remotes : \%remotes;
}
3102
# Takes a reference to a hash of remotes as first parameter and fills it by
# adding the available remote heads for each of the indicated remotes:
# $remotes->{$remote}{'heads'} becomes a reference to an array of the head
# entries (as returned by git_get_heads_list) whose name starts with
# "$remote/".  That prefix is stripped from each entry's 'name' in place.
sub fill_remote_heads {
	my $remotes = shift;
	my @heads = map { "remotes/$_" } keys %$remotes;
	my @remoteheads = git_get_heads_list(undef, @heads);
	foreach my $remote (keys %$remotes) {
		# \Q..\E: the remote name is literal text, not a pattern
		# (otherwise e.g. a '.' in it would match any character)
		$remotes->{$remote}{'heads'} = [ grep {
			$_->{'name'} =~ s!^\Q$remote\E/!!
			} @remoteheads ];
	}
}
3115
# Return a reference to a hash mapping object id => [ ref names ], built
# from 'git show-ref --dereference'.  Ref names are stored without the
# leading "refs/".  An optional $type (e.g. "heads" or "tags") restricts the
# listing to "refs/$type".
# Returns nothing if the git command cannot be run or exits with an error.
sub git_get_references {
	my $type = shift || "";
	my %refs;

	# use -- <pattern> if $type
	my @pattern = $type ? ("--", "refs/$type") : ();
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
		or return;

	# sample output:
	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	while (my $line = <$fd>) {
		chomp $line;
		next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
		# the array is autovivified the first time an id is seen
		push @{$refs{$1}}, $2;
	}
	close $fd or return;
	return \%refs;
}
3138
# Return the tag-relative name that 'git name-rev --tags' reports for $hash
# (the part after "tags/"), or undef if there is none.
# Returns undef for a false $hash, and nothing if git cannot be started.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# no output at all: nothing to match against
	return undef unless defined $name_rev;

	# \Q..\E: $hash is matched as literal text
	if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
		return $1;
	} else {
		# catches also '$hash undefined' output
		return undef;
	}
}
3154
3155## ----------------------------------------------------------------------
3156## parse to hash functions
3157
# Break an epoch timestamp into displayable pieces.
#
# Parameters:
#   $epoch - seconds since the epoch
#   $tz    - timezone as "+hhmm" / "-hhmm" (defaults to "-0000")
#
# Returns a hash with UTC-based fields 'hour', 'minute', 'mday', 'day',
# 'month', 'rfc2822', 'mday-time', 'iso-8601', and fields shifted by $tz:
# 'hour_local', 'minute_local', 'iso-tz'; 'tz_local' is $tz verbatim.
# A $tz that is not of the form [+-]hhmm is treated as a zero offset.
sub parse_date {
	my $epoch = shift;
	my $tz = shift || "-0000";

	my %date;
	my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
	my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
	my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
	$date{'hour'} = $hour;
	$date{'minute'} = $min;
	$date{'mday'} = $mday;
	$date{'day'} = $days[$wday];
	$date{'month'} = $months[$mon];
	$date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
	                     $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
	$date{'mday-time'} = sprintf "%d %s %02d:%02d",
	                     $mday, $months[$mon], $hour ,$min;
	$date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
	                     1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

	# offset of the local time from UTC, in seconds; stays 0 when $tz
	# cannot be parsed, instead of computing with undefined captures
	my $offset = 0;
	if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
		my $tz_sign = ($1 eq '-' ? -1 : +1);
		$offset = $tz_sign*((($2*60) + $3)*60);
	}
	my $local = $epoch + $offset;
	($sec, $min, $hour, $mday, $mon, $year) = gmtime($local);
	$date{'hour_local'} = $hour;
	$date{'minute_local'} = $min;
	$date{'tz_local'} = $tz;
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$year, $mon+1, $mday,
	                          $hour, $min, $sec, $tz);
	return %date;
}
3191
# Parse the tag object $tag_id (read via 'git cat-file tag').
#
# Returns a hash with 'id' plus, when the corresponding header lines are
# present: 'object', 'type', 'name', 'author', 'author_epoch', 'author_tz',
# 'author_name', 'author_email'; 'comment' is a reference to an array of the
# remaining lines.
# Returns nothing if git cannot be run, exits with an error, or the object
# has no "tag <name>" header.
sub parse_tag {
	my $tag_id = shift;
	my %tag;
	my @comment;

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
	$tag{'id'} = $tag_id;
	while (my $line = <$fd>) {
		chomp $line;
		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
			next;
		}
		if ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
			next;
		}
		if ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
			next;
		}
		if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{qw(author author_epoch author_tz)} = ($1, $2, $3);
			# split "Name <email>" when it has that shape
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@tag{qw(author_name author_email)} = ($1, $2);
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
			next;
		}
		if ($line =~ m/--BEGIN/) {
			# this line already belongs to the comment
			push @comment, $line;
			last;
		}
		# an empty line ends the header
		last if $line eq "";
	}
	# everything that is left is the comment
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag;
}
3232
# Parse one record of 'git rev-list --header' output.
#
# Parameters:
#   $commit_text - the record: a header line starting with the commit id
#                  (followed by parent ids when --parents was used), the
#                  commit headers, an empty line, the indented message, and a
#                  final element which is dropped
#   $withparents - if defined, parents are taken only from the first line;
#                  otherwise "parent <id>" header lines are collected too
#
# Returns a hash describing the commit ('id', 'tree', 'parents', 'parent',
# author/committer fields, 'title', 'title_short', 'comment', age fields),
# or nothing if the text is empty, does not start with an object id, or has
# no tree line.
sub parse_commit_text {
	my ($commit_text, $withparents) = @_;
	my @commit_lines = split '\n', $commit_text;
	my %co;

	pop @commit_lines; # Remove '\0'

	return unless @commit_lines;

	my $header = shift @commit_lines;
	return unless $header =~ m/^[0-9a-fA-F]{40}/;
	($co{'id'}, my @parents) = split ' ', $header;

	# commit headers; the loop stops at the first line that is false,
	# i.e. the empty line separating headers from the message
	while (my $line = shift @commit_lines) {
		last if $line eq "\n";
		if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
			$co{'tree'} = $1;
		} elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
			push @parents, $1;
		} elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
			$co{'author'} = to_utf8($1);
			@co{qw(author_epoch author_tz)} = ($2, $3);
			if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@co{qw(author_name author_email)} = ($1, $2);
			} else {
				$co{'author_name'} = $co{'author'};
			}
		} elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
			$co{'committer'} = to_utf8($1);
			@co{qw(committer_epoch committer_tz)} = ($2, $3);
			if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
				@co{qw(committer_name committer_email)} = ($1, $2);
			} else {
				$co{'committer_name'} = $co{'committer'};
			}
		}
	}
	return unless defined $co{'tree'};

	$co{'parents'} = \@parents;
	$co{'parent'} = $parents[0];

	# the title is the first non-empty message line; note that $title
	# aliases the array element, so the edits below also change that line
	# in @commit_lines (and thus in 'comment')
	foreach my $title (@commit_lines) {
		$title =~ s/^    //;
		next if $title eq "";

		$co{'title'} = chop_str($title, 80, 5);
		# remove leading stuff of merges to make the interesting part visible
		if (length($title) > 50) {
			$title =~ s/^Automatic //;
			$title =~ s/^merge (of|with) /Merge ... /i;
			if (length($title) > 50) {
				$title =~ s/(http|rsync):\/\///;
			}
			if (length($title) > 50) {
				$title =~ s/(master|www|rsync)\.//;
			}
			if (length($title) > 50) {
				$title =~ s/kernel.org:?//;
			}
			if (length($title) > 50) {
				$title =~ s/\/pub\/scm//;
			}
		}
		$co{'title_short'} = chop_str($title, 50, 5);
		last;
	}
	if (! defined $co{'title'} || $co{'title'} eq "") {
		$co{'title'} = $co{'title_short'} = '(no commit message)';
	}
	# remove added spaces
	s/^    // foreach @commit_lines;
	$co{'comment'} = \@commit_lines;

	my $age = time - $co{'committer_epoch'};
	$co{'age'} = $age;
	$co{'age_string'} = age_string($age);
	my (undef, undef, undef, $mday, $mon, $year) = gmtime($co{'committer_epoch'});
	my $commit_date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
	# older than two weeks: the date goes first, the relative age second;
	# otherwise the other way round
	if ($age > 60*60*24*7*2) {
		@co{qw(age_string_date age_string_age)} = ($commit_date, $co{'age_string'});
	} else {
		@co{qw(age_string_date age_string_age)} = ($co{'age_string'}, $commit_date);
	}
	return %co;
}
3330
# Parse the single commit $commit_id via
# 'git rev-list --parents --header --max-count=1'.
# Returns the hash produced by parse_commit_text(), which is empty when git
# printed nothing or the output could not be parsed.
# Calls die_error(500, ...) if git cannot be started.
sub parse_commit {
	my ($commit_id) = @_;
	my %co;

	# records are NUL-terminated
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "rev-list",
		"--parents",
		"--header",
		"--max-count=1",
		$commit_id,
		"--",
		or die_error(500, "Open git-rev-list failed");
	# read exactly one record in scalar context; reading the handle inside
	# the argument list would flatten zero or several records into the
	# arguments and shift the $withparents flag
	my $commit_text = <$fd>;
	close $fd;

	%co = parse_commit_text($commit_text, 1)
		if defined $commit_text;

	return %co;
}
3349
# Parse up to $maxcount commits reachable from $commit_id, after skipping
# $skip of them, optionally limited to the path $filename.  @args are extra
# options placed before the limits on the 'git rev-list' command line.
# $maxcount defaults to 1 and $skip to 0 when false.
#
# Returns a list (or, in scalar context, a reference to an array) of hash
# references, one per record, as produced by parse_commit_text().
# Calls die_error(500, ...) if git cannot be started.
sub parse_commits {
	my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
	my @cos;

	$maxcount = 1 unless $maxcount;
	$skip     = 0 unless $skip;

	# records are NUL-terminated
	local $/ = "\0";

	my @path_limit = $filename ? ($filename) : ();
	open my $fd, "-|", git_cmd(), "rev-list",
		"--header",
		@args,
		"--max-count=$maxcount",
		"--skip=$skip",
		@extra_options,
		$commit_id,
		"--",
		@path_limit
		or die_error(500, "Open git-rev-list failed");
	while (my $record = <$fd>) {
		push @cos, +{ parse_commit_text($record) };
	}
	close $fd;

	return wantarray ? @cos : \@cos;
}
3377
# parse line of git-diff-tree "raw" output
#
# Three line shapes are recognized:
#   - ordinary diff line    -> 'from_mode', 'to_mode', 'from_id', 'to_id',
#                              'status', 'similarity', 'from_file', 'to_file'
#                              (and 'file' unless renamed or copied)
#   - combined diff line    -> 'nparents', array refs 'from_mode', 'from_id'
#                              and 'status', plus 'to_mode', 'to_id', 'to_file'
#   - bare 40-hex object id -> 'commit'
# Any other line yields an empty hash.
# Returns the hash in list context, a reference to it in scalar context.
sub parse_difftree_raw_line {
	my ($line) = @_;
	my %info;

	# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
	# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
	if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
		my $paths = $7;
		@info{qw(from_mode to_mode from_id to_id status similarity)} =
			($1, $2, $3, $4, $5, $6);
		if ($info{'status'} eq 'R' || $info{'status'} eq 'C') { # renamed or copied
			@info{qw(from_file to_file)} =
				map { unquote($_) } split("\t", $paths);
		} else {
			$info{'from_file'} = $info{'to_file'} = $info{'file'} = unquote($paths);
		}
	}
	# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
	# combined diff (for merge commit)
	elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
		my ($colons, $modes, $ids, $statuses, $path) = ($1, $2, $3, $4, $5);
		my @modes = split(' ', $modes);
		my @ids   = split(' ', $ids);

		$info{'nparents'}  = length($colons);
		# the last mode/id describes the result, the others the parents
		$info{'to_mode'}   = pop @modes;
		$info{'from_mode'} = \@modes;
		$info{'to_id'}     = pop @ids;
		$info{'from_id'}   = \@ids;
		$info{'status'}    = [ split('', $statuses) ];
		$info{'to_file'}   = unquote($path);
	}
	# 'c512b523472485aef4fff9e57b229d9d243c967f'
	elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
		$info{'commit'} = $1;
	}

	return wantarray ? %info : \%info;
}
3416
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
# A hash reference is handed back untouched; anything else is passed to
# parse_difftree_raw_line().
sub parsed_difftree_line {
	my ($line_or_ref) = @_;

	# pre-parsed (or generated by hand)
	return $line_or_ref
		if ref($line_or_ref) eq "HASH";

	return parse_difftree_raw_line($line_or_ref);
}
3429
# parse line of git-ls-tree output
#
# Parameters:
#   $line - one entry of ls-tree output
#   %opts - '-l' => true if the entry carries a size column,
#           '-z' => true if names are NUL-separated and therefore not quoted
#
# Returns a hash (a reference to it in scalar context) with 'mode', 'type',
# 'hash', 'name' and, with -l, 'size'.  A line that does not look like
# ls-tree output yields an empty hash.
sub parse_ls_tree_line {
	my $line = shift;
	my %opts = @_;
	my %res;
	my $name;

	# only use the captures of a match that succeeded; otherwise they
	# would still hold whatever an earlier, unrelated match left behind
	if ($opts{'-l'}) {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
		if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s) {
			@res{qw(mode type hash size)} = ($1, $2, $3, $4);
			$name = $5;
		}
	} else {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
		if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s) {
			@res{qw(mode type hash)} = ($1, $2, $3);
			$name = $4;
		}
	}

	if (defined $name) {
		# without -z the name may be quoted
		$res{'name'} = $opts{'-z'} ? $name : unquote($name);
	}

	return wantarray ? %res : \%res;
}
3465
# fills _two_ hashes, references to which are passed as the 2nd and 3rd
# arguments: $from and $to each get a 'file' entry and, where the file
# exists on that side, an 'href' entry linking to its blob view.
# For a combined diff ($diffinfo->{'nparents'} set) the $from entries are
# array references with one element per parent; @parents supplies the
# hash_base of each parent.
sub parse_from_to_diffinfo {
	my ($diffinfo, $from, $to, @parents) = @_;

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$from->{'file'} = [];
		$from->{'href'} = [];
		fill_from_file_info($diffinfo, @parents)
			unless exists $diffinfo->{'from_file'};
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			# fall back to the resulting name when this parent has none
			my $parent_file = $diffinfo->{'from_file'}[$i];
			$from->{'file'}[$i] = defined $parent_file
				? $parent_file
				: $diffinfo->{'to_file'};
			# no link for a file that is new (added) relative to this parent
			$from->{'href'}[$i] = $diffinfo->{'status'}[$i] ne "A"
				? href(action=>"blob",
				       hash_base=>$parents[$i],
				       hash=>$diffinfo->{'from_id'}[$i],
				       file_name=>$from->{'file'}[$i])
				: undef;
		}
	} else {
		# ordinary (not combined) diff
		$from->{'file'} = $diffinfo->{'from_file'};
		if ($diffinfo->{'status'} eq "A") { # new (added) file
			delete $from->{'href'};
		} else {
			$from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
			                       hash=>$diffinfo->{'from_id'},
			                       file_name=>$from->{'file'});
		}
	}

	$to->{'file'} = $diffinfo->{'to_file'};
	if (is_deleted($diffinfo)) { # file is gone in result
		delete $to->{'href'};
	} else {
		$to->{'href'} = href(action=>"blob", hash_base=>$hash,
		                     hash=>$diffinfo->{'to_id'},
		                     file_name=>$to->{'file'});
	}
}
3511
3512## ......................................................................
3513## parse to array of hashes functions
3514
# List refs of the given classes (default: 'heads', i.e. refs/heads), sorted
# by 'git for-each-ref' with the most recent committer date first.
#
# Parameters:
#   $limit   - if true, git is asked for at most $limit+1 entries
#   @classes - ref namespaces below refs/ to list
#
# Returns a list (in scalar context a reference to an array) of hash
# references with 'fullname', 'name', 'id', 'title', 'epoch' and 'age'.
# Returns nothing if git cannot be started.
sub git_get_heads_list {
	my ($limit, @classes) = @_;
	@classes = ('heads') unless @classes;
	my @patterns = map { "refs/$_" } @classes;
	my @headslist;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
		'--format=%(objectname) %(refname) %(subject)%00%(committer)',
		@patterns
		or return;
	while (my $line = <$fd>) {
		my %ref_item;

		chomp $line;
		my ($refinfo, $committerinfo) = split(/\0/, $line);
		my ($hash, $name, $title) = split(' ', $refinfo, 3);
		# split() drops a trailing empty field, so an empty %(committer)
		# leaves $committerinfo undefined; do not match against undef
		my ($committer, $epoch, $tz) = defined $committerinfo
			? ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/)
			: ();
		$ref_item{'fullname'}  = $name;
		$name =~ s!^refs/(?:head|remote)s/!!;

		$ref_item{'name'}  = $name;
		$ref_item{'id'}    = $hash;
		$ref_item{'title'} = $title || '(no commit message)';
		$ref_item{'epoch'} = $epoch;
		if ($epoch) {
			$ref_item{'age'} = age_string(time - $ref_item{'epoch'});
		} else {
			$ref_item{'age'} = "unknown";
		}

		push @headslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @headslist : \@headslist;
}
3553
# List refs under refs/tags, sorted by 'git for-each-ref' with the most
# recent creator date first.
#
# Parameters:
#   $limit - if true, git is asked for at most $limit+1 entries
#
# Returns a list (in scalar context a reference to an array) of hash
# references with 'fullname', 'name', 'type', 'id', 'reftype', 'refid';
# entries of type "tag" also get 'subject', and entries of type "tag" or
# "commit" get 'epoch' and 'age'.
# Returns nothing if git cannot be started.
sub git_get_tags_list {
	my $limit = shift;
	my @tagslist;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
		'--format=%(objectname) %(objecttype) %(refname) '.
		'%(*objectname) %(*objecttype) %(subject)%00%(creator)',
		'refs/tags'
		or return;
	while (my $line = <$fd>) {
		my %ref_item;

		chomp $line;
		my ($refinfo, $creatorinfo) = split(/\0/, $line);
		my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
		# split() drops a trailing empty field, so an empty %(creator)
		# leaves $creatorinfo undefined; do not match against undef
		my ($creator, $epoch, $tz) = defined $creatorinfo
			? ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/)
			: ();
		$ref_item{'fullname'} = $name;
		$name =~ s!^refs/tags/!!;

		$ref_item{'type'} = $type;
		$ref_item{'id'} = $id;
		$ref_item{'name'} = $name;
		if ($type eq "tag") {
			# tag object: report what it points at
			$ref_item{'subject'} = $title;
			$ref_item{'reftype'} = $reftype;
			$ref_item{'refid'}   = $refid;
		} else {
			# the ref points directly at the object
			$ref_item{'reftype'} = $type;
			$ref_item{'refid'}   = $id;
		}

		if ($type eq "tag" || $type eq "commit") {
			$ref_item{'epoch'} = $epoch;
			if ($epoch) {
				$ref_item{'age'} = age_string(time - $ref_item{'epoch'});
			} else {
				$ref_item{'age'} = "unknown";
			}
		}

		push @tagslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @tagslist : \@tagslist;
}
3602
3603## ----------------------------------------------------------------------
3604## filesystem-related functions
3605
# Return the owner of $path as recorded in the GECOS field of the password
# database entry for the file's uid, cut at the first ',' or ';' and passed
# through to_utf8().
# Returns undef if $path cannot be stat()ed or no GECOS field is available.
sub get_file_owner {
	my $path = shift;

	# stat() returns an empty list on failure; without this guard the
	# undefined uid would be numified to 0 and the entry for uid 0
	# reported as the owner
	my $st_uid = (stat($path))[4];
	return undef unless defined $st_uid;

	my $gcos = (getpwuid($st_uid))[6];
	if (!defined $gcos) {
		return undef;
	}
	my $owner = $gcos;
	$owner =~ s/[,;].*$//;
	return to_utf8($owner);
}
3618
# Print the contents of $filename to the currently selected output handle,
# each line passed through to_utf8().
# The file is expected to exist; if it cannot be opened after all, nothing
# is printed.
sub insert_file {
	my $filename = shift;

	# do not read from a handle that failed to open
	open my $fd, '<', $filename
		or return;
	print map { to_utf8($_) } <$fd>;
	close $fd;
}
3627
3628## ......................................................................
3629## mimetype related functions
3630
# Look up the MIME type for $filename by its extension in the mime.types
# style file $mimemap ("<mimetype> <ext> <ext> ..." per line, '#' starts a
# comment line).  When an extension is listed more than once, the last
# listing wins.
# Returns undef if $mimemap is not readable, $filename has no extension, or
# the extension is not listed.
sub mimetype_guess_file {
	my $filename = shift;
	my $mimemap = shift;
	-r $mimemap or return undef;

	# take the extension from a match that actually succeeded, instead of
	# reading $1 after a match that may have failed
	$filename =~ /\.([^.]*)$/ or return undef;
	my $wanted_ext = $1;

	my %mimemap;
	open(my $mh, '<', $mimemap) or return undef;
	# lexical loop variable: leave the caller's $_ alone
	while (my $line = <$mh>) {
		next if $line =~ m/^#/; # skip comments
		my ($mimetype, @exts) = split(/\s+/, $line);
		foreach my $ext (@exts) {
			$mimemap{$ext} = $mimetype;
		}
	}
	close($mh);

	return $mimemap{$wanted_ext};
}
3650
# Guess the MIME type of $filename from its extension.
# The file named by $mimetypes_file is consulted first (when set; a relative
# path is taken relative to the current project), then '/etc/mime.types'.
# Returns undef if $filename contains no '.'; otherwise whatever the lookups
# produce.
sub mimetype_guess {
	my ($filename) = @_;
	return undef unless $filename =~ /\./;

	my $mime;
	if ($mimetypes_file) {
		# if it is relative path, it is relative to project
		my $file = ($mimetypes_file =~ m!^/!)
			? $mimetypes_file
			: "$projectroot/$project/$mimetypes_file";
		$mime = mimetype_guess_file($filename, $file);
	}
	$mime = mimetype_guess_file($filename, '/etc/mime.types')
		unless $mime;
	return $mime;
}
3667
# Determine the MIME type of a blob.
#
# Parameters:
#   $fd       - filehandle of the blob contents (may be false)
#   $filename - name of the blob (may be false)
#
# The extension-based guess is preferred.  Without one,
# $default_blob_plain_mimetype is returned when there is no handle;
# otherwise the -T text test on the handle and a few well-known image
# extensions decide.
sub blob_mimetype {
	my ($fd, $filename) = @_;

	if ($filename) {
		my $mime = mimetype_guess($filename);
		return $mime if $mime;
	}

	# just in case
	return $default_blob_plain_mimetype unless $fd;

	return 'text/plain'               if -T $fd;
	return 'application/octet-stream' unless $filename;
	return 'image/png'                if $filename =~ m/\.png$/i;
	return 'image/gif'                if $filename =~ m/\.gif$/i;
	return 'image/jpeg'               if $filename =~ m/\.jpe?g$/i;
	return 'application/octet-stream';
}
3694
# Return the Content-Type value for a blob: $type if given (true), otherwise
# the result of blob_mimetype($fd, $file_name).  For 'text/plain' the
# charset from $default_text_plain_charset is appended when that is defined.
sub blob_contenttype {
	my ($fd, $file_name, $type) = @_;

	$type = blob_mimetype($fd, $file_name) unless $type;

	my $wants_charset = $type eq 'text/plain'
		&& defined $default_text_plain_charset;
	return $type unless $wants_charset;

	return "$type; charset=$default_text_plain_charset";
}
3705
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Parameters:
#   $highlight - true if highlighting is enabled
#   $mimetype  - not used by the lookup
#   $file_name - name of the file; a trailing '.in' is ignored
#
# The basename is looked up in %highlight_basename first, then its extension
# in %highlight_ext.
sub guess_file_syntax {
	my ($highlight, $mimetype, $file_name) = @_;
	return undef unless ($highlight && defined $file_name);
	my $basename = basename($file_name, '.in');
	return $highlight_basename{$basename}
		if exists $highlight_basename{$basename};

	# no extension: nothing more to look up (and do not read $1 left
	# behind by some earlier, unrelated match)
	$basename =~ /\.([^.]*)$/ or return undef;
	my $ext = $1 or return undef;
	return $highlight_ext{$ext}
		if exists $highlight_ext{$ext};

	return undef;
}
3722
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# When highlighting applies, $fd is closed and reopened as a pipe that feeds
# 'git cat-file blob $hash' (the global $hash) through $highlight_bin with
# the given $syntax.  Calls die_error(500, ...) if the pipe cannot be opened.
sub run_highlighter {
	my ($fd, $highlight, $syntax) = @_;
	return $fd unless ($highlight && defined $syntax);

	close $fd;
	my $cat_blob    = quote_command(git_cmd(), "cat-file", "blob", $hash);
	my $highlighter = quote_command($highlight_bin);
	open $fd, "$cat_blob | $highlighter --replace-tabs=8 --fragment --syntax $syntax |"
		or die_error(500, "Couldn't open file or run syntax highlighter");
	return $fd;
}
3736
3737## ======================================================================
3738## functions printing HTML: header, footer, error page
3739
# Build the page title from the globals describing the current request:
#   "<site>"                                   no project, no filter
#   "<site> - <project_filter>"                no project, filter set
#   "<site> - <project>[/<action>[ - <file>]]" project set
# For the "tree" action a trailing "/" is added to the file name unless it
# already ends in one.
sub get_page_title {
	my $title = to_utf8($site_name);

	if (!defined $project) {
		$title .= " - " . to_utf8($project_filter)
			if defined $project_filter;
		return $title;
	}
	$title .= " - " . to_utf8($project);

	if (defined $action) {
		$title .= "/$action"; # $action is US-ASCII (7bit ASCII)

		if (defined $file_name) {
			$title .= " - " . esc_path($file_name);
			$title .= "/"
				if $action eq "tree" && $file_name !~ m|/$|;
		}
	}

	return $title;
}
3762
# Choose the content type for HTML pages.
# require explicit support from the UA if we are to send the page as
# 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
# we have to do this because MSIE sometimes globs '*/*', pretending to
# support xhtml+xml but choking when it gets what it asked for.
sub get_content_type_html {
	my $accept = $cgi->http('HTTP_ACCEPT');

	return 'text/html'
		unless defined $accept;
	# the type has to be named literally in the Accept header ...
	return 'text/html'
		unless $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/;
	# ... and must not be rated 0
	return 'text/html'
		unless $cgi->Accept('application/xhtml+xml') != 0;

	return 'application/xhtml+xml';
}
3776
# Print the <link rel="alternate"> elements for the page head.
# With a project: for each of RSS and Atom, one link to the feed and one to
# its '--no-merges' variant, built from get_feed_info().
# Without a project: links to the plain-text project index and the OPML
# list of project feeds.
sub print_feed_meta {
	if (defined $project) {
		my %href_params = get_feed_info();
		if (!exists $href_params{'-title'}) {
			$href_params{'-title'} = 'log';
		}

		foreach my $format (qw(RSS Atom)) {
			my $type = lc($format);
			my %link_attr = (
				'-rel' => 'alternate',
				'-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
				'-type' => "application/$type+xml"
			);

			# work on a per-format copy, so that the '--no-merges'
			# option set below for the second link does not leak into
			# the plain feed link of the next format
			my %feed_params = (%href_params, 'action' => $type);

			$link_attr{'-href'} = href(%feed_params);
			print "<link ".
			      "rel=\"$link_attr{'-rel'}\" ".
			      "title=\"$link_attr{'-title'}\" ".
			      "href=\"$link_attr{'-href'}\" ".
			      "type=\"$link_attr{'-type'}\" ".
			      "/>\n";

			$feed_params{'extra_options'} = '--no-merges';
			$link_attr{'-href'} = href(%feed_params);
			$link_attr{'-title'} .= ' (no merges)';
			print "<link ".
			      "rel=\"$link_attr{'-rel'}\" ".
			      "title=\"$link_attr{'-title'}\" ".
			      "href=\"$link_attr{'-href'}\" ".
			      "type=\"$link_attr{'-type'}\" ".
			      "/>\n";
		}

	} else {
		printf('<link rel="alternate" title="%s projects list" '.
		       'href="%s" type="text/plain; charset=utf-8" />'."\n",
		       esc_attr($site_name), href(project=>undef, action=>"project_index"));
		printf('<link rel="alternate" title="%s projects feeds" '.
		       'href="%s" type="text/x-opml" />'."\n",
		       esc_attr($site_name), href(project=>undef, action=>"opml"));
	}
}
3821
# Print the <link> elements of the page head: stylesheets, feed links (only
# when $status is '200 OK') and the favicon (when $favicon is defined).
sub print_header_links {
	my $status = shift;

	# print out each stylesheet that exist, providing backwards capability
	# for those people who defined $stylesheet in a config file:
	# a defined $stylesheet replaces the @stylesheets list, whose false
	# entries are skipped
	my @sheets = defined $stylesheet
		? ($stylesheet)
		: grep { $_ } @stylesheets;
	foreach my $sheet (@sheets) {
		print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
	}

	if ($status eq '200 OK') {
		print_feed_meta();
	}

	if (defined $favicon) {
		print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
	}
}
3841
# Print breadcrumb links for the directories of a project filter.
# Parameters: the path components, in order (the caller passes
# split '/', $project_filter).
# Every component is printed as a link to the project list filtered by the
# path accumulated so far, followed by " / ".
sub print_nav_breadcrumbs_path {
        my @parts = @_;

        my @prefix;
        foreach my $part (@parts) {
                # Skip only missing or empty components.  A plain truth test
                # here would end the trail at a directory literally named "0".
                next unless defined $part && length $part;

                push @prefix, $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => join('/', @prefix),
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
3853
# Print the breadcrumb trail of the page header:
#   home / project / action / extra
# Options (passed as a hash):
#   -action_extra - additional trail element, printed as-is after the action;
#                   when it is given the action itself becomes a link.
# Without a project, the components of $project_filter (if defined) are
# printed instead via print_nav_breadcrumbs_path().
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";

        if (!defined $project) {
                print_nav_breadcrumbs_path(split '/', $project_filter)
                        if defined $project_filter;
                return;
        }

        my $summary_link = $cgi->a({-href => href(action=>"summary")}, esc_html($project));
        my @crumbs = ($summary_link);
        if (defined $action) {
                my $action_print = $action;
                if (defined $extra) {
                        $action_print = $cgi->a({-href => href(action=>$action)},
                                $action);
                }
                push @crumbs, $action_print;
        }
        push @crumbs, $extra
                if defined $extra;
        print join(" / ", @crumbs) . "\n";
}
3876
# Print the search form of a project page.
# Takes no arguments.  Reads the globals $hash_base, $hash, $my_uri, $project
# and $search_use_regexp; an undefined global $searchtext is replaced by the
# empty string.
sub print_search_form {
        $searchtext = "" unless defined $searchtext;

        # search from hash_base if there is one, else from hash, else from HEAD
        my $search_hash = defined $hash_base ? $hash_base
                        : defined $hash      ? $hash
                        :                      "HEAD";

        # With path_info URLs the project is part of the form target;
        # otherwise it is submitted as the hidden "p" field.
        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if ($use_pathinfo) {
                $action .= "/".esc_url($project);
        }

        # start_form() is the supported CGI.pm spelling (and matches the
        # end_form() call below); the old startform() alias is deprecated and
        # absent from current CGI.pm releases.
        print $cgi->start_form(-method => "get", -action => $action) .
              "<div class=\"search\">\n" .
              ($use_pathinfo
               ? ''
               : $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
              " search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
3912
# Print the HTTP header (unless suppressed) and the opening part of the HTML
# page: XML prolog, <head> contents, optional site header file, the page
# header with logo and breadcrumbs and, for project pages with the 'search'
# feature enabled, the search form.
# Parameters:
#   $status  - HTTP status line; a false value means "200 OK"
#   $expires - passed to the CGI header as -expires
#   %opts    - '-no_http_header' suppresses the HTTP header; the whole hash
#              is also handed to print_nav_breadcrumbs()
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}"
                if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # relative stylesheet, favicon etc. URLs only resolve correctly under
        # path_info when an explicit base URL is given
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my %logo_attr = (-src => esc_url($logo),
                                 -width => 72, -height => 27,
                                 -alt => "git",
                                 -class => "logo");
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $cgi->img(\%logo_attr));
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $have_search);
}
3971
# Print the closing part of every page: the footer with the feed links, the
# optional page generation statistics ('timed' feature), the optional site
# footer file, the JavaScript includes and the closing </body></html> tags.
# Takes no arguments.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                # no project selected: link the project list as OPML and as text
                my $opml_url = href(project=>undef, action=>"opml",
                                    project_filter => $project_filter);
                print $cgi->a({-href => $opml_url,
                              -class => $feed_class}, "OPML") . " ";
                my $index_url = href(project=>undef, action=>"project_index",
                                     project_filter => $project_filter);
                print $cgi->a({-href => $index_url,
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # get_feed_info() returned nothing: mark the links as generic
                $feed_class .= ' generic'
                        unless %href_params;
                $href_params{'-title'} ||= 'log';

                foreach my $format ('RSS', 'Atom') {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                my $elapsed = tv_interval($t0, [ gettimeofday() ]);
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      $elapsed.
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        my $is_incremental_blame = (defined $action && $action eq 'blame_incremental');
        if ($is_incremental_blame) {
                my $blame_data_url = href(action=>"blame_data", -replay=>1);
                my $page_url = href();
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. $blame_data_url .qq!",\n!.
                      qq!           "!. $page_url .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # assemble the body of the window.onload handler piece by piece
                my $onload = qq!<script type="text/javascript">\n!.
                             qq!window.onload = function () {\n!;
                if (gitweb_check_feature('javascript-actions')) {
                        $onload .= qq!       fixLinks();\n!;
                }
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        # cookie lifetime ("expires") is given in days
                        $onload .= qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!.
                                   qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                $onload .= qq!};\n!.
                           qq!</script>\n!;
                print $onload;
        }

        print "</body>\n" .
              "</html>";
}
4050
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# Prints a complete error page (header, message, footer).  The error message
# is HTML-escaped, the detailed description is printed as-is.  Any status
# code other than the ones listed above is reported as 500.
# Remaining arguments are options: they are passed on to git_header_html(),
# and unless '-error_handler' is set, control is transferred to the
# DONE_GITWEB label once the page has been printed.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # An unknown code would hand undef to git_header_html(), which treats
        # a false status as "200 OK" and would serve the error page as a
        # success.  Treat such a call as an internal error instead.
        $status = 500
                unless exists $http_responses{$status};
        git_header_html($http_responses{$status}, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4094
4095## ----------------------------------------------------------------------
4096## functions printing or outputting HTML: navigation
4097
# Print the page navigation bar (<div class="page_nav">).
# Parameters:
#   $current  - name of the current view; printed as plain text, not a link
#   $suppress - name of a standard view to leave out (false: keep all)
#   $head     - if defined, hash used for the commit and commitdiff links
#               and, for some current views, the shortlog and log links
#   $treehead - if defined, hash for the tree link
#   $treebase - if defined, hash_base for the tree link
#   $extra    - HTML printed on a second line (pager or formats); optional
# Custom entries configured through the 'actions' feature (triplets of
# label, link, position) are inserted after the view named by position.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters of every standard view
        my %arg;
        $arg{$_} = {action=>$_} foreach @navs;
        if (defined $head) {
                my @head_views = qw(commit commitdiff);
                push @head_views, qw(shortlog log)
                        if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x);
                $arg{$_}{'hash'} = $head foreach @head_views;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # insert the custom label right after every view named $pos
                my @with_label;
                foreach my $nav (@navs) {
                        push @with_label, $nav;
                        push @with_label, $label if $nav eq $pos;
                }
                @navs = @with_label;
                # expand the %-placeholders of the link template
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @items;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @items, $nav;
                        next;
                }
                my $target = $arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}});
                push @items, $cgi->a({-href => $target}, "$nav");
        }

        print "<div class=\"page_nav\">\n" .
                join(" | ", @items);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4147
# Returns a submenu for the navigation of the refs views (tags, heads,
# remotes), joined with " | ".  The current view is plain text, the other
# views are links; the remotes view is only included when the
# 'remote_heads' feature is enabled.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @items;
        foreach my $view (@ref_views) {
                if ($view eq $current) {
                        push @items, $view;
                } else {
                        push @items, $cgi->a({-href => href(action=>$view)}, $view);
                }
        }
        return join(" | ", @items);
}
4160
# Returns the "first / prev / next" paging navigation as an HTML string.
# Parameters:
#   $action        - not used by this function
#   $page          - number of the current page; "first" and "prev" are
#                    links only when it is greater than 0
#   $has_next_link - true if "next" should be a link
# The links replay the current request with a different 'page' parameter.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        # start with the inactive (plain text) form of every entry
        my ($first, $prev, $next) = ("first", "prev", "next");

        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
4186
4187## ......................................................................
4188## functions printing or outputting HTML: div
4189
# Print a <div class="header"> holding a single link.
# Parameters:
#   $action    - action the link points to; also the link text when $title
#                is false
#   $title     - link text, printed as-is
#   $hash      - added to the link as 'hash' when true
#   $hash_base - added to the link as 'hash_base' when true
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (
                'action' => $action,
                ($hash      ? ('hash'      => $hash)      : ()),
                ($hash_base ? ('hash_base' => $hash_base) : ()),
        );
        my $label = $title ? $title : $action;

        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
4203
# Returns a table row (class "metadata_url") with two cells: $name and $url.
# Both values are inserted as-is, without any escaping.
sub format_repo_url {
        my ($name, $url) = @_;
        return join('',
                '<tr class="metadata_url">',
                "<td>$name</td>",
                "<td>$url</td>",
                "</tr>\n");
}
4208
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed either as *handle,
# \*handle or *handle{IO}, or a function reference. In the latter case all
# following parameters will be taken as argument to the content function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div($header_args ? @$header_args : ());

        my $type = ref($content);
        # A typeglob passed by value (*handle) is not a reference, so ref()
        # is empty for it; it is recognized by taking a reference to the
        # scalar that holds it.  *handle{IO} yields an object blessed into
        # IO::File on perl 5.12 and later, IO::Handle on older perls.
        my $is_handle = $type eq 'GLOB'
                     || $type eq 'IO::Handle'
                     || $type eq 'IO::File'
                     || ref(\$content) eq 'GLOB';

        if ($type eq 'CODE') {
                $content->(@_);
        } elsif ($type eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!$type && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4246
# Returns an HTML fragment for a timestamp: the 'rfc2822' string followed by
# the local time in parentheses.
# Parameter: $date - hash reference; the keys 'rfc2822', 'hour_local',
#                    'minute_local' and 'tz_local' are read.
# When the 'javascript-timezone' feature supplies a CSS class (its third
# value), the rfc2822 string is wrapped in a <span> of that class.  Local
# times before 6 o'clock are wrapped in <span class="atnight">.
sub format_timestamp_html {
        my ($date) = @_;
        my ($hour, $minute, $tz) = @{$date}{qw(hour_local minute_local tz_local)};

        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');
        my $strtime = $datetime_class
                ? qq!<span class="$datetime_class">$date->{'rfc2822'}</span>!
                : $date->{'rfc2822'};

        my $localtime_format = ($hour < 6)
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';

        return $strtime . ' ' . sprintf($localtime_format, $hour, $minute, $tz);
}
4267
# Outputs the author name and date in long form.
# Parameters:
#   $co   - hash reference of a commit; 'author_name', 'author_epoch',
#           'author_tz' and 'author_email' are read
#   %opts - '-tag' names the enclosing HTML element (default: 'div')
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
        my $author_html = format_search_author($author, "author", esc_html($author));
        my $date_html = format_timestamp_html(\%ad);
        my $avatar_html = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_html .
              " [" . $date_html . "]" .
              $avatar_html .
              "</$tag>\n";
}
4282
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for ('author', 'committer'). If the list is empty
# it defaults to both. Two rows are printed per person: name, email and
# avatar in the first, the timestamp in the second.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer')
                unless @people;

        foreach my $who (@people) {
                my $name = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_html = format_search_author($name, $who,
                                                     esc_html($name));
                my $email_html = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar_html = git_get_avatar($email, -size => 'double');
                my $date_html = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>" .
                      $name_html . " " .
                      $email_html .
                      "</td><td rowspan=\"2\">" .
                      $avatar_html .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $date_html .
                      "</td>" .
                      "</tr>\n";
        }
}
4310
# Print the path of the displayed object as a row of links
# (<div class="page_path">): "[project]" linking to the tree root, one 'tree'
# link per leading directory, and finally the last path component.
# Parameters:
#   $name - path of the object within the tree; nothing but the root link
#           is printed when it is undefined
#   $type - 'blob' makes the last component a 'blob_plain' link, 'tree'
#           makes it a 'tree' link; anything else prints it as plain text
#   $hb   - hash base used for all links
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth value: a leading
                        # directory named "0" must still get its separator
                        $fullname .= (length $fullname ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # The links below point at the path that was passed in, not
                # at the global $file_name of the current request.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4348
# Print the lines of a commit message as HTML, each followed by "<br/>".
# Parameters:
#   $log  - array reference with the lines of the message; the referenced
#           array is modified (the title, if requested, and leading empty
#           lines are shifted off)
#   %opts - '-remove_title'     drop the first line of the message
#           '-remove_signoff'   do not print sign-off style lines
#                               (Signed-off-by, Acked-by, Cc)
#           '-final_empty_line' end the output with a single empty line
# Runs of empty lines are collapsed into one, and empty lines directly
# following a printed sign-off line are dropped.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # last printed line was a sign-off line
        my $empty = 0;   # last printed line was an empty line
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        # A removed sign-off line leaves no trace: the flags
                        # keep describing the line that was printed last.
                        next if $opts{'-remove_signoff'};

                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                        $signoff = 1;
                        $empty = 0;
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        # only a printed, non-empty line ends the "after
                        # signoff" state; resetting it earlier would make
                        # the check above a no-op
                        $empty = 0;
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4397
# Return link target (what link points to): the complete output of
# "git cat-file blob <hash>".
# Parameter: $hash - object id of the blob that holds the link.
# Returns nothing (undef in scalar context) when the command cannot be
# started or closing its pipe reports a failure.
sub git_get_link_target {
        my ($hash) = @_;

        open(my $fd, "-|", git_cmd(), "cat-file", "blob", $hash)
                or return;
        # slurp the whole output in one read
        my $link_target = do { local $/; <$fd> };
        close($fd)
                or return;

        return $link_target;
}
4415
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
# Parameters:
#   $link_target - contents of the symbolic link
#   $basedir     - directory containing the link, relative to the top tree;
#                  undefined or empty for the top tree itself
# Empty path components and '.' are dropped, '..' removes the preceding
# component; a '..' that would climb above the top tree makes the link
# impossible to normalize.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # test the length of basedir so that a directory named "0" counts
        my $path = (defined $basedir && length $basedir)
                ? $basedir . '/' . $link_target
                : $link_target;

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' (but keep components named "0")
                next if ($part eq '' || $part eq '.');
                if ($part ne '..') {
                        push @path_parts, $part;
                        next;
                }
                # handle '..': link leads outside repository (outside top dir)
                # when there is nothing left to go up from
                return unless @path_parts;
                pop @path_parts;
        }

        return join('/', @path_parts);
}
4455
# print tree entry (row of git_tree), but without encompassing <tr> element
# Parameters:
#   $t          - hash reference describing the entry; 'mode', 'type',
#                 'name' and 'hash' are read, 'size' only if present
#   $basedir    - prefix put in front of the entry name to build file_name
#   $hash_base  - hash base for the links; history links are only printed
#                 when it is defined
#   $have_blame - true if a 'blame' link should be printed for blobs
# The format of a table row is: mode [size] list link.  Where mode is
# the mode of the entry, list is the name of the entry, an href,
# and link is the action links of the entry.
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        # hash_base is only handed to href() when the caller supplied one
        my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();

        my $type = $t->{'type'};
        my $path = "$basedir$t->{'name'}";

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        my $list_cell; # contents of the "list" cell (entry name)
        my @links;     # action links of the "link" cell
        if ($type eq "blob") {
                $list_cell = $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                                    file_name=>$path, %base_key),
                                      -class => "list"}, esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        # symbolic link: show where it points to, as a link
                        # if the target can be expressed relative to the top tree
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                if (defined $norm_target) {
                                        $list_cell .= " -> " .
                                              $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                     file_name=>$norm_target),
                                                       -title => $norm_target}, esc_path($link_target));
                                } else {
                                        $list_cell .= " -> " . esc_path($link_target);
                                }
                        }
                }

                push @links, $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                                    file_name=>$path, %base_key)},
                                     "blob");
                if ($have_blame) {
                        push @links, $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                            file_name=>$path, %base_key)},
                                             "blame");
                }
                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                            hash=>$t->{'hash'}, file_name=>$path)},
                                             "history");
                }
                push @links, $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                                    file_name=>$path)},
                                     "raw");

        } elsif ($type eq "tree") {
                $list_cell = $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                                    file_name=>$path,
                                                    %base_key)},
                                     esc_path($t->{'name'}));

                push @links, $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                                    file_name=>$path,
                                                    %base_key)},
                                     "tree");
                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                            file_name=>$path)},
                                             "history");
                }

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                $list_cell = esc_path($t->{'name'});

                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history",
                                                            hash_base=>$hash_base,
                                                            file_name=>$path)},
                                             "history");
                }
        }

        print "<td class=\"list\">" . $list_cell . "</td>\n";
        print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";
}
4548
4549## ......................................................................
4550## functions printing large fragments of HTML
4551
# get pre-image filenames for merge (combined) diff
# Parameters:
#   $diff    - hash reference of a parsed combined diff line; 'nparents',
#              'status' and 'from_id' are read, 'from_file' is (re)created
#   @parents - the parents of the merge, in the same order as the
#              per-parent entries of $diff
# For every parent whose status is 'R' or 'C' the file name is looked up
# with git_get_path_by_hash(); all other entries stay undefined.
# Returns $diff.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $last = $diff->{'nparents'} - 1;
        my $from_file = $diff->{'from_file'} = [ ];
        # size the list to one (undefined) entry per parent
        $from_file->[$last] = undef;

        foreach my $i (0 .. $last) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');
                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4568
# Tell whether a raw difftree line describes a file deletion.
#   $diffinfo - hashref of parsed raw diff format; only 'to_id' is read
# A deletion is marked by an all-zero post-image object id.  Both the
# 40-digit (SHA-1) and the 64-digit (SHA-256) null id are recognized.
# Returns true for a deletion, false otherwise.
sub is_deleted {
        my $diffinfo = shift;
        my $to_id = $diffinfo->{'to_id'};

        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4575
# Check whether a patch belongs to the [previous] raw difftree line,
# i.e. whether it continues a patch that was split into several parts.
#   $diffinfo  - hashref of parsed raw diff format
#   $patchinfo - hashref of parsed patch diff format
#                (the same keys as in $diffinfo)
# Returns true only when both are defined and name the same 'to_file'.
sub is_patch_split {
        my ($raw, $patch) = @_;

        my $both_known = defined $raw && defined $patch;
        return $both_known unless $both_known;

        return $raw->{'to_file'} eq $patch->{'to_file'};
}
4586
4587
# Print the list of changed files ("difftree") as an HTML table, one row
# per entry, with links to the related blob / diff / blame / history views.
#   $difftree - arrayref of difftree entries; each one is run through
#               parsed_difftree_line() before use
#   $hash     - commit the diff leads to; used as hash_base for links to
#               the post-image side
#   @parents  - parent commit(s); more than one selects the "combined"
#               table class and (in 'commitdiff' view) the per-parent header
# Reads the file-level $cgi and $action; prints directly, returns nothing
# meaningful.
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1;
        # running number of the "patchN" anchor; only advanced in 'commitdiff' view
        my $patchno = 0;
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                # alternate row shading
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent; remember whether any parent had
                        # the file at all, and whether any did not delete it
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # an all-zero mode means that side does not exist; its
                # mode / file type variables then stay undefined
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file only exists in the parent, so every link
                        # in this row is based on $parent
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # post-image blob: 'to_id' / 'to_file' belong to $hash,
                        # not to $parent (the new name need not exist there)
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4895
# Print one diff chunk in side-by-side layout.
#   @_ - list of [ $class, $line ] pairs, where $line is ready-to-print
#        HTML and $class is one of 'chunk_header', 'ctx', 'rem', 'add'
#        or 'incomplete'
# Consecutive context lines are printed in both the "old" and the "new"
# column; consecutive removed/added lines are printed as one block that is
# a pure removal, a pure addition, or a change with both columns.
# Prints to the currently selected filehandle.
sub print_sidebyside_diff_chunk {
        my @entries = @_;

        return unless @entries;

        # an incomplete last line might be among removed or added lines,
        # or both, or among context lines: it takes over the class of the
        # entry just before it
        foreach my $idx (1 .. $#entries) {
                next unless $entries[$idx][0] eq 'incomplete';
                $entries[$idx][0] = $entries[$idx-1][0];
        }

        # lines collected so far, by class, waiting to be printed
        my %pending = ('ctx' => [], 'rem' => [], 'add' => []);

        # HTML for one column of a block
        my $column = sub {
                my ($side, $rows) = @_;
                return "<div class=\"$side\">" . join('', @$rows) . '</div>';
        };

        # print accumulated context lines (same text in both columns)
        my $flush_context = sub {
                my $ctx = $pending{'ctx'};
                return unless @$ctx;

                print '<div class="chunk_block ctx">' .
                      $column->('old', $ctx) .
                      $column->('new', $ctx) .
                      '</div>';
                $pending{'ctx'} = [];
        };

        # print accumulated removed / added lines as a single block
        my $flush_changes = sub {
                my ($rem, $add) = @pending{'rem', 'add'};
                return unless @$rem || @$add;

                # pure removal, pure addition, or (assumed) change
                my $kind = !@$add ? 'rem'
                         : !@$rem ? 'add'
                         :          'chg';
                my $html = "<div class=\"chunk_block $kind\">";
                $html .= $column->('old', $rem) if @$rem;
                $html .= $column->('new', $add) if @$add;
                print $html . '</div>';
                @pending{'rem', 'add'} = ([], []);
        };

        # the trailing empty pair is a guardian: it forces a final flush
        foreach my $entry (@entries, ["", ""]) {
                my ($class, $line) = @$entry;

                # chunk headers are printed as they come
                if ($class && $class eq 'chunk_header') {
                        print $line;
                        next;
                }

                # a change in the kind of line (or the end of the chunk)
                # empties the accumulator of the other kind
                $flush_context->()
                        if !$class || $class eq 'rem' || $class eq 'add';
                $flush_changes->()
                        if !$class || $class eq 'ctx';

                # guardian value
                last unless $line;

                push @{$pending{$class}}, $line
                        if exists $pending{$class};
        }
}
4984
# Print a patchset (the output of "git diff" style commands) as HTML.
#   $fd           - filehandle the patch text is read from, line by line
#   $diff_style   - 'sidebyside' selects side-by-side output (used only for
#                   non-combined diffs); anything else prints lines inline
#   $difftree     - arrayref of raw difftree entries the patches belong to;
#                   each one is run through parsed_difftree_line()
#   $hash         - accepted for the caller's convenience, not used here
#   @hash_parents - parent commit(s); more than one means combined diff
# Every raw difftree entry gets a <div class="patch" id="patchN"> so that
# "patch" links from the difftree part have an anchor to point at.
# Prints directly; returns nothing meaningful.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;
        my $patch_number = 0;
        my $patch_line;
        my $diffinfo;
        my $to_name;
        my (%from, %to);
        my @chunk; # for side-by-side diff

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # input ended inside the extended header; 'last' skips
                        # the 'continue' block, so close the patch div here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                if (!defined $patch_line) {
                        # input ended right after the '---' line: there is no
                        # '+++' line to chomp or format, so just close the patch
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
                        my $diff_classes = "diff";
                        $diff_classes .= " $class" if ($class);
                        $line = "<div class=\"$diff_classes\">$line</div>\n";

                        if ($diff_style eq 'sidebyside' && !$is_combined) {
                                # collect lines per chunk; a new chunk header
                                # flushes the chunk collected so far
                                if ($class && $class eq 'chunk_header') {
                                        print_sidebyside_diff_chunk(@chunk);
                                        @chunk = ( [ $class, $line ] );
                                } else {
                                        push @chunk, [ $class, $line ];
                                }
                        } else {
                                # default 'inline' style and unknown styles
                                print $line;
                        }
                }

        } continue {
                # runs on 'next PATCH' and when the loop body falls through
                # at end of input: flush the last side-by-side chunk
                if (@chunk) {
                        print_sidebyside_diff_chunk(@chunk);
                        @chunk = ();
                }
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if ($is_combined) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
5155
5156# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5157
5158# fills project list info (age, description, owner, category, forks)
5159# for each project in the list, removing invalid projects from
5160# returned list
5161# NOTE: modifies $projlist, but does not remove entries from it
sub fill_project_list_info {
        my $projlist = shift;
        my @filled;

        # ctags are fetched only when the 'ctags' feature is turned on
        my $with_ctags = gitweb_check_feature('ctags');

 PROJECT:
        foreach my $proj (@$projlist) {
                my $path = $proj->{'path'};

                # an empty list from git_get_last_activity() means the
                # project is left out of the returned list
                my @activity = git_get_last_activity($path);
                next PROJECT unless @activity;
                @{$proj}{'age', 'age_string'} = @activity;

                # description and owner already present in the entry are
                # kept as they are; only missing ones are looked up
                unless (defined $proj->{'descr'}) {
                        my $long_descr = to_utf8(git_get_project_description($path) || "");
                        $proj->{'descr_long'} = $long_descr;
                        $proj->{'descr'} = chop_str($long_descr, $projects_list_description_width, 5);
                }
                unless (defined $proj->{'owner'}) {
                        $proj->{'owner'} = git_get_project_owner("$path") || "";
                }

                $proj->{'ctags'} = git_get_project_ctags($path)
                        if ($with_ctags);

                # category is needed only when grouping by category is enabled
                if ($projects_list_group_categories && !defined $proj->{'category'}) {
                        my $category = git_get_project_category($path) ||
                                       $project_list_default_category;
                        $proj->{'category'} = to_utf8($category);
                }

                push @filled, $proj;
        }

        return @filled;
}
5197
# returns the projects of @$projlist sorted according to $order, which is
# one of 'project', 'descr', 'owner' or 'age'; for any other order the
# list is returned in its original sequence
sub sort_projects_list {
        my ($projlist, $order) = @_;

        # for each order: the hash key to compare, and whether it is
        # compared as a string ('str') or as a number ('num')
        my %sort_spec = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );

        my $spec = $sort_spec{$order};
        return @$projlist unless defined $spec;

        my $field = $spec->{'key'};
        my @sorted = ($spec->{'type'} eq 'str')
                ? sort { $a->{$field} cmp $b->{$field} } @$projlist
                : sort { $a->{$field} <=> $b->{$field} } @$projlist;

        return @sorted;
}
5218
5219# returns a hash of categories, containing the list of project
5220# belonging to each category
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        # default to the whole list; $to never runs past the last index
        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        # category name => reference to array of projects, in list order
        my %by_category;
        foreach my $idx ($from .. $to) {
                my $proj = $projlist->[$idx];
                push @{ $by_category{ $proj->{'category'} } }, $proj;
        }

        # the hash itself in list context, a reference to it otherwise
        return %by_category if wantarray;
        return \%by_category;
}
5235
5236# print 'sort by' <th> element, generating 'sort by $name' replay link
5237# if that order is not selected
sub print_sort_th {
        # arguments are handed to format_sort_th() unchanged
        my $th = format_sort_th(@_);
        print $th;
}
5241
# returns the 'sort by' <th> element for column $name; $order is the
# order currently in effect, $header the text shown (defaults to $name
# with its first letter uppercased)
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # the column the list is already sorted by gets a plain header
        return "<th>$header</th>\n" if ($order eq $name);

        # any other column gets a link replaying the request with order=$name
        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
5258
# prints one <tr> per project for entries $from..$to of @$projlist;
# with $check_forks set, every row starts with an extra fork marker cell
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        # default to the whole list, and never run past its end
        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                my $path = $pr->{'path'};
                my $forks = $pr->{'forks'};

                # URL of the given action for this project
                my $url_for = sub { href(project=>$path, action=>$_[0]) };

                # rows alternate between the "dark" and "light" classes
                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                if ($check_forks) {
                        # "+" marker for projects carrying a 'forks' entry;
                        # it is a link only if there is at least one fork
                        print "<td>";
                        if ($forks) {
                                my $nforks = scalar @$forks;
                                if ($nforks > 0) {
                                        print $cgi->a({-href => $url_for->("forks"),
                                                       -title => "$nforks forks"}, "+");
                                } else {
                                        print $cgi->span({-title => "$nforks forks"}, "+");
                                }
                        }
                        print "</td>\n";
                }

                # name, description and owner cells
                print "<td>" .
                      $cgi->a({-href => $url_for->("summary"), -class => "list"},
                              esc_html($path)) .
                      "</td>\n" .
                      "<td>" .
                      $cgi->a({-href => $url_for->("summary"), -class => "list",
                               -title => $pr->{'descr_long'}},
                              esc_html($pr->{'descr'})) .
                      "</td>\n" .
                      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";

                # age cell, then the action links; "forks" is appended only
                # for projects carrying a 'forks' entry
                my $age_css = age_class($pr->{'age'});
                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                my @links;
                foreach my $action (qw(summary shortlog log tree), ($forks ? "forks" : ())) {
                        push @links, $cgi->a({-href => $url_for->($action)}, $action);
                }
                print "<td class=\"" . $age_css . "\">" . $age_text . "</td>\n" .
                      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
                      "</tr>\n";
        }
}
5307
# prints the projects list table for @$projlist
#   $order      sort order; falls back to $default_projects_order
#   $from, $to  window of (filtered and sorted) projects to show; defaults
#               to the whole list, $to is clamped to the last project
#   $extra      optional HTML printed in a final row of the table
#   $no_header  if true, the row of column headers is not printed
# Prints a "No such projects found" notice instead when the window is empty.
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $cgi->param('by_tag') : undef;
        # fork filtering is switched off while searching or filtering by tag
        $check_forks = undef
                if ($tagfilter || $searchtext);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        @projects = fill_project_list_info(\@projects);
        # searching projects require filling to be run before it
        @projects = search_projects_list(\@projects,
                                         'searchtext' => $searchtext,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $searchtext);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds exactly that window, so it is grouped as
                # a whole; applying $from/$to again to the already sliced list
                # would drop its first $from entries
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5394
# prints the 'log' view entries for the commits at indices $from..$to of
# @$commitlist ($from defaults to 0, $to is clamped to the last commit),
# followed by $extra wrapped in a "page_nav" div if $extra is true
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from rather than at 0, so that the requested window
        # is honoured the same way as in the other *_body subroutines
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                # empty entries are skipped
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5433
# prints the "shortlog" table with one row per commit for entries
# $from..$to of @$commitlist, plus a final row holding $extra if defined
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        # default to the whole list; $to never runs past the last commit
        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        print "<table class=\"shortlog\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between the "dark" and "light" classes
                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                # per-commit links; snapshot links are appended only when
                # format_snapshot_links() returns a defined value
                my @links = (
                        $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
                        $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree"),
                );
                my $snapshot_links = format_snapshot_links($commit);
                push @links, $snapshot_links
                        if (defined $snapshot_links);

                print "</td>\n" .
                      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
                      "</tr>\n";
        }

        print "<tr>\n" .
              "<td colspan=\"4\">$extra</td>\n" .
              "</tr>\n"
                if (defined $extra);
        print "</table>\n";
}
5477
# prints the "history" table of $file_name with one row per commit for
# entries $from..$to of @$commitlist, plus a final row holding $extra if
# defined; $ftype is used both as the action and as the text of the first
# link in each row
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        # default to the whole list; $to never runs past the last commit
        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        print "<table class=\"history\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                # empty entries produce no row and do not flip the row class
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # shortlog uses format_author_html('td', \%co, 10) here
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my @links = (
                        $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype),
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
                );

                # for blobs, offer a diff against the current version when
                # the file content at this commit differs from it
                if ($ftype eq 'blob') {
                        my $blob_parent = git_get_hash_by_path($commit, $file_name);
                        if (defined $file_hash && defined $blob_parent &&
                            $file_hash ne $blob_parent) {
                                push @links,
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$file_hash, hash_parent=>$blob_parent,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }

                print "</td>\n" .
                      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
                      "</tr>\n";
        }

        print "<tr>\n" .
              "<td colspan=\"4\">$extra</td>\n" .
              "</tr>\n"
                if (defined $extra);
        print "</table>\n";
}
5537
# prints the "tags" table with one row per tag for entries $from..$to of
# @$taglist, plus a final row holding $extra if defined
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;

        # default to the whole list; $to never runs past the last tag
        $from = 0 unless defined $from;
        $to = $#{$taglist} if (!defined $to || $#{$taglist} < $to);

        print "<table class=\"tags\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %tag = %{$taglist->[$idx]};
                my $reftype = $tag{'reftype'};

                # the subject, when there is one, is shown shortened
                my $comment = $tag{'subject'};
                my $comment_short;
                $comment_short = chop_str($comment, 30, 5)
                        if (defined $comment);

                # rows alternate between the "dark" and "light" classes
                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # age cell (left empty when no age is known)
                my $age_cell = defined $tag{'age'}
                        ? "<td><i>$tag{'age'}</i></td>\n"
                        : "<td></td>\n";
                print $age_cell;

                # name cell, then the opening of the subject cell
                print "<td>" .
                      $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'}),
                               -class => "list name"}, esc_html($tag{'name'})) .
                      "</td>\n" .
                      "<td>";
                print format_subject_html($comment, $comment_short,
                                          href(action=>"tag", hash=>$tag{'id'}))
                        if (defined $comment);

                # "tag" self link only for entries whose type is "tag"
                print "</td>\n" .
                      "<td class=\"selflink\">";
                if ($tag{'type'} eq "tag") {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                } else {
                        print "&nbsp;";
                }

                # links to the referenced object; more of them for commits and blobs
                my @links = ($cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'})}, $reftype));
                if ($reftype eq "commit") {
                        push @links,
                                $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog"),
                                $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                } elsif ($reftype eq "blob") {
                        push @links,
                                $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "<td class=\"link\">" . " | " . join(" | ", @links);
                print "</td>\n" .
                      "</tr>";
        }

        print "<tr>\n" .
              "<td colspan=\"5\">$extra</td>\n" .
              "</tr>\n"
                if (defined $extra);
        print "</table>\n";
}
5600
# prints the "heads" table with one row per head for entries $from..$to
# of @$headlist ($from defaults to 0, $to is clamped to the last entry),
# plus a final row holding $extra if defined; the head whose 'id' equals
# $head gets the "current_head" class on its name cell
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

        print "<table class=\"heads\">\n";
        my $alternate = 1;
        for (my $i = $from; $i <= $to; $i++) {
                my $entry = $headlist->[$i];
                my %ref = %$entry;
                # $head may be undefined; then no head is marked as current
                # (and no "uninitialized value" warning is raised)
                my $curr = defined $head && $ref{'id'} eq $head;
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td><i>$ref{'age'}</i></td>\n" .
                      ($curr ? "<td class=\"current_head\">" : "<td>") .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                               -class => "list name"},esc_html($ref{'name'})) .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
                      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5638
5639# Display a single remote block
sub git_remote_block {
        # $remote  name of the remote
        # $rdata   hash reference with its 'heads', 'fetch' and 'push' entries
        # $limit   if defined, at most the heads at indices 0..$limit are
        #          listed, and "..." links to the full list when there are more
        # $head    passed on to git_heads_body() to mark the current head
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # a single "URL" row only if both URLs are set and equal;
                # $push has to be checked first, as it may be undefined here
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5672
5673# Display a list of remote names with the respective fetch and push URLs
sub git_remotes_list {
        # $remotedata  hash reference: remote name => hash reference with
        #              'fetch' and 'push' entries
        # $limit       if true and smaller than the number of remotes, only
        #              the first $limit remotes (sorted by name) are listed,
        #              followed by a "..." link to the 'remotes' action
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        $#remotes = $limit - 1 if $limited;

        # iterate over the list instead of shifting until a false value, so
        # that a remote whose name is false in boolean context (such as "0")
        # does not end the listing early
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # "fetch" / "push" are links only when the URL is known
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
5716
5717# Display remote heads grouped by remote, unless there are too many
5718# remotes, in which case we only display the remote names
sub git_remotes_body {
        # $remotedata  hash reference: remote name => data of that remote
        # $limit       if true and smaller than the number of remotes, only
        #              the list of remote names is shown
        # $head        passed on to git_remote_block()
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # go through the remotes sorted by name, like
                # git_remotes_list() does, so that the sections come out in
                # the same order on every request (each() gives no such
                # guarantee)
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
5733
# prints the result page of a 'commit', 'author' or 'committer' search
# (selected by the global $searchtype) for the commit passed as the
# key/value pairs of its %co hash; results are paged by 100 commits
sub git_search_message {
        my %co = @_;

        # option of the commit search matching each search type
        my %grep_option_for = (
                commit    => "--grep=",
                author    => "--author=",
                committer => "--committer=",
        );
        my $greptype = $grep_option_for{$searchtype};
        $greptype .= $searchtext;

        # 101 commits are requested, one more than is shown, so that a
        # 101st result tells whether there is a next page
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

        # "first . prev . next" navigation; entries that lead nowhere are
        # shown as plain text
        my @nav;
        if ($page > 0) {
                push @nav,
                        $cgi->a({-href => href(-replay=>1, page=>undef)},
                                "first"),
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        } else {
                push @nav, "first", "prev";
        }

        my $has_next = ($#commitlist >= 100);
        my $next_link = '';
        $next_link = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                              -accesskey => "n", -title => "Alt-n"}, "next")
                if ($has_next);
        push @nav, ($has_next ? $next_link : "next");

        my $paging_nav = join(" &sdot; ", @nav);

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);
        if ($page == 0 && !@commitlist) {
                print "<p>No match.</p>\n";
        } else {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        }

        git_footer_html();
}
5783
# prints the result page of a pickaxe search (git log -S) for the global
# $searchtext: one table row per commit reported by git-log, listing the
# files reported for it; the commit passed as the key/value pairs of %co
# is used for the page navigation and header
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        my @pickaxe_opts = ("-S$searchtext");
        push @pickaxe_opts, '--pickaxe-regex'
                if ($search_use_regexp);
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', @pickaxe_opts
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $dark = 1;

        # from here on %co holds the commit whose row is currently open
        undef %co;

        # closes the files cell of the commit in %co and ends its row
        # with the "commit | tree" links
        my $finish_commit = sub {
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # a new commit starts: finish the previous one, if any
                        $finish_commit->() if (%co);

                        print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                        $dark = !$dark;

                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                      -class => "list subject"},
                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
                } elsif (defined $set{'to_id'}) {
                        # entries whose 'to_id' is all zeros are not listed
                        next if ($set{'to_id'} =~ m/^0{40}$/);

                        print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                     hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                      -class => "list"},
                                      "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                              "<br/>\n";
                }
        }
        close $fd;

        # finish last commit
        $finish_commit->() if (%co);

        print "</table>\n";

        git_footer_html();
}
5866
# Run "git grep" over the tree of a commit and print the hits as an HTML
# page, one table row per file with one line per matching source line.
#
# Parameters: the parsed commit as a flat hash (%co); the keys 'tree', 'id'
# and 'title' are read.  The pattern comes from the globals $searchtext,
# $search_use_regexp and $search_regexp.
#
# Processing stops once more than 1000 lines of grep output have been seen,
# in which case a "listing trimmed" notice is printed.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $lastfile = '';
        # Link to the blob view of the file currently being listed.  It is
        # computed only when a new file starts, so it must survive from one
        # loop iteration to the next; otherwise every hit after the first one
        # in a file would get a line-number link without the blob URL.
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                last if ($matches++ > 1000);
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        # with -z the fields are separated by NUL characters
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                }
                # When searching a tree, git-grep reports names as
                # "<tree>:<path>", for binary files as well as for text hits.
                $file =~ s/^\Q$co{'tree'}\E://;

                if ($file ne $lastfile) {
                        # close the row of the previous file, if there was one
                        print "</td></tr>\n" if ($lastfile ne '');
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                # copy the captures before calling anything else
                                my ($lead, $match, $trail) = ($1, $2, $3);
                                $ltext = esc_html($lead, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($match, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($trail, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile ne '') {
                print "</td></tr>\n";
                if ($matches > 1000) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
5943
# Print the "commit_search" table: one row per commit, showing its age,
# author, subject link and every line of the commit message that matches
# $search_regexp (with the match highlighted), followed by navigation links.
#
# Parameters:
#   $commitlist - reference to an array of parsed commits (hash references)
#   $from       - index of the first commit to show (defaults to 0)
#   $to         - index of the last commit to show (clamped to the last
#                 index of the list; defaults to it)
#   $extra      - optional string put verbatim into a trailing full-width row
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        my $last_idx = $#{$commitlist};
        $from = 0 if (!defined $from);
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"commit_search\">\n";
        my $alternate = 1;
        foreach my $idx ($from .. $to) {
                my %commit = %{ $commitlist->[$idx] };
                next unless %commit;

                # rows alternate between the two background classes
                my $row_class = $alternate ? 'dark' : 'light';
                $alternate ^= 1;
                print "<tr class=\"$row_class\">\n";

                my $age_cell =
                        "<td title=\"$commit{'age_string_age'}\"><i>$commit{'age_string_date'}</i></td>\n";
                my $author_cell = format_author_html('td', \%commit, 15, 5);
                my $subject_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$commit{'id'}),
                                 -class => "list subject"},
                                chop_and_escape_str($commit{'title'}, 50) . "<br/>");
                print $age_cell . $author_cell . "<td>" . $subject_link;

                # show each matching message line, trimmed around the match
                foreach my $msg_line (@{ $commit{'comment'} }) {
                        next unless ($msg_line =~ m/^(.*?)($search_regexp)(.*)$/i);
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        $match = chop_str($match, 70, 5, 'center');
                        my $contextlen = int((80 - length($match))/2);
                        if ($contextlen > 30) {
                                $contextlen = 30;
                        }
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        print esc_html($lead) .
                              "<span class=\"match\">" . esc_html($match) . "</span>" .
                              esc_html($trail) . "<br />";
                }

                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$commit{'id'})}, "commit");
                my $commitdiff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit{'id'})}, "commitdiff");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$commit{'tree'}, hash_base=>$commit{'id'})}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $commit_link . " | " . $commitdiff_link . " | " . $tree_link .
                      "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
6003
6004## ======================================================================
6005## ======================================================================
6006## actions
6007
# Print the list of projects selected by $project_filter, preceded by the
# optional $home_text include file and a project search form (text field "s").
#
# The 'order' input parameter, when given, must be exactly one of
# none, project, descr, owner or age; anything else is rejected with a
# 400 error.  A 404 error is raised when there are no projects to show.
sub git_project_list {
        my $order = $input_params{'order'};
        # anchored, so that only the exact keywords are accepted
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        # start_form() is the documented name; startform() is a legacy alias
        print $cgi->start_form(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6033
# Print the list of forks of the current project: the projects returned by
# git_get_projects_list() for the project name with a trailing ".git"
# removed.
#
# The 'order' input parameter, when given, must be exactly one of
# none, project, descr, owner or age; anything else is rejected with a
# 400 error.  A 404 error is raised when no forks are found.
sub git_forks {
        my $order = $input_params{'order'};
        # anchored, so that only the exact keywords are accepted
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6053
# Print a plain-text project index: one "<path> <owner>" line per project
# selected by $project_filter.  Both fields are percent-encoded, except that
# '/' is kept as is and a space is written as '+'.
# Raises a 404 error when there are no projects.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        for my $entry (@projects) {
                # look the owner up only when the project list did not supply it
                $entry->{'owner'} = git_get_project_owner("$entry->{'path'}")
                        unless exists $entry->{'owner'};

                my @fields = ($entry->{'path'}, $entry->{'owner'});
                for my $field (@fields) {
                        # quote as in CGI::Util::encode, but keep the slash,
                        # and use '+' for ' '
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$fields[0] $fields[1]\n";
        }
}
6080
# Print the summary page of the current project: a metadata table
# (description, owner, last change, repository URLs, optional content tags),
# the optional README.html, and short lists of the latest commits, tags,
# heads, remotes and forks.  Each short list shows at most 16 entries and
# gets a "..." link to the full view when there are more.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";

        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};

        my $remote_heads = gitweb_check_feature('remote_heads');
        my $owner = git_get_project_owner($project);
        my $refs = git_get_references();

        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata;
        %remotedata = git_get_remotes_list() if $remote_heads;

        my @forklist;
        my $show_forks = gitweb_check_feature('forks');
        if ($show_forks) {
                # find forks of a project
                (my $fork_filter = $project) =~ s/\.git$//;
                @forklist = git_get_projects_list($fork_filter);
                # filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        # "..." link to the full view named by $view, or undef when the
        # list holds no more than the 16 entries (indices 0..15) shown here
        my $more_link_for = sub {
                my ($list, $view) = @_;
                return undef if ($#{$list} <= 15);
                return $cgi->a({-href => href(action=>$view)}, "...");
        };

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                my $last_change = format_timestamp_html(\%cd);
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>" . $last_change . "</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        if (!@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        # only the first URL row carries the "URL" label
        my $url_tag = "URL";
        foreach my $git_url (grep { $_ } @url_list) {
                print format_repo_url($url_tag, $git_url);
                $url_tag = "";
        }

        # Tag cloud
        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        my $cloud_html = git_show_project_tagcloud($cloud, 48);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>" . $cloud_html . "</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme_file = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme_file) {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file($readme_file);
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                my $more = $more_link_for->(\@commitlist, "shortlog");
                git_shortlog_body(\@commitlist, 0, 15, $refs, $more);
        }

        if (@taglist) {
                git_print_header_div('tags');
                my $more = $more_link_for->(\@taglist, "tags");
                git_tags_body(\@taglist, 0, 15, $more);
        }

        if (@headlist) {
                git_print_header_div('heads');
                my $more = $more_link_for->(\@headlist, "heads");
                git_heads_body(\@headlist, $head, 0, 15, $more);
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                my $more = $more_link_for->(\@forklist, "forks");
                git_project_list_body(\@forklist, 'age', 0, 15, $more, 'no_header');
        }

        git_footer_html();
}
6196
# Print the page for the tag object named by $hash: a header table linking
# to the tagged object, the authorship rows (when the tag records an author)
# and the tag message.  Raises a 404 error if the tag cannot be parsed.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # the tagged object is shown with the view named after its type
        my $object_link =
                $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                        $tag{'object'});
        my $type_link =
                $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                        $tag{'type'});
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $object_link . "</td>\n" .
              "<td class=\"link\">" . $type_link . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if (defined($tag{'author'}));
        print "</table>\n\n" .
              "</div>\n";

        # tag message, one line per <br/>
        print "<div class=\"page_body\">";
        my $message = $tag{'comment'};
        foreach my $msg_line (@$message) {
                chomp $msg_line;
                print esc_html($msg_line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";

        git_footer_html();
}
6231
# Shared implementation of the blame views.
#
# Parameter:
#   $format - selects what is produced (defaults to 'porcelain'):
#     'porcelain'   - runs "git blame -p" and prints the complete blame
#                     table as an HTML page
#     'incremental' - prints an HTML page holding only the file contents
#                     (from "git cat-file blob") with empty commit cells and
#                     progress elements; the page states that it requires
#                     JavaScript
#     'data'        - streams the output of "git blame --incremental" as
#                     text/plain, followed by an "END" line, and returns
#
# A 'porcelain' request with a true 'js' CGI parameter is turned into an
# 'incremental' one, and the global $action is updated to match.
#
# Uses the globals $file_name, $hash_base and $hash; $hash_base defaults to
# the project's head and $hash is looked up from the path when not given.
# Errors (feature disabled, missing file name, unknown commit or file,
# object that is not a blob, failure to start git) go through die_error().
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact comparison: the type has to be "blob", not merely
                # contain that word
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # terminator line, optionally followed by timing information
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        # offer a link to the other flavour of the blame view
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit and line-number links are left empty here
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        # read "<key> <value>" lines until the TAB-prefixed
                        # line holding the contents of the blamed line
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        # the first value seen for a key wins
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a group size is present only on the first line of a
                        # group, so the colour changes once per group
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell spanning all lines of the group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent
                        # commit when one is known, else of the commit itself
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6463
# Blame view in the default format of git_blame_common() ('porcelain').
sub git_blame {
        return git_blame_common();
}
6467
# Blame view in the 'incremental' format of git_blame_common().
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6471
# Blame output in the 'data' format of git_blame_common().
sub git_blame_data {
        return git_blame_common('data');
}
6475
# Print the page listing all tags of the current project.  The list body is
# left out when the project has no tags.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        my $ref_views = format_ref_views('tags');
        git_print_page_nav('','', $head,undef,$head,$ref_views);
        git_print_header_div('summary', $project);

        my @tagslist = git_get_tags_list();
        git_tags_body(\@tagslist) if (@tagslist);

        git_footer_html();
}
6488
# Print the page listing all heads of the current project.  The list body is
# left out when the project has no heads.
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        my $ref_views = format_ref_views('heads');
        git_print_page_nav('','', $head,undef,$head,$ref_views);
        git_print_header_div('summary', $project);

        my @headslist = git_get_heads_list();
        git_heads_body(\@headslist, $head) if (@headslist);

        git_footer_html();
}
6501
# Remotes view, used both for a single remote and for the list of all
# remotes: the 'hash' input parameter, when given, names the remote to show.
#
# Errors: 403 when the 'remote_heads' feature is off, 500 when the remote
# information cannot be obtained, 404 when nothing matches.
sub git_remotes {
        unless (gitweb_check_feature('remote_heads')) {
                die_error(403, "Remote heads view is disabled");
        }

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        if (!defined $remotedata) {
                die_error(500, "Unable to get remote information");
        }

        if (!%$remotedata) {
                my $message = defined $remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $message);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        my $ref_views = format_ref_views($remote ? '' : 'remotes');
        git_print_page_nav('', '',  $head, undef, $head, $ref_views);

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                # list of all the remotes
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        } else {
                # single remote
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }

        git_footer_html();
}
6534
# 'blob_plain' (raw) view: send the contents of one blob as the HTTP
# response body.
#
# The optional first argument is a content type which is handed on to
# blob_contenttype() together with the blob's file handle and $file_name.
# The blob is taken from the global $hash; when that is not defined it is
# looked up by $file_name in $hash_base, or in the project's HEAD when
# $hash_base is false.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name is sent inside a quoted-string; escape '"' and '\' the
        # same way git_snapshot does, so that a file name containing a
        # double quote cannot cut the header value short.
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* (and textual */*+xml) as text/plain, keeping whatever
        # followed the media type (e.g. the charset parameter).
        # The subtype in front of "+xml" needs the '+' quantifier: without it
        # only a one-letter subtype could match, so types such as
        # image/svg+xml were never downgraded.
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp mode: the blob is read and printed in one go
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6596
# 'blob' view: show one blob as an HTML page, either as numbered text
# lines or as an <img> tag pointing at the 'blob_plain' view.  Blobs that
# are neither text/* nor gif/png/jpeg and test as binary are handed over
# to git_blob_plain instead.
sub git_blob {
        my $expires;

        if (defined $hash) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d" if $hash =~ m/^[0-9a-fA-F]{40}$/;
        } elsif (defined $file_name) {
                my $base = $hash_base || git_get_head_hash($project);
                $hash = git_get_hash_by_path($base, $file_name, "blob")
                        or die_error(404, "Cannot find file");
        } else {
                die_error(400, "No file name defined");
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);

        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        my $displayable = ($mimetype =~ m!^(?:text/|image/(?:gif|png|jpeg)$)!);
        if (!$displayable && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }

        # we can have blame only for text/* mimetype
        $have_blame = $have_blame && $mimetype =~ m!^text/!;

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        if ($syntax) {
                $fd = run_highlighter($fd, $highlight, $syntax);
        }

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                # collect the links first, then glue them with " | "
                my @links;
                if (defined $file_name) {
                        if ($have_blame) {
                                push @links,
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame");
                        }
                        push @links,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history");
                        push @links,
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                        push @links,
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        push @links,
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                $formats_nav .= join(" | ", @links);

                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable commit: empty navigation, bare object id as title
                print "<div class=\"page_nav\">\n<br/><br/></div>\n" .
                      "<div class=\"title\">" . esc_html($hash) . "</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);

        print "<div class=\"page_body\">\n";
        if ($mimetype !~ m!^image/!) {
                # text: one <div> per line, with a linked line number
                my $lineno = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        ++$lineno;
                        $line = untabify($line);
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $lineno, esc_attr(href(-replay => 1)), $lineno, $lineno,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        } else {
                # image: let the browser fetch it through 'blob_plain'
                my $img = qq!<img type="! . esc_attr($mimetype) . qq!"!;
                if ($file_name) {
                        $img .= qq! alt="! . esc_attr($file_name) .
                                qq!" title="! . esc_attr($file_name) . qq!"!;
                }
                $img .= qq! src="! .
                        href(action=>"blob_plain", hash=>$hash,
                             hash_base=>$hash_base, file_name=>$file_name) .
                        qq!" />\n!;
                print $img;
        }
        unless (close $fd) {
                print "Reading blob failed.\n";
        }
        print "</div>";
        git_footer_html();
}
6689
# 'tree' view: list the entries of the tree named by $hash, or found at
# $file_name inside $hash_base ("HEAD" when no base is given).
sub git_tree {
        $hash_base = "HEAD" unless defined $hash_base;
        unless (defined $hash) {
                $hash = defined $file_name
                        ? git_get_hash_by_path($hash_base, $file_name, "tree")
                        : $hash_base;
        }
        defined($hash) or die_error(404, "No such tree");

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # 'ls-tree -z' output is NUL-terminated, read it record-wise
                local $/ = "\0";
                my @size_opt = $show_sizes ? ('-l') : ();
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        @size_opt, @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = <$fd>;
                chomp @entries;
                unless (close $fd) {
                        die_error(404, "Reading tree failed");
                }
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history");
                        push @views_nav,
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                # FIXME: Should be available when we have no hash base as well.
                push @views_nav, $snapshot_links
                        if defined $snapshot_links;

                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # base is not a commit we can parse: forget it, show bare id
                undef $hash_base;
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">" . esc_html($hash) . "</div>\n";
        }
        if (defined $file_name) {
                # directory prefix for the entries, always ending with '/'
                $basedir = $file_name;
                $basedir .= '/'
                        if $basedir ne '' && $basedir !~ m!/\z!;
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";

        # opens a table row, alternating between "dark" and "light"
        my $alternate = 1;
        my $print_row_start = sub {
                my $class = $alternate ? 'dark' : 'light';
                print "<tr class=\"$class\">\n";
                $alternate ^= 1;
        };

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                $print_row_start->();

                # strip the last path component; empty means top-level tree
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                $up = undef unless $up;

                # based on git_print_tree_entry
                my $size_cell = $show_sizes
                        ? '<td class="size">&nbsp;</td>'."\n"
                        : '';
                print '<td class="mode">' . mode_str('040000') . "</td>\n" .
                      $size_cell .
                      '<td class="list">' .
                      $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..") .
                      "</td>\n" .
                      "<td class=\"link\"></td>\n" .
                      "</tr>\n";
        }

        for my $entry (@entries) {
                my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

                $print_row_start->();
                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);
                print "</tr>\n";
        }
        print "</table>\n</div>";
        git_footer_html();
}
6799
# Build the base name "<project>-<version>" for a snapshot of $hash.
# In list context the name is returned twice (the caller in this file
# unpacks the pair as file name and archive prefix); in scalar context
# it is returned once.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $base = to_utf8($project);
        $base =~ s,([^/])/*\.git$,$1,;
        $base = basename($base);
        # sanitize name
        $base =~ s/[[:cntrl:]]/?/g;

        my $version = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash, but only when it is a prefix of the
                # full object id and longer than 7 characters
                my $full_hash = git_get_full_hash($project, $hash);
                if ($full_hash =~ /^$hash/ && length($hash) > 7) {
                        $version = git_get_short_hash($project, $hash);
                }
        }
        elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $version = $1;
        }
        else {
                # branches and other need shortened SHA-1 hash
                $version = $1
                        if $hash =~ m!^refs/(?:heads|remotes)/(.*)$!;
                $version .= '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $version =~ tr!/!.!;

        # name = project-version_string
        my $snapshot = "$base-$version";

        return $snapshot unless wantarray;
        return ($snapshot, $snapshot);
}
6836
# 'snapshot' view: send an archive of the tree-ish $hash, produced by
# "git archive" and optionally piped through the compressor configured
# for the requested format.
#
# The format comes from the 'snapshot_format' input parameter and falls
# back to the first entry of @snapshot_fmts.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # "^{}" peels tags, so the type reported is that of the final object
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # file name goes into a quoted-string: escape '"' and '\'
        $filename =~ s/(["\\])/\\$1/g;

        # Start the archiver before anything is written to the client, so
        # that a failure to launch it is still reported through die_error()
        # and not after a "200 OK" header has already been sent.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # Copy the archive in fixed-size chunks instead of reading all of
        # it into memory first; read() returns 0 at end of file and undef
        # on error, either of which ends the loop.
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6884
# Common driver for paged log-like views.
#
# Parameters:
#   $fmt_name  - name of the view, passed to format_paging_nav() and
#                git_print_page_nav()
#   $body_subr - code reference that prints the list; it is called with
#                (\@commitlist, 0, 99, $refs, $next_link,
#                 $file_name, $file_hash, $ftype)
#   $base      - revision to start from (the project's HEAD if undefined)
#   $parent    - if defined, the range "$parent..$base" is listed
#   $file_name - if defined, limit the list to this path
#   $file_hash - object id of that path; looked up in the listed commits
#                when not given
#
# Up to 101 commits are requested per page: 100 are meant for display and
# the presence of the 101st tells that there is a next page.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                for (my $i = 0; $i < @commitlist; $i++) {
                        $file_hash = git_get_hash_by_path($commitlist[$i]{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # Take the first element of the feature value in list context, the
        # way git_commitdiff reads the same feature.  NOTE(review): a
        # scalar-context call would yield an element count rather than the
        # configured limit if gitweb_get_feature() returns an array --
        # confirm against its definition.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # a negative limit allows the link regardless of list size
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project)
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6958
# 'log' view: git_log_generic with git_log_body as the list printer,
# for the range given by $hash and $hash_parent
sub git_log {
        my @range = ($hash, $hash_parent);
        return git_log_generic('log', \&git_log_body, @range);
}
6963
# 'commit' view: object header (authorship, commit id, tree and parent
# links), the commit message, and the list of changed files as reported
# by "git diff-tree".
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
                or die_error(404, "Unknown commit object");

        my $parents = $co{'parents'}; # listref
        my $parent  = $co{'parent'};

        # link to a commit, labelled with its id cut to 7 characters
        my $short_commit_link = sub {
                my ($id) = @_;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (defined $parent) {
                if (@$parents == 1) {
                        # single parent commit
                        $formats_nav .=
                                '(parent: ' . $short_commit_link->($parent) . ')';
                } else {
                        # merge commit
                        $formats_nav .=
                                '(merge: ' .
                                join(' ', map { $short_commit_link->($_) } @$parents) .
                                ')';
                }
        } else {
                # --root commitdiff
                $formats_nav .= '(initial)';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        $parent = "--root" unless defined $parent;
        # merges get a combined diff, everything else a diff to $parent
        my $diff_against = @$parents <= 1 ? $parent : '-c';
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                $diff_against,
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        unless (close $fd) {
                die_error(404, "Reading git-diff-tree failed");
        }

        # non-textual hash id's can be cached
        my $expires;
        $expires = "+1d" if $hash =~ m/^[0-9a-fA-F]{40}$/;

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        # title links to the diff, or to the tree for a parentless commit
        if (!defined $co{'parent'}) {
                git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
        } else {
                git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
        }

        print "<div class=\"title_text\">\n<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

        # tree row; its "link" cell stays open for the snapshot links
        print "<tr><td>tree</td><td class=\"sha1\">" .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                       class => "list"}, $co{'tree'}) .
              "</td><td class=\"link\">" .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td></tr>\n";

        # one row per parent
        for my $par (@$parents) {
                my $id_cell =
                        $cgi->a({-href => href(action=>"commit", hash=>$par),
                                 class => "list"}, $par);
                my $link_cell =
                        $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit") .
                        " | " .
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
                print "<tr><td>parent</td><td class=\"sha1\">" .
                      $id_cell .
                      "</td><td class=\"link\">" .
                      $link_cell .
                      "</td></tr>\n";
        }
        print "</table></div>\n";

        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7077
# 'object' view: find out the type of an object and redirect (302) to the
# view named after that type.
sub git_object {
        # object is defined by:
        # - hash or hash_base alone
        # - hash_base and file_name
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the object does not exist; do not
                # chomp undef (that only adds an "uninitialized" warning
                # on the way to the 404 below)
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");
                # never build a redirect without an action
                defined $type
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7124
# 'blobdiff' view: diff of a single file between $hash_parent_base and
# $hash_base.
#
# The optional first argument selects the output: 'html' (default) for a
# page rendered by git_patchset_body, or 'plain' for a text/plain patch.
# The file is identified by $file_name (and optionally $file_parent), or,
# failing that, by a 40-hex-digit $hash matched against the "to" id of
# the raw diff.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        # The status is given as a bare number like in every other
        # die_error() call here.  NOTE(review): the former string
        # '404 Not Found' presumably did not map to a known status inside
        # die_error() -- confirm against its definition.
        if (!%diffinfo) {
                die_error(404, "Missing one of the blob diff parameters")
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # The name is sent inside a quoted-string; escape '"' and
                # '\' the same way git_snapshot does for its file name.
                my $patch_name = "$file_name";
                $patch_name =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # In the patch header (everything up to and including the
                # "+++" line) replace object ids used as path names with
                # the real file names; the rest is copied through verbatim.
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7259
# 'blobdiff_plain' view: git_blobdiff with the 'plain' output format
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
7263
# Navigation fragment for switching between diff styles.
# It is meant to be appended to navigation that already exists, so every
# item carries a leading " | " ("| foo | bar" rather than "foo | bar").
# The style currently in use is shown as plain text, the others as links.
# Returns an empty string for combined diffs.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        if ($is_combined) {
                return "";
        }

        # display order and human readable labels of the known styles
        my @order = ('inline', 'sidebyside');
        my %label_of = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my $nav = '';
        foreach my $style (@order) {
                my $item;
                if ($style eq $diff_style) {
                        $item = $label_of{$style};
                } else {
                        $item = $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                        $label_of{$style});
                }
                $nav .= " | " . $item;
        }
        return $nav;
}
7284
# Outputs the changes introduced by commit $hash, or the difference between
# $hash_parent and $hash when $hash_parent is given.
#
# Named parameters:
#   -format => 'html' (default), 'plain' or 'patch'
#   -single => only looked at for the 'patch' format when no $hash_parent
#              is set: if true, exactly one patch is generated
#
# Works on the globals $hash, $hash_base, $hash_parent, $project and
# %input_params ('diff_style'); $hash and $hash_parent may be modified.
#
# Errors are reported through die_error():
#   403 - 'patch' format requested but the 'patches' feature is off
#   404 - $hash cannot be parsed as a commit
#   400 - unknown format
#   500 - the git command producing the diff could not be started
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                # the 'patch' link is offered only for non-merge commits
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of the parents
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                # consume only the raw part here; the patch part that follows
                # is left in $fd for git_patchset_body() below
                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                if ($hash_parent) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit parent commit (or for combined diffs)
                # the diff is shown against all parents of the commit
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # headers are already sent, so a failure can only be
                # reported inside the response body
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7512
# Plain-text flavour of commitdiff: calls git_commitdiff() with
# -format set to 'plain'.
sub git_commitdiff_plain {
        return git_commitdiff('-format' => 'plain');
}
7516
7517# format-patch-style patches
# Calls git_commitdiff() in 'patch' format with -single set.
sub git_patch {
        my @patch_opts = (
                '-format' => 'patch',
                '-single' => 1,
        );
        return git_commitdiff(@patch_opts);
}
7521
# Calls git_commitdiff() in 'patch' format without -single.
sub git_patches {
        return git_commitdiff('-format' => 'patch');
}
7525
# 'history' view: delegates to git_log_generic(), using git_history_body()
# as the body callback and passing the globals $hash_base,
# $hash_parent_base, $file_name and $hash, in that order.
sub git_history {
        my @log_args = (
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
        return git_log_generic(@log_args);
}
7531
# Entry point for searching: validates the request and hands it over to
# the routine implementing the requested search type.
#
# Works on the globals $searchtype (defaults to 'commit'), $searchtext,
# $hash (defaults to the result of git_get_head_hash($project)) and
# $page (defaults to 0).
#
# Errors are reported through die_error():
#   403 - search, or the requested pickaxe/grep search, is disabled
#   400 - $searchtext is not defined, or the search type is unknown
#   404 - $hash could not be parsed as a commit
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');

        # Search types guarded by a feature of the same name:
        # - pickaxe may take all resources of your box and run for several
        #   minutes with every query - so decide by yourself how public
        #   you make this feature
        # - grep search might be potentially CPU-intensive, too
        my %disabled_message_for = (
                'pickaxe' => "Pickaxe search is disabled",
                'grep'    => "Grep search is disabled",
        );
        if (exists $disabled_message_for{$searchtype} &&
            !gitweb_check_feature($searchtype)) {
                die_error(403, $disabled_message_for{$searchtype});
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => routine doing the actual work
        my %search_sub_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );
        my $search_sub = $search_sub_for{$searchtype};
        if (defined $search_sub) {
                $search_sub->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
7576
# Prints the help page describing the available search types.
#
# The 'commit', 'author' and 'committer' entries are always printed; the
# 'grep' and 'pickaxe' entries are printed only when the feature of the
# same name is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general introduction, start of the definition list, 'commit'
        print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        if (gitweb_check_feature('grep')) {
                print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        if (gitweb_check_feature('pickaxe')) {
                print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7620
# 'shortlog' view: delegates to git_log_generic(), using
# git_shortlog_body() as the body callback and passing the globals
# $hash and $hash_parent.
sub git_shortlog {
        my @log_args = (
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
        return git_log_generic(@log_args);
}
7625
7626## ......................................................................
7627## feeds (RSS, Atom; OPML)
7628
# Generates a web feed (Atom or RSS) of recent commits.
#
#   $format - 'atom' (default) or 'rss'; anything else is rejected with
#             die_error(400, ...)
#
# Works on the globals $hash (starting point, 'HEAD' if not set) and
# $file_name (limits the feed to the history of that path, if set).
# At most 150 commits are read.
#
# HTTP handling:
#   - the content type is "application/$format+xml", unless the client's
#     Accept header rates text/xml higher
#   - Last-Modified is taken from the committer date of the newest commit
#   - a request with If-Modified-Since not older than that date is
#     answered with "304 Not Modified" (needs HTTP::Date or
#     Time::ParseDate to parse the header; without them the full feed
#     is always sent)
#   - for HEAD requests only the headers are sent
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                %latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # both date parsing modules are optional; if neither
                        # can be loaded $since stays undefined and the feed
                        # is sent in full
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title contains request data ($hash, $file_name) and is put
        # into element content below, so it must be escaped
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (defined $descr) {
                $descr = esc_html($descr);
        } else {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for (my $i = 0; $i <= $#commitlist; $i++) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files
                # (a commit whose file list cannot be read is left out of the feed)
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        $line = esc_html($line);
                        print "$line\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        # per-file links: [D]iff, [B]lame (if enabled), [H]istory
                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
7884
# RSS flavour of the web feed: calls git_feed() with the 'rss' format.
sub git_rss {
        return git_feed('rss');
}
7888
# Atom flavour of the web feed: calls git_feed() with the 'atom' format.
sub git_atom {
        return git_feed('atom');
}
7892
# Prints an OPML document with one RSS outline entry per project.
#
# The project list comes from git_get_projects_list(), called with the
# globals $project_filter and $strict_export; an empty list is reported
# with die_error(404, ...).  Projects for which no head hash is found,
# or whose head cannot be parsed as a commit, are left out.
#
# Note that the global $git_dir is set for every project examined and is
# not restored afterwards.
sub git_opml {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found")
                unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # the document title mentions the subdirectory only when filtering
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";

        print <<OPML_HEAD;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
OPML_HEAD

        foreach my $proj (@projects) {
                my $proj_path = $proj->{'path'};

                my $head = git_get_head_hash($proj_path);
                next unless defined $head;

                # parse_commit() is called right after pointing $git_dir
                # at this project
                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next unless %co;

                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print qq{<outline type="rss" text="$path" title="$path" xmlUrl="$rss" htmlUrl="$html"/>\n};
        }

        print <<OPML_TAIL;
</outline>
</body>
</opml>
OPML_TAIL
}