48a2a375be490f54edb9712ccafcac3d66b7e22d
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
  23our $t0 = [ gettimeofday() ];
  24our $number_of_git_cmds = 0;
  25
  26BEGIN {
  27        CGI->compile() if $ENV{'MOD_PERL'};
  28}
  29
  30our $version = "++GIT_VERSION++";
  31
  32our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  33sub evaluate_uri {
  34        our $cgi;
  35
  36        our $my_url = $cgi->url();
  37        our $my_uri = $cgi->url(-absolute => 1);
  38
  39        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  40        # needed and used only for URLs with nonempty PATH_INFO
  41        our $base_url = $my_url;
  42
  43        # When the script is used as DirectoryIndex, the URL does not contain the name
  44        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  45        # have to do it ourselves. We make $path_info global because it's also used
  46        # later on.
  47        #
  48        # Another issue with the script being the DirectoryIndex is that the resulting
  49        # $my_url data is not the full script URL: this is good, because we want
  50        # generated links to keep implying the script name if it wasn't explicitly
  51        # indicated in the URL we're handling, but it means that $my_url cannot be used
  52        # as base URL.
  53        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  54        # to build the base URL ourselves:
  55        our $path_info = $ENV{"PATH_INFO"};
  56        if ($path_info) {
  57                if ($my_url =~ s,\Q$path_info\E$,, &&
  58                    $my_uri =~ s,\Q$path_info\E$,, &&
  59                    defined $ENV{'SCRIPT_NAME'}) {
  60                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  61                }
  62        }
  63
  64        # target of the home link on top of all pages
  65        our $home_link = $my_uri || "/";
  66}
  67
  68# core git executable to use
  69# this can just be "git" if your webserver has a sensible PATH
  70our $GIT = "++GIT_BINDIR++/git";
  71
  72# absolute fs-path which will be prepended to the project path
  73#our $projectroot = "/pub/scm";
  74our $projectroot = "++GITWEB_PROJECTROOT++";
  75
  76# fs traversing limit for getting project list
  77# the number is relative to the projectroot
  78our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  79
  80# string of the home link on top of all pages
  81our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  82
  83# name of your site or organization to appear in page titles
  84# replace this with something more descriptive for clearer bookmarks
  85our $site_name = "++GITWEB_SITENAME++"
  86                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  87
  88# html snippet to include in the <head> section of each page
  89our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
  90# filename of html text to include at top of each page
  91our $site_header = "++GITWEB_SITE_HEADER++";
  92# html text to include at home page
  93our $home_text = "++GITWEB_HOMETEXT++";
  94# filename of html text to include at bottom of each page
  95our $site_footer = "++GITWEB_SITE_FOOTER++";
  96
  97# URI of stylesheets
  98our @stylesheets = ("++GITWEB_CSS++");
  99# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 100our $stylesheet = undef;
 101# URI of GIT logo (72x27 size)
 102our $logo = "++GITWEB_LOGO++";
 103# URI of GIT favicon, assumed to be image/png type
 104our $favicon = "++GITWEB_FAVICON++";
 105# URI of gitweb.js (JavaScript code for gitweb)
 106our $javascript = "++GITWEB_JS++";
 107
 108# URI and label (title) of GIT logo link
 109#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 110#our $logo_label = "git documentation";
 111our $logo_url = "http://git-scm.com/";
 112our $logo_label = "git homepage";
 113
 114# source of projects list
 115our $projects_list = "++GITWEB_LIST++";
 116
 117# the width (in characters) of the projects list "Description" column
 118our $projects_list_description_width = 25;
 119
 120# group projects by category on the projects list
 121# (enabled if this variable evaluates to true)
 122our $projects_list_group_categories = 0;
 123
 124# default category if none specified
 125# (leave the empty string for no category)
 126our $project_list_default_category = "";
 127
 128# default order of projects list
 129# valid values are none, project, descr, owner, and age
 130our $default_projects_order = "project";
 131
 132# show repository only if this file exists
 133# (only effective if this variable evaluates to true)
 134our $export_ok = "++GITWEB_EXPORT_OK++";
 135
 136# show repository only if this subroutine returns true
 137# when given the path to the project, for example:
 138#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 139our $export_auth_hook = undef;
 140
 141# only allow viewing of repositories also shown on the overview page
 142our $strict_export = "++GITWEB_STRICT_EXPORT++";
 143
 144# list of git base URLs used for URL to where fetch project from,
 145# i.e. full URL is "$git_base_url/$project"
 146our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 147
 148# default blob_plain mimetype and default charset for text/plain blob
 149our $default_blob_plain_mimetype = 'text/plain';
 150our $default_text_plain_charset  = undef;
 151
 152# file to use for guessing MIME types before trying /etc/mime.types
 153# (relative to the current git repository)
 154our $mimetypes_file = undef;
 155
 156# assume this charset if line contains non-UTF-8 characters;
 157# it should be valid encoding (see Encoding::Supported(3pm) for list),
 158# for which encoding all byte sequences are valid, for example
 159# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 160# could be even 'utf-8' for the old behavior)
 161our $fallback_encoding = 'latin1';
 162
 163# rename detection options for git-diff and git-diff-tree
 164# - default is '-M', with the cost proportional to
 165#   (number of removed files) * (number of new files).
 166# - more costly is '-C' (which implies '-M'), with the cost proportional to
 167#   (number of changed files + number of removed files) * (number of new files)
 168# - even more costly is '-C', '--find-copies-harder' with cost
 169#   (number of files in the original tree) * (number of new files)
 170# - one might want to include '-B' option, e.g. '-B', '-M'
 171our @diff_opts = ('-M'); # taken from git_commit
 172
 173# Disables features that would allow repository owners to inject script into
 174# the gitweb domain.
 175our $prevent_xss = 0;
 176
 177# Path to the highlight executable to use (must be the one from
 178# http://www.andre-simon.de due to assumptions about parameters and output).
 179# Useful if highlight is not installed on your webserver's PATH.
 180# [Default: highlight]
 181our $highlight_bin = "++HIGHLIGHT_BIN++";
 182
 183# information about snapshot formats that gitweb is capable of serving
 184our %known_snapshot_formats = (
 185        # name => {
 186        #       'display' => display name,
 187        #       'type' => mime type,
 188        #       'suffix' => filename suffix,
 189        #       'format' => --format for git-archive,
 190        #       'compressor' => [compressor command and arguments]
 191        #                       (array reference, optional)
 192        #       'disabled' => boolean (optional)}
 193        #
 194        'tgz' => {
 195                'display' => 'tar.gz',
 196                'type' => 'application/x-gzip',
 197                'suffix' => '.tar.gz',
 198                'format' => 'tar',
 199                'compressor' => ['gzip', '-n']},
 200
 201        'tbz2' => {
 202                'display' => 'tar.bz2',
 203                'type' => 'application/x-bzip2',
 204                'suffix' => '.tar.bz2',
 205                'format' => 'tar',
 206                'compressor' => ['bzip2']},
 207
 208        'txz' => {
 209                'display' => 'tar.xz',
 210                'type' => 'application/x-xz',
 211                'suffix' => '.tar.xz',
 212                'format' => 'tar',
 213                'compressor' => ['xz'],
 214                'disabled' => 1},
 215
 216        'zip' => {
 217                'display' => 'zip',
 218                'type' => 'application/x-zip',
 219                'suffix' => '.zip',
 220                'format' => 'zip'},
 221);
 222
 223# Aliases so we understand old gitweb.snapshot values in repository
 224# configuration.
 225our %known_snapshot_format_aliases = (
 226        'gzip'  => 'tgz',
 227        'bzip2' => 'tbz2',
 228        'xz'    => 'txz',
 229
 230        # backward compatibility: legacy gitweb config support
 231        'x-gzip' => undef, 'gz' => undef,
 232        'x-bzip2' => undef, 'bz2' => undef,
 233        'x-zip' => undef, '' => undef,
 234);
 235
 236# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 237# are changed, it may be appropriate to change these values too via
 238# $GITWEB_CONFIG.
 239our %avatar_size = (
 240        'default' => 16,
 241        'double'  => 32
 242);
 243
 244# Used to set the maximum load that we will still respond to gitweb queries.
 245# If server load exceed this value then return "503 server busy" error.
 246# If gitweb cannot determined server load, it is taken to be 0.
 247# Leave it undefined (or set to 'undef') to turn off load checking.
 248our $maxload = 300;
 249
 250# configuration for 'highlight' (http://www.andre-simon.de/)
 251# match by basename
 252our %highlight_basename = (
 253        #'Program' => 'py',
 254        #'Library' => 'py',
 255        'SConstruct' => 'py', # SCons equivalent of Makefile
 256        'Makefile' => 'make',
 257);
 258# match by extension
 259our %highlight_ext = (
 260        # main extensions, defining name of syntax;
 261        # see files in /usr/share/highlight/langDefs/ directory
 262        map { $_ => $_ }
 263                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
 264        # alternate extensions, see /etc/highlight/filetypes.conf
 265        'h' => 'c',
 266        map { $_ => 'sh'  } qw(bash zsh ksh),
 267        map { $_ => 'cpp' } qw(cxx c++ cc),
 268        map { $_ => 'php' } qw(php3 php4 php5 phps),
 269        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
 270        map { $_ => 'make'} qw(mak mk),
 271        map { $_ => 'xml' } qw(xhtml html htm),
 272);
 273
 274# You define site-wide feature defaults here; override them with
 275# $GITWEB_CONFIG as necessary.
 276our %feature = (
 277        # feature => {
 278        #       'sub' => feature-sub (subroutine),
 279        #       'override' => allow-override (boolean),
 280        #       'default' => [ default options...] (array reference)}
 281        #
 282        # if feature is overridable (it means that allow-override has true value),
 283        # then feature-sub will be called with default options as parameters;
 284        # return value of feature-sub indicates if to enable specified feature
 285        #
 286        # if there is no 'sub' key (no feature-sub), then feature cannot be
 287        # overridden
 288        #
 289        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 290        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 291        # is enabled
 292
 293        # Enable the 'blame' blob view, showing the last commit that modified
 294        # each line in the file. This can be very CPU-intensive.
 295
 296        # To enable system wide have in $GITWEB_CONFIG
 297        # $feature{'blame'}{'default'} = [1];
 298        # To have project specific config enable override in $GITWEB_CONFIG
 299        # $feature{'blame'}{'override'} = 1;
 300        # and in project config gitweb.blame = 0|1;
 301        'blame' => {
 302                'sub' => sub { feature_bool('blame', @_) },
 303                'override' => 0,
 304                'default' => [0]},
 305
 306        # Enable the 'snapshot' link, providing a compressed archive of any
 307        # tree. This can potentially generate high traffic if you have large
 308        # project.
 309
 310        # Value is a list of formats defined in %known_snapshot_formats that
 311        # you wish to offer.
 312        # To disable system wide have in $GITWEB_CONFIG
 313        # $feature{'snapshot'}{'default'} = [];
 314        # To have project specific config enable override in $GITWEB_CONFIG
 315        # $feature{'snapshot'}{'override'} = 1;
 316        # and in project config, a comma-separated list of formats or "none"
 317        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 318        'snapshot' => {
 319                'sub' => \&feature_snapshot,
 320                'override' => 0,
 321                'default' => ['tgz']},
 322
 323        # Enable text search, which will list the commits which match author,
 324        # committer or commit text to a given string.  Enabled by default.
 325        # Project specific override is not supported.
 326        #
 327        # Note that this controls all search features, which means that if
 328        # it is disabled, then 'grep' and 'pickaxe' search would also be
 329        # disabled.
 330        'search' => {
 331                'override' => 0,
 332                'default' => [1]},
 333
 334        # Enable grep search, which will list the files in currently selected
 335        # tree containing the given string. Enabled by default. This can be
 336        # potentially CPU-intensive, of course.
 337        # Note that you need to have 'search' feature enabled too.
 338
 339        # To enable system wide have in $GITWEB_CONFIG
 340        # $feature{'grep'}{'default'} = [1];
 341        # To have project specific config enable override in $GITWEB_CONFIG
 342        # $feature{'grep'}{'override'} = 1;
 343        # and in project config gitweb.grep = 0|1;
 344        'grep' => {
 345                'sub' => sub { feature_bool('grep', @_) },
 346                'override' => 0,
 347                'default' => [1]},
 348
 349        # Enable the pickaxe search, which will list the commits that modified
 350        # a given string in a file. This can be practical and quite faster
 351        # alternative to 'blame', but still potentially CPU-intensive.
 352        # Note that you need to have 'search' feature enabled too.
 353
 354        # To enable system wide have in $GITWEB_CONFIG
 355        # $feature{'pickaxe'}{'default'} = [1];
 356        # To have project specific config enable override in $GITWEB_CONFIG
 357        # $feature{'pickaxe'}{'override'} = 1;
 358        # and in project config gitweb.pickaxe = 0|1;
 359        'pickaxe' => {
 360                'sub' => sub { feature_bool('pickaxe', @_) },
 361                'override' => 0,
 362                'default' => [1]},
 363
 364        # Enable showing size of blobs in a 'tree' view, in a separate
 365        # column, similar to what 'ls -l' does.  This cost a bit of IO.
 366
 367        # To disable system wide have in $GITWEB_CONFIG
 368        # $feature{'show-sizes'}{'default'} = [0];
 369        # To have project specific config enable override in $GITWEB_CONFIG
 370        # $feature{'show-sizes'}{'override'} = 1;
 371        # and in project config gitweb.showsizes = 0|1;
 372        'show-sizes' => {
 373                'sub' => sub { feature_bool('showsizes', @_) },
 374                'override' => 0,
 375                'default' => [1]},
 376
 377        # Make gitweb use an alternative format of the URLs which can be
 378        # more readable and natural-looking: project name is embedded
 379        # directly in the path and the query string contains other
 380        # auxiliary information. All gitweb installations recognize
 381        # URL in either format; this configures in which formats gitweb
 382        # generates links.
 383
 384        # To enable system wide have in $GITWEB_CONFIG
 385        # $feature{'pathinfo'}{'default'} = [1];
 386        # Project specific override is not supported.
 387
 388        # Note that you will need to change the default location of CSS,
 389        # favicon, logo and possibly other files to an absolute URL. Also,
 390        # if gitweb.cgi serves as your indexfile, you will need to force
 391        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 392        'pathinfo' => {
 393                'override' => 0,
 394                'default' => [0]},
 395
 396        # Make gitweb consider projects in project root subdirectories
 397        # to be forks of existing projects. Given project $projname.git,
 398        # projects matching $projname/*.git will not be shown in the main
 399        # projects list, instead a '+' mark will be added to $projname
 400        # there and a 'forks' view will be enabled for the project, listing
 401        # all the forks. If project list is taken from a file, forks have
 402        # to be listed after the main project.
 403
 404        # To enable system wide have in $GITWEB_CONFIG
 405        # $feature{'forks'}{'default'} = [1];
 406        # Project specific override is not supported.
 407        'forks' => {
 408                'override' => 0,
 409                'default' => [0]},
 410
 411        # Insert custom links to the action bar of all project pages.
 412        # This enables you mainly to link to third-party scripts integrating
 413        # into gitweb; e.g. git-browser for graphical history representation
 414        # or custom web-based repository administration interface.
 415
 416        # The 'default' value consists of a list of triplets in the form
 417        # (label, link, position) where position is the label after which
 418        # to insert the link and link is a format string where %n expands
 419        # to the project name, %f to the project path within the filesystem,
 420        # %h to the current hash (h gitweb parameter) and %b to the current
 421        # hash base (hb gitweb parameter); %% expands to %.
 422
 423        # To enable system wide have in $GITWEB_CONFIG e.g.
 424        # $feature{'actions'}{'default'} = [('graphiclog',
 425        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 426        # Project specific override is not supported.
 427        'actions' => {
 428                'override' => 0,
 429                'default' => []},
 430
 431        # Allow gitweb scan project content tags of project repository,
 432        # and display the popular Web 2.0-ish "tag cloud" near the projects
 433        # list.  Note that this is something COMPLETELY different from the
 434        # normal Git tags.
 435
 436        # gitweb by itself can show existing tags, but it does not handle
 437        # tagging itself; you need to do it externally, outside gitweb.
 438        # The format is described in git_get_project_ctags() subroutine.
 439        # You may want to install the HTML::TagCloud Perl module to get
 440        # a pretty tag cloud instead of just a list of tags.
 441
 442        # To enable system wide have in $GITWEB_CONFIG
 443        # $feature{'ctags'}{'default'} = [1];
 444        # Project specific override is not supported.
 445
 446        # In the future whether ctags editing is enabled might depend
 447        # on the value, but using 1 should always mean no editing of ctags.
 448        'ctags' => {
 449                'override' => 0,
 450                'default' => [0]},
 451
 452        # The maximum number of patches in a patchset generated in patch
 453        # view. Set this to 0 or undef to disable patch view, or to a
 454        # negative number to remove any limit.
 455
 456        # To disable system wide have in $GITWEB_CONFIG
 457        # $feature{'patches'}{'default'} = [0];
 458        # To have project specific config enable override in $GITWEB_CONFIG
 459        # $feature{'patches'}{'override'} = 1;
 460        # and in project config gitweb.patches = 0|n;
 461        # where n is the maximum number of patches allowed in a patchset.
 462        'patches' => {
 463                'sub' => \&feature_patches,
 464                'override' => 0,
 465                'default' => [16]},
 466
 467        # Avatar support. When this feature is enabled, views such as
 468        # shortlog or commit will display an avatar associated with
 469        # the email of the committer(s) and/or author(s).
 470
 471        # Currently available providers are gravatar and picon.
 472        # If an unknown provider is specified, the feature is disabled.
 473
 474        # Gravatar depends on Digest::MD5.
 475        # Picon currently relies on the indiana.edu database.
 476
 477        # To enable system wide have in $GITWEB_CONFIG
 478        # $feature{'avatar'}{'default'} = ['<provider>'];
 479        # where <provider> is either gravatar or picon.
 480        # To have project specific config enable override in $GITWEB_CONFIG
 481        # $feature{'avatar'}{'override'} = 1;
 482        # and in project config gitweb.avatar = <provider>;
 483        'avatar' => {
 484                'sub' => \&feature_avatar,
 485                'override' => 0,
 486                'default' => ['']},
 487
 488        # Enable displaying how much time and how many git commands
 489        # it took to generate and display page.  Disabled by default.
 490        # Project specific override is not supported.
 491        'timed' => {
 492                'override' => 0,
 493                'default' => [0]},
 494
 495        # Enable turning some links into links to actions which require
 496        # JavaScript to run (like 'blame_incremental').  Not enabled by
 497        # default.  Project specific override is currently not supported.
 498        'javascript-actions' => {
 499                'override' => 0,
 500                'default' => [0]},
 501
 502        # Enable and configure ability to change common timezone for dates
 503        # in gitweb output via JavaScript.  Enabled by default.
 504        # Project specific override is not supported.
 505        'javascript-timezone' => {
 506                'override' => 0,
 507                'default' => [
 508                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 509                                     # or undef to turn off this feature
 510                        'gitweb_tz', # name of cookie where to store selected timezone
 511                        'datetime',  # CSS class used to mark up dates for manipulation
 512                ]},
 513
 514        # Syntax highlighting support. This is based on Daniel Svensson's
 515        # and Sham Chukoury's work in gitweb-xmms2.git.
 516        # It requires the 'highlight' program present in $PATH,
 517        # and therefore is disabled by default.
 518
 519        # To enable system wide have in $GITWEB_CONFIG
 520        # $feature{'highlight'}{'default'} = [1];
 521
 522        'highlight' => {
 523                'sub' => sub { feature_bool('highlight', @_) },
 524                'override' => 0,
 525                'default' => [0]},
 526
 527        # Enable displaying of remote heads in the heads list
 528
 529        # To enable system wide have in $GITWEB_CONFIG
 530        # $feature{'remote_heads'}{'default'} = [1];
 531        # To have project specific config enable override in $GITWEB_CONFIG
 532        # $feature{'remote_heads'}{'override'} = 1;
 533        # and in project config gitweb.remote_heads = 0|1;
 534        'remote_heads' => {
 535                'sub' => sub { feature_bool('remote_heads', @_) },
 536                'override' => 0,
 537                'default' => [0]},
 538);
 539
 540sub gitweb_get_feature {
 541        my ($name) = @_;
 542        return unless exists $feature{$name};
 543        my ($sub, $override, @defaults) = (
 544                $feature{$name}{'sub'},
 545                $feature{$name}{'override'},
 546                @{$feature{$name}{'default'}});
 547        # project specific override is possible only if we have project
 548        our $git_dir; # global variable, declared later
 549        if (!$override || !defined $git_dir) {
 550                return @defaults;
 551        }
 552        if (!defined $sub) {
 553                warn "feature $name is not overridable";
 554                return @defaults;
 555        }
 556        return $sub->(@defaults);
 557}
 558
 559# A wrapper to check if a given feature is enabled.
 560# With this, you can say
 561#
 562#   my $bool_feat = gitweb_check_feature('bool_feat');
 563#   gitweb_check_feature('bool_feat') or somecode;
 564#
 565# instead of
 566#
 567#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 568#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 569#
 570sub gitweb_check_feature {
 571        return (gitweb_get_feature(@_))[0];
 572}
 573
 574
 575sub feature_bool {
 576        my $key = shift;
 577        my ($val) = git_get_project_config($key, '--bool');
 578
 579        if (!defined $val) {
 580                return ($_[0]);
 581        } elsif ($val eq 'true') {
 582                return (1);
 583        } elsif ($val eq 'false') {
 584                return (0);
 585        }
 586}
 587
 588sub feature_snapshot {
 589        my (@fmts) = @_;
 590
 591        my ($val) = git_get_project_config('snapshot');
 592
 593        if ($val) {
 594                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 595        }
 596
 597        return @fmts;
 598}
 599
 600sub feature_patches {
 601        my @val = (git_get_project_config('patches', '--int'));
 602
 603        if (@val) {
 604                return @val;
 605        }
 606
 607        return ($_[0]);
 608}
 609
 610sub feature_avatar {
 611        my @val = (git_get_project_config('avatar'));
 612
 613        return @val ? @val : @_;
 614}
 615
 616# checking HEAD file with -e is fragile if the repository was
 617# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 618# and then pruned.
 619sub check_head_link {
 620        my ($dir) = @_;
 621        my $headfile = "$dir/HEAD";
 622        return ((-e $headfile) ||
 623                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 624}
 625
 626sub check_export_ok {
 627        my ($dir) = @_;
 628        return (check_head_link($dir) &&
 629                (!$export_ok || -e "$dir/$export_ok") &&
 630                (!$export_auth_hook || $export_auth_hook->($dir)));
 631}
 632
 633# process alternate names for backward compatibility
 634# filter out unsupported (unknown) snapshot formats
 635sub filter_snapshot_fmts {
 636        my @fmts = @_;
 637
 638        @fmts = map {
 639                exists $known_snapshot_format_aliases{$_} ?
 640                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 641        @fmts = grep {
 642                exists $known_snapshot_formats{$_} &&
 643                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 644}
 645
 646# If it is set to code reference, it is code that it is to be run once per
 647# request, allowing updating configurations that change with each request,
 648# while running other code in config file only once.
 649#
 650# Otherwise, if it is false then gitweb would process config file only once;
 651# if it is true then gitweb config would be run for each request.
 652our $per_request_config = 1;
 653
 654# read and parse gitweb config file given by its parameter.
 655# returns true on success, false on recoverable error, allowing
 656# to chain this subroutine, using first file that exists.
 657# dies on errors during parsing config file, as it is unrecoverable.
 658sub read_config_file {
 659        my $filename = shift;
 660        return unless defined $filename;
 661        # die if there are errors parsing config file
 662        if (-e $filename) {
 663                do $filename;
 664                die $@ if $@;
 665                return 1;
 666        }
 667        return;
 668}
 669
 670our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
 671sub evaluate_gitweb_config {
 672        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 673        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 674        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
 675
 676        # Protect agains duplications of file names, to not read config twice.
 677        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
 678        # there possibility of duplication of filename there doesn't matter.
 679        $GITWEB_CONFIG = ""        if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
 680        $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
 681
 682        # Common system-wide settings for convenience.
 683        # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
 684        read_config_file($GITWEB_CONFIG_COMMON);
 685
 686        # Use first config file that exists.  This means use the per-instance
 687        # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
 688        read_config_file($GITWEB_CONFIG) and return;
 689        read_config_file($GITWEB_CONFIG_SYSTEM);
 690}
 691
 692# Get loadavg of system, to compare against $maxload.
 693# Currently it requires '/proc/loadavg' present to get loadavg;
 694# if it is not present it returns 0, which means no load checking.
 695sub get_loadavg {
 696        if( -e '/proc/loadavg' ){
 697                open my $fd, '<', '/proc/loadavg'
 698                        or return 0;
 699                my @load = split(/\s+/, scalar <$fd>);
 700                close $fd;
 701
 702                # The first three columns measure CPU and IO utilization of the last one,
 703                # five, and 10 minute periods.  The fourth column shows the number of
 704                # currently running processes and the total number of processes in the m/n
 705                # format.  The last column displays the last process ID used.
 706                return $load[0] || 0;
 707        }
 708        # additional checks for load average should go here for things that don't export
 709        # /proc/loadavg
 710
 711        return 0;
 712}
 713
 714# version of the core git binary
 715our $git_version;
 716sub evaluate_git_version {
 717        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 718        $number_of_git_cmds++;
 719}
 720
 721sub check_loadavg {
 722        if (defined $maxload && get_loadavg() > $maxload) {
 723                die_error(503, "The load average on the server is too high");
 724        }
 725}
 726
 727# ======================================================================
 728# input validation and dispatch
 729
 730# input parameters can be collected from a variety of sources (presently, CGI
 731# and PATH_INFO), so we define an %input_params hash that collects them all
 732# together during validation: this allows subsequent uses (e.g. href()) to be
 733# agnostic of the parameter origin
 734
 735our %input_params = ();
 736
 737# input parameters are stored with the long parameter name as key. This will
 738# also be used in the href subroutine to convert parameters to their CGI
 739# equivalent, and since the href() usage is the most frequent one, we store
 740# the name -> CGI key mapping here, instead of the reverse.
 741#
 742# XXX: Warning: If you touch this, check the search form for updating,
 743# too.
 744
 745our @cgi_param_mapping = (
 746        project => "p",
 747        action => "a",
 748        file_name => "f",
 749        file_parent => "fp",
 750        hash => "h",
 751        hash_parent => "hp",
 752        hash_base => "hb",
 753        hash_parent_base => "hpb",
 754        page => "pg",
 755        order => "o",
 756        searchtext => "s",
 757        searchtype => "st",
 758        snapshot_format => "sf",
 759        extra_options => "opt",
 760        search_use_regexp => "sr",
 761        ctag => "by_tag",
 762        diff_style => "ds",
 763        # this must be last entry (for manipulation from JavaScript)
 764        javascript => "js"
 765);
 766our %cgi_param_mapping = @cgi_param_mapping;
 767
 768# we will also need to know the possible actions, for validation
 769our %actions = (
 770        "blame" => \&git_blame,
 771        "blame_incremental" => \&git_blame_incremental,
 772        "blame_data" => \&git_blame_data,
 773        "blobdiff" => \&git_blobdiff,
 774        "blobdiff_plain" => \&git_blobdiff_plain,
 775        "blob" => \&git_blob,
 776        "blob_plain" => \&git_blob_plain,
 777        "commitdiff" => \&git_commitdiff,
 778        "commitdiff_plain" => \&git_commitdiff_plain,
 779        "commit" => \&git_commit,
 780        "forks" => \&git_forks,
 781        "heads" => \&git_heads,
 782        "history" => \&git_history,
 783        "log" => \&git_log,
 784        "patch" => \&git_patch,
 785        "patches" => \&git_patches,
 786        "remotes" => \&git_remotes,
 787        "rss" => \&git_rss,
 788        "atom" => \&git_atom,
 789        "search" => \&git_search,
 790        "search_help" => \&git_search_help,
 791        "shortlog" => \&git_shortlog,
 792        "summary" => \&git_summary,
 793        "tag" => \&git_tag,
 794        "tags" => \&git_tags,
 795        "tree" => \&git_tree,
 796        "snapshot" => \&git_snapshot,
 797        "object" => \&git_object,
 798        # those below don't need $project
 799        "opml" => \&git_opml,
 800        "project_list" => \&git_project_list,
 801        "project_index" => \&git_project_index,
 802);
 803
 804# finally, we have the hash of allowed extra_options for the commands that
 805# allow them
 806our %allowed_options = (
 807        "--no-merges" => [ qw(rss atom log shortlog history) ],
 808);
 809
 810# fill %input_params with the CGI parameters. All values except for 'opt'
 811# should be single values, but opt can be an array. We should probably
 812# build an array of parameters that can be multi-valued, but since for the time
 813# being it's only this one, we just single it out
 814sub evaluate_query_params {
 815        our $cgi;
 816
 817        while (my ($name, $symbol) = each %cgi_param_mapping) {
 818                if ($symbol eq 'opt') {
 819                        $input_params{$name} = [ $cgi->param($symbol) ];
 820                } else {
 821                        $input_params{$name} = $cgi->param($symbol);
 822                }
 823        }
 824}
 825
 826# now read PATH_INFO and update the parameter list for missing parameters
 827sub evaluate_path_info {
 828        return if defined $input_params{'project'};
 829        return if !$path_info;
 830        $path_info =~ s,^/+,,;
 831        return if !$path_info;
 832
 833        # find which part of PATH_INFO is project
 834        my $project = $path_info;
 835        $project =~ s,/+$,,;
 836        while ($project && !check_head_link("$projectroot/$project")) {
 837                $project =~ s,/*[^/]*$,,;
 838        }
 839        return unless $project;
 840        $input_params{'project'} = $project;
 841
 842        # do not change any parameters if an action is given using the query string
 843        return if $input_params{'action'};
 844        $path_info =~ s,^\Q$project\E/*,,;
 845
 846        # next, check if we have an action
 847        my $action = $path_info;
 848        $action =~ s,/.*$,,;
 849        if (exists $actions{$action}) {
 850                $path_info =~ s,^$action/*,,;
 851                $input_params{'action'} = $action;
 852        }
 853
 854        # list of actions that want hash_base instead of hash, but can have no
 855        # pathname (f) parameter
 856        my @wants_base = (
 857                'tree',
 858                'history',
 859        );
 860
 861        # we want to catch, among others
 862        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 863        my ($parentrefname, $parentpathname, $refname, $pathname) =
 864                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 865
 866        # first, analyze the 'current' part
 867        if (defined $pathname) {
 868                # we got "branch:filename" or "branch:dir/"
 869                # we could use git_get_type(branch:pathname), but:
 870                # - it needs $git_dir
 871                # - it does a git() call
 872                # - the convention of terminating directories with a slash
 873                #   makes it superfluous
 874                # - embedding the action in the PATH_INFO would make it even
 875                #   more superfluous
 876                $pathname =~ s,^/+,,;
 877                if (!$pathname || substr($pathname, -1) eq "/") {
 878                        $input_params{'action'} ||= "tree";
 879                        $pathname =~ s,/$,,;
 880                } else {
 881                        # the default action depends on whether we had parent info
 882                        # or not
 883                        if ($parentrefname) {
 884                                $input_params{'action'} ||= "blobdiff_plain";
 885                        } else {
 886                                $input_params{'action'} ||= "blob_plain";
 887                        }
 888                }
 889                $input_params{'hash_base'} ||= $refname;
 890                $input_params{'file_name'} ||= $pathname;
 891        } elsif (defined $refname) {
 892                # we got "branch". In this case we have to choose if we have to
 893                # set hash or hash_base.
 894                #
 895                # Most of the actions without a pathname only want hash to be
 896                # set, except for the ones specified in @wants_base that want
 897                # hash_base instead. It should also be noted that hand-crafted
 898                # links having 'history' as an action and no pathname or hash
 899                # set will fail, but that happens regardless of PATH_INFO.
 900                if (defined $parentrefname) {
 901                        # if there is parent let the default be 'shortlog' action
 902                        # (for http://git.example.com/repo.git/A..B links); if there
 903                        # is no parent, dispatch will detect type of object and set
 904                        # action appropriately if required (if action is not set)
 905                        $input_params{'action'} ||= "shortlog";
 906                }
 907                if ($input_params{'action'} &&
 908                    grep { $_ eq $input_params{'action'} } @wants_base) {
 909                        $input_params{'hash_base'} ||= $refname;
 910                } else {
 911                        $input_params{'hash'} ||= $refname;
 912                }
 913        }
 914
 915        # next, handle the 'parent' part, if present
 916        if (defined $parentrefname) {
 917                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 918                # someproject/blobdiff/oldrev..newrev:/filename
 919                if ($parentpathname) {
 920                        $parentpathname =~ s,^/+,,;
 921                        $parentpathname =~ s,/$,,;
 922                        $input_params{'file_parent'} ||= $parentpathname;
 923                } else {
 924                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 925                }
 926                # we assume that hash_parent_base is wanted if a path was specified,
 927                # or if the action wants hash_base instead of hash
 928                if (defined $input_params{'file_parent'} ||
 929                        grep { $_ eq $input_params{'action'} } @wants_base) {
 930                        $input_params{'hash_parent_base'} ||= $parentrefname;
 931                } else {
 932                        $input_params{'hash_parent'} ||= $parentrefname;
 933                }
 934        }
 935
 936        # for the snapshot action, we allow URLs in the form
 937        # $project/snapshot/$hash.ext
 938        # where .ext determines the snapshot and gets removed from the
 939        # passed $refname to provide the $hash.
 940        #
 941        # To be able to tell that $refname includes the format extension, we
 942        # require the following two conditions to be satisfied:
 943        # - the hash input parameter MUST have been set from the $refname part
 944        #   of the URL (i.e. they must be equal)
 945        # - the snapshot format MUST NOT have been defined already (e.g. from
 946        #   CGI parameter sf)
 947        # It's also useless to try any matching unless $refname has a dot,
 948        # so we check for that too
 949        if (defined $input_params{'action'} &&
 950                $input_params{'action'} eq 'snapshot' &&
 951                defined $refname && index($refname, '.') != -1 &&
 952                $refname eq $input_params{'hash'} &&
 953                !defined $input_params{'snapshot_format'}) {
 954                # We loop over the known snapshot formats, checking for
 955                # extensions. Allowed extensions are both the defined suffix
 956                # (which includes the initial dot already) and the snapshot
 957                # format key itself, with a prepended dot
 958                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 959                        my $hash = $refname;
 960                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 961                                next;
 962                        }
 963                        my $sfx = $1;
 964                        # a valid suffix was found, so set the snapshot format
 965                        # and reset the hash parameter
 966                        $input_params{'snapshot_format'} = $fmt;
 967                        $input_params{'hash'} = $hash;
 968                        # we also set the format suffix to the one requested
 969                        # in the URL: this way a request for e.g. .tgz returns
 970                        # a .tgz instead of a .tar.gz
 971                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 972                        last;
 973                }
 974        }
 975}
 976
 977our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 978     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 979     $searchtext, $search_regexp);
 980sub evaluate_and_validate_params {
 981        our $action = $input_params{'action'};
 982        if (defined $action) {
 983                if (!validate_action($action)) {
 984                        die_error(400, "Invalid action parameter");
 985                }
 986        }
 987
 988        # parameters which are pathnames
 989        our $project = $input_params{'project'};
 990        if (defined $project) {
 991                if (!validate_project($project)) {
 992                        undef $project;
 993                        die_error(404, "No such project");
 994                }
 995        }
 996
 997        our $file_name = $input_params{'file_name'};
 998        if (defined $file_name) {
 999                if (!validate_pathname($file_name)) {
1000                        die_error(400, "Invalid file parameter");
1001                }
1002        }
1003
1004        our $file_parent = $input_params{'file_parent'};
1005        if (defined $file_parent) {
1006                if (!validate_pathname($file_parent)) {
1007                        die_error(400, "Invalid file parent parameter");
1008                }
1009        }
1010
1011        # parameters which are refnames
1012        our $hash = $input_params{'hash'};
1013        if (defined $hash) {
1014                if (!validate_refname($hash)) {
1015                        die_error(400, "Invalid hash parameter");
1016                }
1017        }
1018
1019        our $hash_parent = $input_params{'hash_parent'};
1020        if (defined $hash_parent) {
1021                if (!validate_refname($hash_parent)) {
1022                        die_error(400, "Invalid hash parent parameter");
1023                }
1024        }
1025
1026        our $hash_base = $input_params{'hash_base'};
1027        if (defined $hash_base) {
1028                if (!validate_refname($hash_base)) {
1029                        die_error(400, "Invalid hash base parameter");
1030                }
1031        }
1032
1033        our @extra_options = @{$input_params{'extra_options'}};
1034        # @extra_options is always defined, since it can only be (currently) set from
1035        # CGI, and $cgi->param() returns the empty array in array context if the param
1036        # is not set
1037        foreach my $opt (@extra_options) {
1038                if (not exists $allowed_options{$opt}) {
1039                        die_error(400, "Invalid option parameter");
1040                }
1041                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1042                        die_error(400, "Invalid option parameter for this action");
1043                }
1044        }
1045
1046        our $hash_parent_base = $input_params{'hash_parent_base'};
1047        if (defined $hash_parent_base) {
1048                if (!validate_refname($hash_parent_base)) {
1049                        die_error(400, "Invalid hash parent base parameter");
1050                }
1051        }
1052
1053        # other parameters
1054        our $page = $input_params{'page'};
1055        if (defined $page) {
1056                if ($page =~ m/[^0-9]/) {
1057                        die_error(400, "Invalid page parameter");
1058                }
1059        }
1060
1061        our $searchtype = $input_params{'searchtype'};
1062        if (defined $searchtype) {
1063                if ($searchtype =~ m/[^a-z]/) {
1064                        die_error(400, "Invalid searchtype parameter");
1065                }
1066        }
1067
1068        our $search_use_regexp = $input_params{'search_use_regexp'};
1069
1070        our $searchtext = $input_params{'searchtext'};
1071        our $search_regexp;
1072        if (defined $searchtext) {
1073                if (length($searchtext) < 2) {
1074                        die_error(403, "At least two characters are required for search parameter");
1075                }
1076                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
1077        }
1078}
1079
1080# path to the current git repository
1081our $git_dir;
1082sub evaluate_git_dir {
1083        our $git_dir = "$projectroot/$project" if $project;
1084}
1085
1086our (@snapshot_fmts, $git_avatar);
1087sub configure_gitweb_features {
1088        # list of supported snapshot formats
1089        our @snapshot_fmts = gitweb_get_feature('snapshot');
1090        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);
1091
1092        # check that the avatar feature is set to a known provider name,
1093        # and for each provider check if the dependencies are satisfied.
1094        # if the provider name is invalid or the dependencies are not met,
1095        # reset $git_avatar to the empty string.
1096        our ($git_avatar) = gitweb_get_feature('avatar');
1097        if ($git_avatar eq 'gravatar') {
1098                $git_avatar = '' unless (eval { require Digest::MD5; 1; });
1099        } elsif ($git_avatar eq 'picon') {
1100                # no dependencies
1101        } else {
1102                $git_avatar = '';
1103        }
1104}
1105
1106# custom error handler: 'die <message>' is Internal Server Error
1107sub handle_errors_html {
1108        my $msg = shift; # it is already HTML escaped
1109
1110        # to avoid infinite loop where error occurs in die_error,
1111        # change handler to default handler, disabling handle_errors_html
1112        set_message("Error occured when inside die_error:\n$msg");
1113
1114        # you cannot jump out of die_error when called as error handler;
1115        # the subroutine set via CGI::Carp::set_message is called _after_
1116        # HTTP headers are already written, so it cannot write them itself
1117        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
1118}
1119set_message(\&handle_errors_html);
1120
1121# dispatch
1122sub dispatch {
1123        if (!defined $action) {
1124                if (defined $hash) {
1125                        $action = git_get_type($hash);
1126                } elsif (defined $hash_base && defined $file_name) {
1127                        $action = git_get_type("$hash_base:$file_name");
1128                } elsif (defined $project) {
1129                        $action = 'summary';
1130                } else {
1131                        $action = 'project_list';
1132                }
1133        }
1134        if (!defined($actions{$action})) {
1135                die_error(400, "Unknown action");
1136        }
1137        if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
1138            !$project) {
1139                die_error(400, "Project needed");
1140        }
1141        $actions{$action}->();
1142}
1143
1144sub reset_timer {
1145        our $t0 = [ gettimeofday() ]
1146                if defined $t0;
1147        our $number_of_git_cmds = 0;
1148}
1149
1150our $first_request = 1;
1151sub run_request {
1152        reset_timer();
1153
1154        evaluate_uri();
1155        if ($first_request) {
1156                evaluate_gitweb_config();
1157                evaluate_git_version();
1158        }
1159        if ($per_request_config) {
1160                if (ref($per_request_config) eq 'CODE') {
1161                        $per_request_config->();
1162                } elsif (!$first_request) {
1163                        evaluate_gitweb_config();
1164                }
1165        }
1166        check_loadavg();
1167
1168        # $projectroot and $projects_list might be set in gitweb config file
1169        $projects_list ||= $projectroot;
1170
1171        evaluate_query_params();
1172        evaluate_path_info();
1173        evaluate_and_validate_params();
1174        evaluate_git_dir();
1175
1176        configure_gitweb_features();
1177
1178        dispatch();
1179}
1180
1181our $is_last_request = sub { 1 };
1182our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
1183our $CGI = 'CGI';
1184our $cgi;
1185sub configure_as_fcgi {
1186        require CGI::Fast;
1187        our $CGI = 'CGI::Fast';
1188
1189        my $request_number = 0;
1190        # let each child service 100 requests
1191        our $is_last_request = sub { ++$request_number > 100 };
1192}
1193sub evaluate_argv {
1194        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
1195        configure_as_fcgi()
1196                if $script_name =~ /\.fcgi$/;
1197
1198        return unless (@ARGV);
1199
1200        require Getopt::Long;
1201        Getopt::Long::GetOptions(
1202                'fastcgi|fcgi|f' => \&configure_as_fcgi,
1203                'nproc|n=i' => sub {
1204                        my ($arg, $val) = @_;
1205                        return unless eval { require FCGI::ProcManager; 1; };
1206                        my $proc_manager = FCGI::ProcManager->new({
1207                                n_processes => $val,
1208                        });
1209                        our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
1210                        our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
1211                        our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
1212                },
1213        );
1214}
1215
1216sub run {
1217        evaluate_argv();
1218
1219        $first_request = 1;
1220        $pre_listen_hook->()
1221                if $pre_listen_hook;
1222
1223 REQUEST:
1224        while ($cgi = $CGI->new()) {
1225                $pre_dispatch_hook->()
1226                        if $pre_dispatch_hook;
1227
1228                run_request();
1229
1230                $post_dispatch_hook->()
1231                        if $post_dispatch_hook;
1232                $first_request = 0;
1233
1234                last REQUEST if ($is_last_request->());
1235        }
1236
1237 DONE_GITWEB:
1238        1;
1239}
1240
1241run();
1242
1243if (defined caller) {
1244        # wrapped in a subroutine processing requests,
1245        # e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
1246        return;
1247} else {
1248        # pure CGI script, serving single request
1249        exit;
1250}
1251
1252## ======================================================================
1253## action links
1254
1255# possible values of extra options
1256# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
1257# -replay => 1      - start from a current view (replay with modifications)
1258# -path_info => 0|1 - don't use/use path_info URL (if possible)
1259# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
1260sub href {
1261        my %params = @_;
1262        # default is to use -absolute url() i.e. $my_uri
1263        my $href = $params{-full} ? $my_url : $my_uri;
1264
1265        # implicit -replay, must be first of implicit params
1266        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});
1267
1268        $params{'project'} = $project unless exists $params{'project'};
1269
1270        if ($params{-replay}) {
1271                while (my ($name, $symbol) = each %cgi_param_mapping) {
1272                        if (!exists $params{$name}) {
1273                                $params{$name} = $input_params{$name};
1274                        }
1275                }
1276        }
1277
1278        my $use_pathinfo = gitweb_check_feature('pathinfo');
1279        if (defined $params{'project'} &&
1280            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
1281                # try to put as many parameters as possible in PATH_INFO:
1282                #   - project name
1283                #   - action
1284                #   - hash_parent or hash_parent_base:/file_parent
1285                #   - hash or hash_base:/filename
1286                #   - the snapshot_format as an appropriate suffix
1287
1288                # When the script is the root DirectoryIndex for the domain,
1289                # $href here would be something like http://gitweb.example.com/
1290                # Thus, we strip any trailing / from $href, to spare us double
1291                # slashes in the final URL
1292                $href =~ s,/$,,;
1293
1294                # Then add the project name, if present
1295                $href .= "/".esc_path_info($params{'project'});
1296                delete $params{'project'};
1297
1298                # since we destructively absorb parameters, we keep this
1299                # boolean that remembers if we're handling a snapshot
1300                my $is_snapshot = $params{'action'} eq 'snapshot';
1301
1302                # Summary just uses the project path URL, any other action is
1303                # added to the URL
1304                if (defined $params{'action'}) {
1305                        $href .= "/".esc_path_info($params{'action'})
1306                                unless $params{'action'} eq 'summary';
1307                        delete $params{'action'};
1308                }
1309
1310                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
1311                # stripping nonexistent or useless pieces
1312                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
1313                        || $params{'hash_parent'} || $params{'hash'});
1314                if (defined $params{'hash_base'}) {
1315                        if (defined $params{'hash_parent_base'}) {
1316                                $href .= esc_path_info($params{'hash_parent_base'});
1317                                # skip the file_parent if it's the same as the file_name
1318                                if (defined $params{'file_parent'}) {
1319                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
1320                                                delete $params{'file_parent'};
1321                                        } elsif ($params{'file_parent'} !~ /\.\./) {
1322                                                $href .= ":/".esc_path_info($params{'file_parent'});
1323                                                delete $params{'file_parent'};
1324                                        }
1325                                }
1326                                $href .= "..";
1327                                delete $params{'hash_parent'};
1328                                delete $params{'hash_parent_base'};
1329                        } elsif (defined $params{'hash_parent'}) {
1330                                $href .= esc_path_info($params{'hash_parent'}). "..";
1331                                delete $params{'hash_parent'};
1332                        }
1333
1334                        $href .= esc_path_info($params{'hash_base'});
1335                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
1336                                $href .= ":/".esc_path_info($params{'file_name'});
1337                                delete $params{'file_name'};
1338                        }
1339                        delete $params{'hash'};
1340                        delete $params{'hash_base'};
1341                } elsif (defined $params{'hash'}) {
1342                        $href .= esc_path_info($params{'hash'});
1343                        delete $params{'hash'};
1344                }
1345
1346                # If the action was a snapshot, we can absorb the
1347                # snapshot_format parameter too
1348                if ($is_snapshot) {
1349                        my $fmt = $params{'snapshot_format'};
1350                        # snapshot_format should always be defined when href()
1351                        # is called, but just in case some code forgets, we
1352                        # fall back to the default
1353                        $fmt ||= $snapshot_fmts[0];
1354                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
1355                        delete $params{'snapshot_format'};
1356                }
1357        }
1358
1359        # now encode the parameters explicitly
1360        my @result = ();
1361        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
1362                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
1363                if (defined $params{$name}) {
1364                        if (ref($params{$name}) eq "ARRAY") {
1365                                foreach my $par (@{$params{$name}}) {
1366                                        push @result, $symbol . "=" . esc_param($par);
1367                                }
1368                        } else {
1369                                push @result, $symbol . "=" . esc_param($params{$name});
1370                        }
1371                }
1372        }
1373        $href .= "?" . join(';', @result) if scalar @result;
1374
1375        # final transformation: trailing spaces must be escaped (URI-encoded)
1376        $href =~ s/(\s+)$/CGI::escape($1)/e;
1377
1378        if ($params{-anchor}) {
1379                $href .= "#".esc_param($params{-anchor});
1380        }
1381
1382        return $href;
1383}
1384
1385
1386## ======================================================================
1387## validation, quoting/unquoting and escaping
1388
1389sub validate_action {
1390        my $input = shift || return undef;
1391        return undef unless exists $actions{$input};
1392        return $input;
1393}
1394
1395sub validate_project {
1396        my $input = shift || return undef;
1397        if (!validate_pathname($input) ||
1398                !(-d "$projectroot/$input") ||
1399                !check_export_ok("$projectroot/$input") ||
1400                ($strict_export && !project_in_list($input))) {
1401                return undef;
1402        } else {
1403                return $input;
1404        }
1405}
1406
1407sub validate_pathname {
1408        my $input = shift || return undef;
1409
1410        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
1411        # at the beginning, at the end, and between slashes.
1412        # also this catches doubled slashes
1413        if ($input =~ m!(^|/)(|\.|\.\.)(/|$)!) {
1414                return undef;
1415        }
1416        # no null characters
1417        if ($input =~ m!\0!) {
1418                return undef;
1419        }
1420        return $input;
1421}
1422
1423sub validate_refname {
1424        my $input = shift || return undef;
1425
1426        # textual hashes are O.K.
1427        if ($input =~ m/^[0-9a-fA-F]{40}$/) {
1428                return $input;
1429        }
1430        # it must be correct pathname
1431        $input = validate_pathname($input)
1432                or return undef;
1433        # restrictions on ref name according to git-check-ref-format
1434        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
1435                return undef;
1436        }
1437        return $input;
1438}
1439
1440# decode sequences of octets in utf8 into Perl's internal form,
1441# which is utf-8 with utf8 flag set if needed.  gitweb writes out
1442# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
1443sub to_utf8 {
1444        my $str = shift;
1445        return undef unless defined $str;
1446
1447        if (utf8::is_utf8($str) || utf8::decode($str)) {
1448                return $str;
1449        } else {
1450                return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
1451        }
1452}
1453
1454# quote unsafe chars, but keep the slash, even when it's not
1455# correct, but quoted slashes look too horrible in bookmarks
1456sub esc_param {
1457        my $str = shift;
1458        return undef unless defined $str;
1459        $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
1460        $str =~ s/ /\+/g;
1461        return $str;
1462}
1463
1464# the quoting rules for path_info fragment are slightly different
1465sub esc_path_info {
1466        my $str = shift;
1467        return undef unless defined $str;
1468
1469        # path_info doesn't treat '+' as space (specially), but '?' must be escaped
1470        $str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
1471
1472        return $str;
1473}
1474
1475# quote unsafe chars in whole URL, so some characters cannot be quoted
1476sub esc_url {
1477        my $str = shift;
1478        return undef unless defined $str;
1479        $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
1480        $str =~ s/ /\+/g;
1481        return $str;
1482}
1483
1484# quote unsafe characters in HTML attributes
1485sub esc_attr {
1486
1487        # for XHTML conformance escaping '"' to '&quot;' is not enough
1488        return esc_html(@_);
1489}
1490
1491# replace invalid utf8 character with SUBSTITUTION sequence
1492sub esc_html {
1493        my $str = shift;
1494        my %opts = @_;
1495
1496        return undef unless defined $str;
1497
1498        $str = to_utf8($str);
1499        $str = $cgi->escapeHTML($str);
1500        if ($opts{'-nbsp'}) {
1501                $str =~ s/ /&nbsp;/g;
1502        }
1503        $str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
1504        return $str;
1505}
1506
1507# quote control characters and escape filename to HTML
1508sub esc_path {
1509        my $str = shift;
1510        my %opts = @_;
1511
1512        return undef unless defined $str;
1513
1514        $str = to_utf8($str);
1515        $str = $cgi->escapeHTML($str);
1516        if ($opts{'-nbsp'}) {
1517                $str =~ s/ /&nbsp;/g;
1518        }
1519        $str =~ s|([[:cntrl:]])|quot_cec($1)|eg;
1520        return $str;
1521}
1522
1523# Sanitize for use in XHTML + application/xml+xhtm (valid XML 1.0)
1524sub sanitize {
1525        my $str = shift;
1526
1527        return undef unless defined $str;
1528
1529        $str = to_utf8($str);
1530        $str =~ s|([[:cntrl:]])|($1 =~ /[\t\n\r]/ ? $1 : quot_cec($1))|eg;
1531        return $str;
1532}
1533
1534# Make control characters "printable", using character escape codes (CEC)
1535sub quot_cec {
1536        my $cntrl = shift;
1537        my %opts = @_;
1538        my %es = ( # character escape codes, aka escape sequences
1539                "\t" => '\t',   # tab            (HT)
1540                "\n" => '\n',   # line feed      (LF)
1541                "\r" => '\r',   # carrige return (CR)
1542                "\f" => '\f',   # form feed      (FF)
1543                "\b" => '\b',   # backspace      (BS)
1544                "\a" => '\a',   # alarm (bell)   (BEL)
1545                "\e" => '\e',   # escape         (ESC)
1546                "\013" => '\v', # vertical tab   (VT)
1547                "\000" => '\0', # nul character  (NUL)
1548        );
1549        my $chr = ( (exists $es{$cntrl})
1550                    ? $es{$cntrl}
1551                    : sprintf('\%2x', ord($cntrl)) );
1552        if ($opts{-nohtml}) {
1553                return $chr;
1554        } else {
1555                return "<span class=\"cntrl\">$chr</span>";
1556        }
1557}
1558
1559# Alternatively use unicode control pictures codepoints,
1560# Unicode "printable representation" (PR)
1561sub quot_upr {
1562        my $cntrl = shift;
1563        my %opts = @_;
1564
1565        my $chr = sprintf('&#%04d;', 0x2400+ord($cntrl));
1566        if ($opts{-nohtml}) {
1567                return $chr;
1568        } else {
1569                return "<span class=\"cntrl\">$chr</span>";
1570        }
1571}
1572
1573# git may return quoted and escaped filenames
1574sub unquote {
1575        my $str = shift;
1576
1577        sub unq {
1578                my $seq = shift;
1579                my %es = ( # character escape codes, aka escape sequences
1580                        't' => "\t",   # tab            (HT, TAB)
1581                        'n' => "\n",   # newline        (NL)
1582                        'r' => "\r",   # return         (CR)
1583                        'f' => "\f",   # form feed      (FF)
1584                        'b' => "\b",   # backspace      (BS)
1585                        'a' => "\a",   # alarm (bell)   (BEL)
1586                        'e' => "\e",   # escape         (ESC)
1587                        'v' => "\013", # vertical tab   (VT)
1588                );
1589
1590                if ($seq =~ m/^[0-7]{1,3}$/) {
1591                        # octal char sequence
1592                        return chr(oct($seq));
1593                } elsif (exists $es{$seq}) {
1594                        # C escape sequence, aka character escape code
1595                        return $es{$seq};
1596                }
1597                # quoted ordinary character
1598                return $seq;
1599        }
1600
1601        if ($str =~ m/^"(.*)"$/) {
1602                # needs unquoting
1603                $str = $1;
1604                $str =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
1605        }
1606        return $str;
1607}
1608
1609# escape tabs (convert tabs to spaces)
1610sub untabify {
1611        my $line = shift;
1612
1613        while ((my $pos = index($line, "\t")) != -1) {
1614                if (my $count = (8 - ($pos % 8))) {
1615                        my $spaces = ' ' x $count;
1616                        $line =~ s/\t/$spaces/;
1617                }
1618        }
1619
1620        return $line;
1621}
1622
1623sub project_in_list {
1624        my $project = shift;
1625        my @list = git_get_projects_list();
1626        return @list && scalar(grep { $_->{'path'} eq $project } @list);
1627}
1628
1629## ----------------------------------------------------------------------
1630## HTML aware string manipulation
1631
1632# Try to chop given string on a word boundary between position
1633# $len and $len+$add_len. If there is no word boundary there,
1634# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
1635# (marking chopped part) would be longer than given string.
1636sub chop_str {
1637        my $str = shift;
1638        my $len = shift;
1639        my $add_len = shift || 10;
1640        my $where = shift || 'right'; # 'left' | 'center' | 'right'
1641
1642        # Make sure perl knows it is utf8 encoded so we don't
1643        # cut in the middle of a utf8 multibyte char.
1644        $str = to_utf8($str);
1645
1646        # allow only $len chars, but don't cut a word if it would fit in $add_len
1647        # if it doesn't fit, cut it if it's still longer than the dots we would add
1648        # remove chopped character entities entirely
1649
1650        # when chopping in the middle, distribute $len into left and right part
1651        # return early if chopping wouldn't make string shorter
1652        if ($where eq 'center') {
1653                return $str if ($len + 5 >= length($str)); # filler is length 5
1654                $len = int($len/2);
1655        } else {
1656                return $str if ($len + 4 >= length($str)); # filler is length 4
1657        }
1658
1659        # regexps: ending and beginning with word part up to $add_len
1660        my $endre = qr/.{$len}\w{0,$add_len}/;
1661        my $begre = qr/\w{0,$add_len}.{$len}/;
1662
1663        if ($where eq 'left') {
1664                $str =~ m/^(.*?)($begre)$/;
1665                my ($lead, $body) = ($1, $2);
1666                if (length($lead) > 4) {
1667                        $lead = " ...";
1668                }
1669                return "$lead$body";
1670
1671        } elsif ($where eq 'center') {
1672                $str =~ m/^($endre)(.*)$/;
1673                my ($left, $str)  = ($1, $2);
1674                $str =~ m/^(.*?)($begre)$/;
1675                my ($mid, $right) = ($1, $2);
1676                if (length($mid) > 5) {
1677                        $mid = " ... ";
1678                }
1679                return "$left$mid$right";
1680
1681        } else {
1682                $str =~ m/^($endre)(.*)$/;
1683                my $body = $1;
1684                my $tail = $2;
1685                if (length($tail) > 4) {
1686                        $tail = "... ";
1687                }
1688                return "$body$tail";
1689        }
1690}
1691
1692# takes the same arguments as chop_str, but also wraps a <span> around the
1693# result with a title attribute if it does get chopped. Additionally, the
1694# string is HTML-escaped.
1695sub chop_and_escape_str {
1696        my ($str) = @_;
1697
1698        my $chopped = chop_str(@_);
1699        $str = to_utf8($str);
1700        if ($chopped eq $str) {
1701                return esc_html($chopped);
1702        } else {
1703                $str =~ s/[[:cntrl:]]/?/g;
1704                return $cgi->span({-title=>$str}, esc_html($chopped));
1705        }
1706}
1707
1708## ----------------------------------------------------------------------
1709## functions returning short strings
1710
1711# CSS class for given age value (in seconds)
1712sub age_class {
1713        my $age = shift;
1714
1715        if (!defined $age) {
1716                return "noage";
1717        } elsif ($age < 60*60*2) {
1718                return "age0";
1719        } elsif ($age < 60*60*24*2) {
1720                return "age1";
1721        } else {
1722                return "age2";
1723        }
1724}
1725
1726# convert age in seconds to "nn units ago" string
1727sub age_string {
1728        my $age = shift;
1729        my $age_str;
1730
1731        if ($age > 60*60*24*365*2) {
1732                $age_str = (int $age/60/60/24/365);
1733                $age_str .= " years ago";
1734        } elsif ($age > 60*60*24*(365/12)*2) {
1735                $age_str = int $age/60/60/24/(365/12);
1736                $age_str .= " months ago";
1737        } elsif ($age > 60*60*24*7*2) {
1738                $age_str = int $age/60/60/24/7;
1739                $age_str .= " weeks ago";
1740        } elsif ($age > 60*60*24*2) {
1741                $age_str = int $age/60/60/24;
1742                $age_str .= " days ago";
1743        } elsif ($age > 60*60*2) {
1744                $age_str = int $age/60/60;
1745                $age_str .= " hours ago";
1746        } elsif ($age > 60*2) {
1747                $age_str = int $age/60;
1748                $age_str .= " min ago";
1749        } elsif ($age > 2) {
1750                $age_str = int $age;
1751                $age_str .= " sec ago";
1752        } else {
1753                $age_str .= " right now";
1754        }
1755        return $age_str;
1756}
1757
1758use constant {
1759        S_IFINVALID => 0030000,
1760        S_IFGITLINK => 0160000,
1761};
1762
1763# submodule/subproject, a commit object reference
1764sub S_ISGITLINK {
1765        my $mode = shift;
1766
1767        return (($mode & S_IFMT) == S_IFGITLINK)
1768}
1769
1770# convert file mode in octal to symbolic file mode string
1771sub mode_str {
1772        my $mode = oct shift;
1773
1774        if (S_ISGITLINK($mode)) {
1775                return 'm---------';
1776        } elsif (S_ISDIR($mode & S_IFMT)) {
1777                return 'drwxr-xr-x';
1778        } elsif (S_ISLNK($mode)) {
1779                return 'lrwxrwxrwx';
1780        } elsif (S_ISREG($mode)) {
1781                # git cares only about the executable bit
1782                if ($mode & S_IXUSR) {
1783                        return '-rwxr-xr-x';
1784                } else {
1785                        return '-rw-r--r--';
1786                };
1787        } else {
1788                return '----------';
1789        }
1790}
1791
1792# convert file mode in octal to file type string
1793sub file_type {
1794        my $mode = shift;
1795
1796        if ($mode !~ m/^[0-7]+$/) {
1797                return $mode;
1798        } else {
1799                $mode = oct $mode;
1800        }
1801
1802        if (S_ISGITLINK($mode)) {
1803                return "submodule";
1804        } elsif (S_ISDIR($mode & S_IFMT)) {
1805                return "directory";
1806        } elsif (S_ISLNK($mode)) {
1807                return "symlink";
1808        } elsif (S_ISREG($mode)) {
1809                return "file";
1810        } else {
1811                return "unknown";
1812        }
1813}
1814
1815# convert file mode in octal to file type description string
1816sub file_type_long {
1817        my $mode = shift;
1818
1819        if ($mode !~ m/^[0-7]+$/) {
1820                return $mode;
1821        } else {
1822                $mode = oct $mode;
1823        }
1824
1825        if (S_ISGITLINK($mode)) {
1826                return "submodule";
1827        } elsif (S_ISDIR($mode & S_IFMT)) {
1828                return "directory";
1829        } elsif (S_ISLNK($mode)) {
1830                return "symlink";
1831        } elsif (S_ISREG($mode)) {
1832                if ($mode & S_IXUSR) {
1833                        return "executable";
1834                } else {
1835                        return "file";
1836                };
1837        } else {
1838                return "unknown";
1839        }
1840}
1841
1842
1843## ----------------------------------------------------------------------
1844## functions returning short HTML fragments, or transforming HTML fragments
1845## which don't belong to other sections
1846
1847# format line of commit message.
1848sub format_log_line_html {
1849        my $line = shift;
1850
1851        $line = esc_html($line, -nbsp=>1);
1852        $line =~ s{\b([0-9a-fA-F]{8,40})\b}{
1853                $cgi->a({-href => href(action=>"object", hash=>$1),
1854                                        -class => "text"}, $1);
1855        }eg;
1856
1857        return $line;
1858}
1859
1860# format marker of refs pointing to given object
1861
1862# the destination action is chosen based on object type and current context:
1863# - for annotated tags, we choose the tag view unless it's the current view
1864#   already, in which case we go to shortlog view
1865# - for other refs, we keep the current view if we're in history, shortlog or
1866#   log view, and select shortlog otherwise
1867sub format_ref_marker {
1868        my ($refs, $id) = @_;
1869        my $markers = '';
1870
1871        if (defined $refs->{$id}) {
1872                foreach my $ref (@{$refs->{$id}}) {
1873                        # this code exploits the fact that non-lightweight tags are the
1874                        # only indirect objects, and that they are the only objects for which
1875                        # we want to use tag instead of shortlog as action
1876                        my ($type, $name) = qw();
1877                        my $indirect = ($ref =~ s/\^\{\}$//);
1878                        # e.g. tags/v2.6.11 or heads/next
1879                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
1880                                $type = $1;
1881                                $name = $2;
1882                        } else {
1883                                $type = "ref";
1884                                $name = $ref;
1885                        }
1886
1887                        my $class = $type;
1888                        $class .= " indirect" if $indirect;
1889
1890                        my $dest_action = "shortlog";
1891
1892                        if ($indirect) {
1893                                $dest_action = "tag" unless $action eq "tag";
1894                        } elsif ($action =~ /^(history|(short)?log)$/) {
1895                                $dest_action = $action;
1896                        }
1897
1898                        my $dest = "";
1899                        $dest .= "refs/" unless $ref =~ m!^refs/!;
1900                        $dest .= $ref;
1901
1902                        my $link = $cgi->a({
1903                                -href => href(
1904                                        action=>$dest_action,
1905                                        hash=>$dest
1906                                )}, $name);
1907
1908                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
1909                                $link . "</span>";
1910                }
1911        }
1912
1913        if ($markers) {
1914                return ' <span class="refs">'. $markers . '</span>';
1915        } else {
1916                return "";
1917        }
1918}
1919
1920# format, perhaps shortened and with markers, title line
1921sub format_subject_html {
1922        my ($long, $short, $href, $extra) = @_;
1923        $extra = '' unless defined($extra);
1924
1925        if (length($short) < length($long)) {
1926                $long =~ s/[[:cntrl:]]/?/g;
1927                return $cgi->a({-href => $href, -class => "list subject",
1928                                -title => to_utf8($long)},
1929                       esc_html($short)) . $extra;
1930        } else {
1931                return $cgi->a({-href => $href, -class => "list subject"},
1932                       esc_html($long)) . $extra;
1933        }
1934}
1935
1936# Rather than recomputing the url for an email multiple times, we cache it
1937# after the first hit. This gives a visible benefit in views where the avatar
1938# for the same email is used repeatedly (e.g. shortlog).
1939# The cache is shared by all avatar engines (currently gravatar only), which
1940# are free to use it as preferred. Since only one avatar engine is used for any
1941# given page, there's no risk for cache conflicts.
1942our %avatar_cache = ();
1943
1944# Compute the picon url for a given email, by using the picon search service over at
1945# http://www.cs.indiana.edu/picons/search.html
1946sub picon_url {
1947        my $email = lc shift;
1948        if (!$avatar_cache{$email}) {
1949                my ($user, $domain) = split('@', $email);
1950                $avatar_cache{$email} =
1951                        "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
1952                        "$domain/$user/" .
1953                        "users+domains+unknown/up/single";
1954        }
1955        return $avatar_cache{$email};
1956}
1957
1958# Compute the gravatar url for a given email, if it's not in the cache already.
1959# Gravatar stores only the part of the URL before the size, since that's the
1960# one computationally more expensive. This also allows reuse of the cache for
1961# different sizes (for this particular engine).
1962sub gravatar_url {
1963        my $email = lc shift;
1964        my $size = shift;
1965        $avatar_cache{$email} ||=
1966                "http://www.gravatar.com/avatar/" .
1967                        Digest::MD5::md5_hex($email) . "?s=";
1968        return $avatar_cache{$email} . $size;
1969}
1970
1971# Insert an avatar for the given $email at the given $size if the feature
1972# is enabled.
1973sub git_get_avatar {
1974        my ($email, %opts) = @_;
1975        my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
1976        my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
1977        $opts{-size} ||= 'default';
1978        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};
1979        my $url = "";
1980        if ($git_avatar eq 'gravatar') {
1981                $url = gravatar_url($email, $size);
1982        } elsif ($git_avatar eq 'picon') {
1983                $url = picon_url($email);
1984        }
1985        # Other providers can be added by extending the if chain, defining $url
1986        # as needed. If no variant puts something in $url, we assume avatars
1987        # are completely disabled/unavailable.
1988        if ($url) {
1989                return $pre_white .
1990                       "<img width=\"$size\" " .
1991                            "class=\"avatar\" " .
1992                            "src=\"".esc_url($url)."\" " .
1993                            "alt=\"\" " .
1994                       "/>" . $post_white;
1995        } else {
1996                return "";
1997        }
1998}
1999
2000sub format_search_author {
2001        my ($author, $searchtype, $displaytext) = @_;
2002        my $have_search = gitweb_check_feature('search');
2003
2004        if ($have_search) {
2005                my $performed = "";
2006                if ($searchtype eq 'author') {
2007                        $performed = "authored";
2008                } elsif ($searchtype eq 'committer') {
2009                        $performed = "committed";
2010                }
2011
2012                return $cgi->a({-href => href(action=>"search", hash=>$hash,
2013                                searchtext=>$author,
2014                                searchtype=>$searchtype), class=>"list",
2015                                title=>"Search for commits $performed by $author"},
2016                                $displaytext);
2017
2018        } else {
2019                return $displaytext;
2020        }
2021}
2022
2023# format the author name of the given commit with the given tag
2024# the author name is chopped and escaped according to the other
2025# optional parameters (see chop_str).
2026sub format_author_html {
2027        my $tag = shift;
2028        my $co = shift;
2029        my $author = chop_and_escape_str($co->{'author_name'}, @_);
2030        return "<$tag class=\"author\">" .
2031               format_search_author($co->{'author_name'}, "author",
2032                       git_get_avatar($co->{'author_email'}, -pad_after => 1) .
2033                       $author) .
2034               "</$tag>";
2035}
2036
2037# format git diff header line, i.e. "diff --(git|combined|cc) ..."
2038sub format_git_diff_header_line {
2039        my $line = shift;
2040        my $diffinfo = shift;
2041        my ($from, $to) = @_;
2042
2043        if ($diffinfo->{'nparents'}) {
2044                # combined diff
2045                $line =~ s!^(diff (.*?) )"?.*$!$1!;
2046                if ($to->{'href'}) {
2047                        $line .= $cgi->a({-href => $to->{'href'}, -class => "path"},
2048                                         esc_path($to->{'file'}));
2049                } else { # file was deleted (no href)
2050                        $line .= esc_path($to->{'file'});
2051                }
2052        } else {
2053                # "ordinary" diff
2054                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
2055                if ($from->{'href'}) {
2056                        $line .= $cgi->a({-href => $from->{'href'}, -class => "path"},
2057                                         'a/' . esc_path($from->{'file'}));
2058                } else { # file was added (no href)
2059                        $line .= 'a/' . esc_path($from->{'file'});
2060                }
2061                $line .= ' ';
2062                if ($to->{'href'}) {
2063                        $line .= $cgi->a({-href => $to->{'href'}, -class => "path"},
2064                                         'b/' . esc_path($to->{'file'}));
2065                } else { # file was deleted
2066                        $line .= 'b/' . esc_path($to->{'file'});
2067                }
2068        }
2069
2070        return "<div class=\"diff header\">$line</div>\n";
2071}
2072
2073# format extended diff header line, before patch itself
2074sub format_extended_diff_header_line {
2075        my $line = shift;
2076        my $diffinfo = shift;
2077        my ($from, $to) = @_;
2078
2079        # match <path>
2080        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
2081                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
2082                                       esc_path($from->{'file'}));
2083        }
2084        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
2085                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
2086                                 esc_path($to->{'file'}));
2087        }
2088        # match single <mode>
2089        if ($line =~ m/\s(\d{6})$/) {
2090                $line .= '<span class="info"> (' .
2091                         file_type_long($1) .
2092                         ')</span>';
2093        }
2094        # match <hash>
2095        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
2096                # can match only for combined diff
2097                $line = 'index ';
2098                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
2099                        if ($from->{'href'}[$i]) {
2100                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
2101                                                  -class=>"hash"},
2102                                                 substr($diffinfo->{'from_id'}[$i],0,7));
2103                        } else {
2104                                $line .= '0' x 7;
2105                        }
2106                        # separator
2107                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
2108                }
2109                $line .= '..';
2110                if ($to->{'href'}) {
2111                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
2112                                         substr($diffinfo->{'to_id'},0,7));
2113                } else {
2114                        $line .= '0' x 7;
2115                }
2116
2117        } elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
2118                # can match only for ordinary diff
2119                my ($from_link, $to_link);
2120                if ($from->{'href'}) {
2121                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
2122                                             substr($diffinfo->{'from_id'},0,7));
2123                } else {
2124                        $from_link = '0' x 7;
2125                }
2126                if ($to->{'href'}) {
2127                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
2128                                           substr($diffinfo->{'to_id'},0,7));
2129                } else {
2130                        $to_link = '0' x 7;
2131                }
2132                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
2133                $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
2134        }
2135
2136        return $line . "<br/>\n";
2137}
2138
2139# format from-file/to-file diff header
2140sub format_diff_from_to_header {
2141        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
2142        my $line;
2143        my $result = '';
2144
2145        $line = $from_line;
2146        #assert($line =~ m/^---/) if DEBUG;
2147        # no extra formatting for "^--- /dev/null"
2148        if (! $diffinfo->{'nparents'}) {
2149                # ordinary (single parent) diff
2150                if ($line =~ m!^--- "?a/!) {
2151                        if ($from->{'href'}) {
2152                                $line = '--- a/' .
2153                                        $cgi->a({-href=>$from->{'href'}, -class=>"path"},
2154                                                esc_path($from->{'file'}));
2155                        } else {
2156                                $line = '--- a/' .
2157                                        esc_path($from->{'file'});
2158                        }
2159                }
2160                $result .= qq!<div class="diff from_file">$line</div>\n!;
2161
2162        } else {
2163                # combined diff (merge commit)
2164                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
2165                        if ($from->{'href'}[$i]) {
2166                                $line = '--- ' .
2167                                        $cgi->a({-href=>href(action=>"blobdiff",
2168                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
2169                                                             hash_parent_base=>$parents[$i],
2170                                                             file_parent=>$from->{'file'}[$i],
2171                                                             hash=>$diffinfo->{'to_id'},
2172                                                             hash_base=>$hash,
2173                                                             file_name=>$to->{'file'}),
2174                                                 -class=>"path",
2175                                                 -title=>"diff" . ($i+1)},
2176                                                $i+1) .
2177                                        '/' .
2178                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
2179                                                esc_path($from->{'file'}[$i]));
2180                        } else {
2181                                $line = '--- /dev/null';
2182                        }
2183                        $result .= qq!<div class="diff from_file">$line</div>\n!;
2184                }
2185        }
2186
2187        $line = $to_line;
2188        #assert($line =~ m/^\+\+\+/) if DEBUG;
2189        # no extra formatting for "^+++ /dev/null"
2190        if ($line =~ m!^\+\+\+ "?b/!) {
2191                if ($to->{'href'}) {
2192                        $line = '+++ b/' .
2193                                $cgi->a({-href=>$to->{'href'}, -class=>"path"},
2194                                        esc_path($to->{'file'}));
2195                } else {
2196                        $line = '+++ b/' .
2197                                esc_path($to->{'file'});
2198                }
2199        }
2200        $result .= qq!<div class="diff to_file">$line</div>\n!;
2201
2202        return $result;
2203}
2204
2205# create note for patch simplified by combined diff
2206sub format_diff_cc_simplified {
2207        my ($diffinfo, @parents) = @_;
2208        my $result = '';
2209
2210        $result .= "<div class=\"diff header\">" .
2211                   "diff --cc ";
2212        if (!is_deleted($diffinfo)) {
2213                $result .= $cgi->a({-href => href(action=>"blob",
2214                                                  hash_base=>$hash,
2215                                                  hash=>$diffinfo->{'to_id'},
2216                                                  file_name=>$diffinfo->{'to_file'}),
2217                                    -class => "path"},
2218                                   esc_path($diffinfo->{'to_file'}));
2219        } else {
2220                $result .= esc_path($diffinfo->{'to_file'});
2221        }
2222        $result .= "</div>\n" . # class="diff header"
2223                   "<div class=\"diff nodifferences\">" .
2224                   "Simple merge" .
2225                   "</div>\n"; # class="diff nodifferences"
2226
2227        return $result;
2228}
2229
2230sub diff_line_class {
2231        my ($line, $from, $to) = @_;
2232
2233        # ordinary diff
2234        my $num_sign = 1;
2235        # combined diff
2236        if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
2237                $num_sign = scalar @{$from->{'href'}};
2238        }
2239
2240        my @diff_line_classifier = (
2241                { regexp => qr/^\@\@{$num_sign} /, class => "chunk_header"},
2242                { regexp => qr/^\\/,               class => "incomplete"  },
2243                { regexp => qr/^ {$num_sign}/,     class => "ctx" },
2244                # classifier for context must come before classifier add/rem,
2245                # or we would have to use more complicated regexp, for example
2246                # qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
2247                { regexp => qr/^[+ ]{$num_sign}/,   class => "add" },
2248                { regexp => qr/^[- ]{$num_sign}/,   class => "rem" },
2249        );
2250        for my $clsfy (@diff_line_classifier) {
2251                return $clsfy->{'class'}
2252                        if ($line =~ $clsfy->{'regexp'});
2253        }
2254
2255        # fallback
2256        return "";
2257}
2258
2259# assumes that $from and $to are defined and correctly filled,
2260# and that $line holds a line of chunk header for unified diff
2261sub format_unidiff_chunk_header {
2262        my ($line, $from, $to) = @_;
2263
2264        my ($from_text, $from_start, $from_lines, $to_text, $to_start, $to_lines, $section) =
2265                $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;
2266
2267        $from_lines = 0 unless defined $from_lines;
2268        $to_lines   = 0 unless defined $to_lines;
2269
2270        if ($from->{'href'}) {
2271                $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
2272                                     -class=>"list"}, $from_text);
2273        }
2274        if ($to->{'href'}) {
2275                $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
2276                                     -class=>"list"}, $to_text);
2277        }
2278        $line = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
2279                "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
2280        return $line;
2281}
2282
2283# assumes that $from and $to are defined and correctly filled,
2284# and that $line holds a line of chunk header for combined diff
2285sub format_cc_diff_chunk_header {
2286        my ($line, $from, $to) = @_;
2287
2288        my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;
2289        my (@from_text, @from_start, @from_nlines, $to_text, $to_start, $to_nlines);
2290
2291        @from_text = split(' ', $ranges);
2292        for (my $i = 0; $i < @from_text; ++$i) {
2293                ($from_start[$i], $from_nlines[$i]) =
2294                        (split(',', substr($from_text[$i], 1)), 0);
2295        }
2296
2297        $to_text   = pop @from_text;
2298        $to_start  = pop @from_start;
2299        $to_nlines = pop @from_nlines;
2300
2301        $line = "<span class=\"chunk_info\">$prefix ";
2302        for (my $i = 0; $i < @from_text; ++$i) {
2303                if ($from->{'href'}[$i]) {
2304                        $line .= $cgi->a({-href=>"$from->{'href'}[$i]#l$from_start[$i]",
2305                                          -class=>"list"}, $from_text[$i]);
2306                } else {
2307                        $line .= $from_text[$i];
2308                }
2309                $line .= " ";
2310        }
2311        if ($to->{'href'}) {
2312                $line .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
2313                                  -class=>"list"}, $to_text);
2314        } else {
2315                $line .= $to_text;
2316        }
2317        $line .= " $prefix</span>" .
2318                 "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
2319        return $line;
2320}
2321
2322# process patch (diff) line (not to be used for diff headers),
2323# returning class and HTML-formatted (but not wrapped) line
2324sub process_diff_line {
2325        my $line = shift;
2326        my ($from, $to) = @_;
2327
2328        my $diff_class = diff_line_class($line, $from, $to);
2329
2330        chomp $line;
2331        $line = untabify($line);
2332
2333        if ($from && $to && $line =~ m/^\@{2} /) {
2334                $line = format_unidiff_chunk_header($line, $from, $to);
2335                return $diff_class, $line;
2336
2337        } elsif ($from && $to && $line =~ m/^\@{3}/) {
2338                $line = format_cc_diff_chunk_header($line, $from, $to);
2339                return $diff_class, $line;
2340
2341        }
2342        return $diff_class, esc_html($line, -nbsp=>1);
2343}
2344
2345# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
2346# linked.  Pass the hash of the tree/commit to snapshot.
2347sub format_snapshot_links {
2348        my ($hash) = @_;
2349        my $num_fmts = @snapshot_fmts;
2350        if ($num_fmts > 1) {
2351                # A parenthesized list of links bearing format names.
2352                # e.g. "snapshot (_tar.gz_ _zip_)"
2353                return "snapshot (" . join(' ', map
2354                        $cgi->a({
2355                                -href => href(
2356                                        action=>"snapshot",
2357                                        hash=>$hash,
2358                                        snapshot_format=>$_
2359                                )
2360                        }, $known_snapshot_formats{$_}{'display'})
2361                , @snapshot_fmts) . ")";
2362        } elsif ($num_fmts == 1) {
2363                # A single "snapshot" link whose tooltip bears the format name.
2364                # i.e. "_snapshot_"
2365                my ($fmt) = @snapshot_fmts;
2366                return
2367                        $cgi->a({
2368                                -href => href(
2369                                        action=>"snapshot",
2370                                        hash=>$hash,
2371                                        snapshot_format=>$fmt
2372                                ),
2373                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
2374                        }, "snapshot");
2375        } else { # $num_fmts == 0
2376                return undef;
2377        }
2378}
2379
2380## ......................................................................
2381## functions returning values to be passed, perhaps after some
2382## transformation, to other functions; e.g. returning arguments to href()
2383
2384# returns hash to be passed to href to generate gitweb URL
2385# in -title key it returns description of link
2386sub get_feed_info {
2387        my $format = shift || 'Atom';
2388        my %res = (action => lc($format));
2389
2390        # feed links are possible only for project views
2391        return unless (defined $project);
2392        # some views should link to OPML, or to generic project feed,
2393        # or don't have specific feed yet (so they should use generic)
2394        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);
2395
2396        my $branch;
2397        # branches refs uses 'refs/heads/' prefix (fullname) to differentiate
2398        # from tag links; this also makes possible to detect branch links
2399        if ((defined $hash_base && $hash_base =~ m!^refs/heads/(.*)$!) ||
2400            (defined $hash      && $hash      =~ m!^refs/heads/(.*)$!)) {
2401                $branch = $1;
2402        }
2403        # find log type for feed description (title)
2404        my $type = 'log';
2405        if (defined $file_name) {
2406                $type  = "history of $file_name";
2407                $type .= "/" if ($action eq 'tree');
2408                $type .= " on '$branch'" if (defined $branch);
2409        } else {
2410                $type = "log of $branch" if (defined $branch);
2411        }
2412
2413        $res{-title} = $type;
2414        $res{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
2415        $res{'file_name'} = $file_name;
2416
2417        return %res;
2418}
2419
2420## ----------------------------------------------------------------------
2421## git utility subroutines, invoking git commands
2422
2423# returns path to the core git executable and the --git-dir parameter as list
2424sub git_cmd {
2425        $number_of_git_cmds++;
2426        return $GIT, '--git-dir='.$git_dir;
2427}
2428
2429# quote the given arguments for passing them to the shell
2430# quote_command("command", "arg 1", "arg with ' and ! characters")
2431# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
2432# Try to avoid using this function wherever possible.
2433sub quote_command {
2434        return join(' ',
2435                map { my $a = $_; $a =~ s/(['!])/'\\$1'/g; "'$a'" } @_ );
2436}
2437
2438# get HEAD ref of given project as hash
2439sub git_get_head_hash {
2440        return git_get_full_hash(shift, 'HEAD');
2441}
2442
2443sub git_get_full_hash {
2444        return git_get_hash(@_);
2445}
2446
2447sub git_get_short_hash {
2448        return git_get_hash(@_, '--short=7');
2449}
2450
2451sub git_get_hash {
2452        my ($project, $hash, @options) = @_;
2453        my $o_git_dir = $git_dir;
2454        my $retval = undef;
2455        $git_dir = "$projectroot/$project";
2456        if (open my $fd, '-|', git_cmd(), 'rev-parse',
2457            '--verify', '-q', @options, $hash) {
2458                $retval = <$fd>;
2459                chomp $retval if defined $retval;
2460                close $fd;
2461        }
2462        if (defined $o_git_dir) {
2463                $git_dir = $o_git_dir;
2464        }
2465        return $retval;
2466}
2467
2468# get type of given object
2469sub git_get_type {
2470        my $hash = shift;
2471
2472        open my $fd, "-|", git_cmd(), "cat-file", '-t', $hash or return;
2473        my $type = <$fd>;
2474        close $fd or return;
2475        chomp $type;
2476        return $type;
2477}
2478
2479# repository configuration
2480our $config_file = '';
2481our %config;
2482
2483# store multiple values for single key as anonymous array reference
2484# single values stored directly in the hash, not as [ <value> ]
2485sub hash_set_multi {
2486        my ($hash, $key, $value) = @_;
2487
2488        if (!exists $hash->{$key}) {
2489                $hash->{$key} = $value;
2490        } elsif (!ref $hash->{$key}) {
2491                $hash->{$key} = [ $hash->{$key}, $value ];
2492        } else {
2493                push @{$hash->{$key}}, $value;
2494        }
2495}
2496
2497# return hash of git project configuration
2498# optionally limited to some section, e.g. 'gitweb'
2499sub git_parse_project_config {
2500        my $section_regexp = shift;
2501        my %config;
2502
2503        local $/ = "\0";
2504
2505        open my $fh, "-|", git_cmd(), "config", '-z', '-l',
2506                or return;
2507
2508        while (my $keyval = <$fh>) {
2509                chomp $keyval;
2510                my ($key, $value) = split(/\n/, $keyval, 2);
2511
2512                hash_set_multi(\%config, $key, $value)
2513                        if (!defined $section_regexp || $key =~ /^(?:$section_regexp)\./o);
2514        }
2515        close $fh;
2516
2517        return %config;
2518}
2519
2520# convert config value to boolean: 'true' or 'false'
2521# no value, number > 0, 'true' and 'yes' values are true
2522# rest of values are treated as false (never as error)
2523sub config_to_bool {
2524        my $val = shift;
2525
2526        return 1 if !defined $val;             # section.key
2527
2528        # strip leading and trailing whitespace
2529        $val =~ s/^\s+//;
2530        $val =~ s/\s+$//;
2531
2532        return (($val =~ /^\d+$/ && $val) ||   # section.key = 1
2533                ($val =~ /^(?:true|yes)$/i));  # section.key = true
2534}
2535
2536# convert config value to simple decimal number
2537# an optional value suffix of 'k', 'm', or 'g' will cause the value
2538# to be multiplied by 1024, 1048576, or 1073741824
2539sub config_to_int {
2540        my $val = shift;
2541
2542        # strip leading and trailing whitespace
2543        $val =~ s/^\s+//;
2544        $val =~ s/\s+$//;
2545
2546        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
2547                $unit = lc($unit);
2548                # unknown unit is treated as 1
2549                return $num * ($unit eq 'g' ? 1073741824 :
2550                               $unit eq 'm' ?    1048576 :
2551                               $unit eq 'k' ?       1024 : 1);
2552        }
2553        return $val;
2554}
2555
2556# convert config value to array reference, if needed
2557sub config_to_multi {
2558        my $val = shift;
2559
2560        return ref($val) ? $val : (defined($val) ? [ $val ] : []);
2561}
2562
2563sub git_get_project_config {
2564        my ($key, $type) = @_;
2565
2566        return unless defined $git_dir;
2567
2568        # key sanity check
2569        return unless ($key);
2570        # only subsection, if exists, is case sensitive,
2571        # and not lowercased by 'git config -z -l'
2572        if (my ($hi, $mi, $lo) = ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/)) {
2573                $key = join(".", lc($hi), $mi, lc($lo));
2574        } else {
2575                $key = lc($key);
2576        }
2577        $key =~ s/^gitweb\.//;
2578        return if ($key =~ m/\W/);
2579
2580        # type sanity check
2581        if (defined $type) {
2582                $type =~ s/^--//;
2583                $type = undef
2584                        unless ($type eq 'bool' || $type eq 'int');
2585        }
2586
2587        # get config
2588        if (!defined $config_file ||
2589            $config_file ne "$git_dir/config") {
2590                %config = git_parse_project_config('gitweb');
2591                $config_file = "$git_dir/config";
2592        }
2593
2594        # check if config variable (key) exists
2595        return unless exists $config{"gitweb.$key"};
2596
2597        # ensure given type
2598        if (!defined $type) {
2599                return $config{"gitweb.$key"};
2600        } elsif ($type eq 'bool') {
2601                # backward compatibility: 'git config --bool' returns true/false
2602                return config_to_bool($config{"gitweb.$key"}) ? 'true' : 'false';
2603        } elsif ($type eq 'int') {
2604                return config_to_int($config{"gitweb.$key"});
2605        }
2606        return $config{"gitweb.$key"};
2607}
2608
2609# get hash of given path at given ref
2610sub git_get_hash_by_path {
2611        my $base = shift;
2612        my $path = shift || return undef;
2613        my $type = shift;
2614
2615        $path =~ s,/+$,,;
2616
2617        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
2618                or die_error(500, "Open git-ls-tree failed");
2619        my $line = <$fd>;
2620        close $fd or return undef;
2621
2622        if (!defined $line) {
2623                # there is no tree or hash given by $path at $base
2624                return undef;
2625        }
2626
2627        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
2628        $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/;
2629        if (defined $type && $type ne $2) {
2630                # type doesn't match
2631                return undef;
2632        }
2633        return $3;
2634}
2635
2636# get path of entry with given hash at given tree-ish (ref)
2637# used to get 'from' filename for combined diff (merge commit) for renames
2638sub git_get_path_by_hash {
2639        my $base = shift || return;
2640        my $hash = shift || return;
2641
2642        local $/ = "\0";
2643
2644        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
2645                or return undef;
2646        while (my $line = <$fd>) {
2647                chomp $line;
2648
2649                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
2650                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
2651                if ($line =~ m/(?:[0-9]+) (?:.+) $hash\t(.+)$/) {
2652                        close $fd;
2653                        return $1;
2654                }
2655        }
2656        close $fd;
2657        return undef;
2658}
2659
2660## ......................................................................
2661## git utility functions, directly accessing git repository
2662
2663# get the value of config variable either from file named as the variable
2664# itself in the repository ($GIT_DIR/$name file), or from gitweb.$name
2665# configuration variable in the repository config file.
2666sub git_get_file_or_project_config {
2667        my ($path, $name) = @_;
2668
2669        $git_dir = "$projectroot/$path";
2670        open my $fd, '<', "$git_dir/$name"
2671                or return git_get_project_config($name);
2672        my $conf = <$fd>;
2673        close $fd;
2674        if (defined $conf) {
2675                chomp $conf;
2676        }
2677        return $conf;
2678}
2679
2680sub git_get_project_description {
2681        my $path = shift;
2682        return git_get_file_or_project_config($path, 'description');
2683}
2684
2685sub git_get_project_category {
2686        my $path = shift;
2687        return git_get_file_or_project_config($path, 'category');
2688}
2689
2690
2691# supported formats:
2692# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
2693#   - if its contents is a number, use it as tag weight,
2694#   - otherwise add a tag with weight 1
2695# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
2696#   the same value multiple times increases tag weight
2697# * `gitweb.ctag' multi-valued repo config variable
2698sub git_get_project_ctags {
2699        my $project = shift;
2700        my $ctags = {};
2701
2702        $git_dir = "$projectroot/$project";
2703        if (opendir my $dh, "$git_dir/ctags") {
2704                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
2705                foreach my $tagfile (@files) {
2706                        open my $ct, '<', $tagfile
2707                                or next;
2708                        my $val = <$ct>;
2709                        chomp $val if $val;
2710                        close $ct;
2711
2712                        (my $ctag = $tagfile) =~ s#.*/##;
2713                        if ($val =~ /^\d+$/) {
2714                                $ctags->{$ctag} = $val;
2715                        } else {
2716                                $ctags->{$ctag} = 1;
2717                        }
2718                }
2719                closedir $dh;
2720
2721        } elsif (open my $fh, '<', "$git_dir/ctags") {
2722                while (my $line = <$fh>) {
2723                        chomp $line;
2724                        $ctags->{$line}++ if $line;
2725                }
2726                close $fh;
2727
2728        } else {
2729                my $taglist = config_to_multi(git_get_project_config('ctag'));
2730                foreach my $tag (@$taglist) {
2731                        $ctags->{$tag}++;
2732                }
2733        }
2734
2735        return $ctags;
2736}
2737
2738# return hash, where keys are content tags ('ctags'),
2739# and values are sum of weights of given tag in every project
2740sub git_gather_all_ctags {
2741        my $projects = shift;
2742        my $ctags = {};
2743
2744        foreach my $p (@$projects) {
2745                foreach my $ct (keys %{$p->{'ctags'}}) {
2746                        $ctags->{$ct} += $p->{'ctags'}->{$ct};
2747                }
2748        }
2749
2750        return $ctags;
2751}
2752
2753sub git_populate_project_tagcloud {
2754        my $ctags = shift;
2755
2756        # First, merge different-cased tags; tags vote on casing
2757        my %ctags_lc;
2758        foreach (keys %$ctags) {
2759                $ctags_lc{lc $_}->{count} += $ctags->{$_};
2760                if (not $ctags_lc{lc $_}->{topcount}
2761                    or $ctags_lc{lc $_}->{topcount} < $ctags->{$_}) {
2762                        $ctags_lc{lc $_}->{topcount} = $ctags->{$_};
2763                        $ctags_lc{lc $_}->{topname} = $_;
2764                }
2765        }
2766
2767        my $cloud;
2768        my $matched = $cgi->param('by_tag');
2769        if (eval { require HTML::TagCloud; 1; }) {
2770                $cloud = HTML::TagCloud->new;
2771                foreach my $ctag (sort keys %ctags_lc) {
2772                        # Pad the title with spaces so that the cloud looks
2773                        # less crammed.
2774                        my $title = esc_html($ctags_lc{$ctag}->{topname});
2775                        $title =~ s/ /&nbsp;/g;
2776                        $title =~ s/^/&nbsp;/g;
2777                        $title =~ s/$/&nbsp;/g;
2778                        if (defined $matched && $matched eq $ctag) {
2779                                $title = qq(<span class="match">$title</span>);
2780                        }
2781                        $cloud->add($title, href(project=>undef, ctag=>$ctag),
2782                                    $ctags_lc{$ctag}->{count});
2783                }
2784        } else {
2785                $cloud = {};
2786                foreach my $ctag (keys %ctags_lc) {
2787                        my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
2788                        if (defined $matched && $matched eq $ctag) {
2789                                $title = qq(<span class="match">$title</span>);
2790                        }
2791                        $cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
2792                        $cloud->{$ctag}{ctag} =
2793                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
2794                }
2795        }
2796        return $cloud;
2797}
2798
2799sub git_show_project_tagcloud {
2800        my ($cloud, $count) = @_;
2801        if (ref $cloud eq 'HTML::TagCloud') {
2802                return $cloud->html_and_css($count);
2803        } else {
2804                my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
2805                return
2806                        '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
2807                        join (', ', map {
2808                                $cloud->{$_}->{'ctag'}
2809                        } splice(@tags, 0, $count)) .
2810                        '</div>';
2811        }
2812}
2813
2814sub git_get_project_url_list {
2815        my $path = shift;
2816
2817        $git_dir = "$projectroot/$path";
2818        open my $fd, '<', "$git_dir/cloneurl"
2819                or return wantarray ?
2820                @{ config_to_multi(git_get_project_config('url')) } :
2821                   config_to_multi(git_get_project_config('url'));
2822        my @git_project_url_list = map { chomp; $_ } <$fd>;
2823        close $fd;
2824
2825        return wantarray ? @git_project_url_list : \@git_project_url_list;
2826}
2827
2828sub git_get_projects_list {
2829        my $filter = shift || '';
2830        my $paranoid = shift;
2831        my @list;
2832
2833        if (-d $projects_list) {
2834                # search in directory
2835                my $dir = $projects_list;
2836                # remove the trailing "/"
2837                $dir =~ s!/+$!!;
2838                my $pfxlen = length("$dir");
2839                my $pfxdepth = ($dir =~ tr!/!!);
2840                # when filtering, search only given subdirectory
2841                if ($filter && !$paranoid) {
2842                        $dir .= "/$filter";
2843                        $dir =~ s!/+$!!;
2844                }
2845
2846                File::Find::find({
2847                        follow_fast => 1, # follow symbolic links
2848                        follow_skip => 2, # ignore duplicates
2849                        dangling_symlinks => 0, # ignore dangling symlinks, silently
2850                        wanted => sub {
2851                                # global variables
2852                                our $project_maxdepth;
2853                                our $projectroot;
2854                                # skip project-list toplevel, if we get it.
2855                                return if (m!^[/.]$!);
2856                                # only directories can be git repositories
2857                                return unless (-d $_);
2858                                # don't traverse too deep (Find is super slow on os x)
2859                                # $project_maxdepth excludes depth of $projectroot
2860                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
2861                                        $File::Find::prune = 1;
2862                                        return;
2863                                }
2864
2865                                my $path = substr($File::Find::name, $pfxlen + 1);
2866                                # paranoidly only filter here
2867                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
2868                                        next;
2869                                }
2870                                # we check related file in $projectroot
2871                                if (check_export_ok("$projectroot/$path")) {
2872                                        push @list, { path => $path };
2873                                        $File::Find::prune = 1;
2874                                }
2875                        },
2876                }, "$dir");
2877
2878        } elsif (-f $projects_list) {
2879                # read from file(url-encoded):
2880                # 'git%2Fgit.git Linus+Torvalds'
2881                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
2882                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
2883                open my $fd, '<', $projects_list or return;
2884        PROJECT:
2885                while (my $line = <$fd>) {
2886                        chomp $line;
2887                        my ($path, $owner) = split ' ', $line;
2888                        $path = unescape($path);
2889                        $owner = unescape($owner);
2890                        if (!defined $path) {
2891                                next;
2892                        }
2893                        # if $filter is rpovided, check if $path begins with $filter
2894                        if ($filter && $path !~ m!^\Q$filter\E/!) {
2895                                next;
2896                        }
2897                        if (check_export_ok("$projectroot/$path")) {
2898                                my $pr = {
2899                                        path => $path,
2900                                        owner => to_utf8($owner),
2901                                };
2902                                push @list, $pr;
2903                        }
2904                }
2905                close $fd;
2906        }
2907        return @list;
2908}
2909
2910# written with help of Tree::Trie module (Perl Artistic License, GPL compatibile)
2911# as side effects it sets 'forks' field to list of forks for forked projects
2912sub filter_forks_from_projects_list {
2913        my $projects = shift;
2914
2915        my %trie; # prefix tree of directories (path components)
2916        # generate trie out of those directories that might contain forks
2917        foreach my $pr (@$projects) {
2918                my $path = $pr->{'path'};
2919                $path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
2920                next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
2921                next unless ($path);      # skip '.git' repository: tests, git-instaweb
2922                next unless (-d "$projectroot/$path"); # containing directory exists
2923                $pr->{'forks'} = [];      # there can be 0 or more forks of project
2924
2925                # add to trie
2926                my @dirs = split('/', $path);
2927                # walk the trie, until either runs out of components or out of trie
2928                my $ref = \%trie;
2929                while (scalar @dirs &&
2930                       exists($ref->{$dirs[0]})) {
2931                        $ref = $ref->{shift @dirs};
2932                }
2933                # create rest of trie structure from rest of components
2934                foreach my $dir (@dirs) {
2935                        $ref = $ref->{$dir} = {};
2936                }
2937                # create end marker, store $pr as a data
2938                $ref->{''} = $pr if (!exists $ref->{''});
2939        }
2940
2941        # filter out forks, by finding shortest prefix match for paths
2942        my @filtered;
2943 PROJECT:
2944        foreach my $pr (@$projects) {
2945                # trie lookup
2946                my $ref = \%trie;
2947        DIR:
2948                foreach my $dir (split('/', $pr->{'path'})) {
2949                        if (exists $ref->{''}) {
2950                                # found [shortest] prefix, is a fork - skip it
2951                                push @{$ref->{''}{'forks'}}, $pr;
2952                                next PROJECT;
2953                        }
2954                        if (!exists $ref->{$dir}) {
2955                                # not in trie, cannot have prefix, not a fork
2956                                push @filtered, $pr;
2957                                next PROJECT;
2958                        }
2959                        # If the dir is there, we just walk one step down the trie.
2960                        $ref = $ref->{$dir};
2961                }
2962                # we ran out of trie
2963                # (shouldn't happen: it's either no match, or end marker)
2964                push @filtered, $pr;
2965        }
2966
2967        return @filtered;
2968}
2969
2970# note: fill_project_list_info must be run first,
2971# for 'descr_long' and 'ctags' to be filled
2972sub search_projects_list {
2973        my ($projlist, %opts) = @_;
2974        my $tagfilter  = $opts{'tagfilter'};
2975        my $searchtext = $opts{'searchtext'};
2976
2977        return @$projlist
2978                unless ($tagfilter || $searchtext);
2979
2980        my @projects;
2981 PROJECT:
2982        foreach my $pr (@$projlist) {
2983
2984                if ($tagfilter) {
2985                        next unless ref($pr->{'ctags'}) eq 'HASH';
2986                        next unless
2987                                grep { lc($_) eq lc($tagfilter) } keys %{$pr->{'ctags'}};
2988                }
2989
2990                if ($searchtext) {
2991                        next unless
2992                                $pr->{'path'} =~ /$searchtext/ ||
2993                                $pr->{'descr_long'} =~ /$searchtext/;
2994                }
2995
2996                push @projects, $pr;
2997        }
2998
2999        return @projects;
3000}
3001
3002our $gitweb_project_owner = undef;
3003sub git_get_project_list_from_file {
3004
3005        return if (defined $gitweb_project_owner);
3006
3007        $gitweb_project_owner = {};
3008        # read from file (url-encoded):
3009        # 'git%2Fgit.git Linus+Torvalds'
3010        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
3011        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
3012        if (-f $projects_list) {
3013                open(my $fd, '<', $projects_list);
3014                while (my $line = <$fd>) {
3015                        chomp $line;
3016                        my ($pr, $ow) = split ' ', $line;
3017                        $pr = unescape($pr);
3018                        $ow = unescape($ow);
3019                        $gitweb_project_owner->{$pr} = to_utf8($ow);
3020                }
3021                close $fd;
3022        }
3023}
3024
3025sub git_get_project_owner {
3026        my $project = shift;
3027        my $owner;
3028
3029        return undef unless $project;
3030        $git_dir = "$projectroot/$project";
3031
3032        if (!defined $gitweb_project_owner) {
3033                git_get_project_list_from_file();
3034        }
3035
3036        if (exists $gitweb_project_owner->{$project}) {
3037                $owner = $gitweb_project_owner->{$project};
3038        }
3039        if (!defined $owner){
3040                $owner = git_get_project_config('owner');
3041        }
3042        if (!defined $owner) {
3043                $owner = get_file_owner("$git_dir");
3044        }
3045
3046        return $owner;
3047}
3048
3049sub git_get_last_activity {
3050        my ($path) = @_;
3051        my $fd;
3052
3053        $git_dir = "$projectroot/$path";
3054        open($fd, "-|", git_cmd(), 'for-each-ref',
3055             '--format=%(committer)',
3056             '--sort=-committerdate',
3057             '--count=1',
3058             'refs/heads') or return;
3059        my $most_recent = <$fd>;
3060        close $fd or return;
3061        if (defined $most_recent &&
3062            $most_recent =~ / (\d+) [-+][01]\d\d\d$/) {
3063                my $timestamp = $1;
3064                my $age = time - $timestamp;
3065                return ($age, age_string($age));
3066        }
3067        return (undef, undef);
3068}
3069
3070# Implementation note: when a single remote is wanted, we cannot use 'git
3071# remote show -n' because that command always work (assuming it's a remote URL
3072# if it's not defined), and we cannot use 'git remote show' because that would
3073# try to make a network roundtrip. So the only way to find if that particular
3074# remote is defined is to walk the list provided by 'git remote -v' and stop if
3075# and when we find what we want.
3076sub git_get_remotes_list {
3077        my $wanted = shift;
3078        my %remotes = ();
3079
3080        open my $fd, '-|' , git_cmd(), 'remote', '-v';
3081        return unless $fd;
3082        while (my $remote = <$fd>) {
3083                chomp $remote;
3084                $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
3085                next if $wanted and not $remote eq $wanted;
3086                my ($url, $key) = ($1, $2);
3087
3088                $remotes{$remote} ||= { 'heads' => () };
3089                $remotes{$remote}{$key} = $url;
3090        }
3091        close $fd or return;
3092        return wantarray ? %remotes : \%remotes;
3093}
3094
3095# Takes a hash of remotes as first parameter and fills it by adding the
3096# available remote heads for each of the indicated remotes.
3097sub fill_remote_heads {
3098        my $remotes = shift;
3099        my @heads = map { "remotes/$_" } keys %$remotes;
3100        my @remoteheads = git_get_heads_list(undef, @heads);
3101        foreach my $remote (keys %$remotes) {
3102                $remotes->{$remote}{'heads'} = [ grep {
3103                        $_->{'name'} =~ s!^$remote/!!
3104                        } @remoteheads ];
3105        }
3106}
3107
3108sub git_get_references {
3109        my $type = shift || "";
3110        my %refs;
3111        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
3112        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
3113        open my $fd, "-|", git_cmd(), "show-ref", "--dereference",
3114                ($type ? ("--", "refs/$type") : ()) # use -- <pattern> if $type
3115                or return;
3116
3117        while (my $line = <$fd>) {
3118                chomp $line;
3119                if ($line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!) {
3120                        if (defined $refs{$1}) {
3121                                push @{$refs{$1}}, $2;
3122                        } else {
3123                                $refs{$1} = [ $2 ];
3124                        }
3125                }
3126        }
3127        close $fd or return;
3128        return \%refs;
3129}
3130
3131sub git_get_rev_name_tags {
3132        my $hash = shift || return undef;
3133
3134        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
3135                or return;
3136        my $name_rev = <$fd>;
3137        close $fd;
3138
3139        if ($name_rev =~ m|^$hash tags/(.*)$|) {
3140                return $1;
3141        } else {
3142                # catches also '$hash undefined' output
3143                return undef;
3144        }
3145}
3146
3147## ----------------------------------------------------------------------
3148## parse to hash functions
3149
3150sub parse_date {
3151        my $epoch = shift;
3152        my $tz = shift || "-0000";
3153
3154        my %date;
3155        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
3156        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
3157        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
3158        $date{'hour'} = $hour;
3159        $date{'minute'} = $min;
3160        $date{'mday'} = $mday;
3161        $date{'day'} = $days[$wday];
3162        $date{'month'} = $months[$mon];
3163        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
3164                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
3165        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
3166                             $mday, $months[$mon], $hour ,$min;
3167        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
3168                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;
3169
3170        my ($tz_sign, $tz_hour, $tz_min) =
3171                ($tz =~ m/^([-+])(\d\d)(\d\d)$/);
3172        $tz_sign = ($tz_sign eq '-' ? -1 : +1);
3173        my $local = $epoch + $tz_sign*((($tz_hour*60) + $tz_min)*60);
3174        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
3175        $date{'hour_local'} = $hour;
3176        $date{'minute_local'} = $min;
3177        $date{'tz_local'} = $tz;
3178        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
3179                                  1900+$year, $mon+1, $mday,
3180                                  $hour, $min, $sec, $tz);
3181        return %date;
3182}
3183
3184sub parse_tag {
3185        my $tag_id = shift;
3186        my %tag;
3187        my @comment;
3188
3189        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
3190        $tag{'id'} = $tag_id;
3191        while (my $line = <$fd>) {
3192                chomp $line;
3193                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
3194                        $tag{'object'} = $1;
3195                } elsif ($line =~ m/^type (.+)$/) {
3196                        $tag{'type'} = $1;
3197                } elsif ($line =~ m/^tag (.+)$/) {
3198                        $tag{'name'} = $1;
3199                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
3200                        $tag{'author'} = $1;
3201                        $tag{'author_epoch'} = $2;
3202                        $tag{'author_tz'} = $3;
3203                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
3204                                $tag{'author_name'}  = $1;
3205                                $tag{'author_email'} = $2;
3206                        } else {
3207                                $tag{'author_name'} = $tag{'author'};
3208                        }
3209                } elsif ($line =~ m/--BEGIN/) {
3210                        push @comment, $line;
3211                        last;
3212                } elsif ($line eq "") {
3213                        last;
3214                }
3215        }
3216        push @comment, <$fd>;
3217        $tag{'comment'} = \@comment;
3218        close $fd or return;
3219        if (!defined $tag{'name'}) {
3220                return
3221        };
3222        return %tag
3223}
3224
3225sub parse_commit_text {
3226        my ($commit_text, $withparents) = @_;
3227        my @commit_lines = split '\n', $commit_text;
3228        my %co;
3229
3230        pop @commit_lines; # Remove '\0'
3231
3232        if (! @commit_lines) {
3233                return;
3234        }
3235
3236        my $header = shift @commit_lines;
3237        if ($header !~ m/^[0-9a-fA-F]{40}/) {
3238                return;
3239        }
3240        ($co{'id'}, my @parents) = split ' ', $header;
3241        while (my $line = shift @commit_lines) {
3242                last if $line eq "\n";
3243                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
3244                        $co{'tree'} = $1;
3245                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
3246                        push @parents, $1;
3247                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
3248                        $co{'author'} = to_utf8($1);
3249                        $co{'author_epoch'} = $2;
3250                        $co{'author_tz'} = $3;
3251                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
3252                                $co{'author_name'}  = $1;
3253                                $co{'author_email'} = $2;
3254                        } else {
3255                                $co{'author_name'} = $co{'author'};
3256                        }
3257                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
3258                        $co{'committer'} = to_utf8($1);
3259                        $co{'committer_epoch'} = $2;
3260                        $co{'committer_tz'} = $3;
3261                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
3262                                $co{'committer_name'}  = $1;
3263                                $co{'committer_email'} = $2;
3264                        } else {
3265                                $co{'committer_name'} = $co{'committer'};
3266                        }
3267                }
3268        }
3269        if (!defined $co{'tree'}) {
3270                return;
3271        };
3272        $co{'parents'} = \@parents;
3273        $co{'parent'} = $parents[0];
3274
3275        foreach my $title (@commit_lines) {
3276                $title =~ s/^    //;
3277                if ($title ne "") {
3278                        $co{'title'} = chop_str($title, 80, 5);
3279                        # remove leading stuff of merges to make the interesting part visible
3280                        if (length($title) > 50) {
3281                                $title =~ s/^Automatic //;
3282                                $title =~ s/^merge (of|with) /Merge ... /i;
3283                                if (length($title) > 50) {
3284                                        $title =~ s/(http|rsync):\/\///;
3285                                }
3286                                if (length($title) > 50) {
3287                                        $title =~ s/(master|www|rsync)\.//;
3288                                }
3289                                if (length($title) > 50) {
3290                                        $title =~ s/kernel.org:?//;
3291                                }
3292                                if (length($title) > 50) {
3293                                        $title =~ s/\/pub\/scm//;
3294                                }
3295                        }
3296                        $co{'title_short'} = chop_str($title, 50, 5);
3297                        last;
3298                }
3299        }
3300        if (! defined $co{'title'} || $co{'title'} eq "") {
3301                $co{'title'} = $co{'title_short'} = '(no commit message)';
3302        }
3303        # remove added spaces
3304        foreach my $line (@commit_lines) {
3305                $line =~ s/^    //;
3306        }
3307        $co{'comment'} = \@commit_lines;
3308
3309        my $age = time - $co{'committer_epoch'};
3310        $co{'age'} = $age;
3311        $co{'age_string'} = age_string($age);
3312        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
3313        if ($age > 60*60*24*7*2) {
3314                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
3315                $co{'age_string_age'} = $co{'age_string'};
3316        } else {
3317                $co{'age_string_date'} = $co{'age_string'};
3318                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
3319        }
3320        return %co;
3321}
3322
3323sub parse_commit {
3324        my ($commit_id) = @_;
3325        my %co;
3326
3327        local $/ = "\0";
3328
3329        open my $fd, "-|", git_cmd(), "rev-list",
3330                "--parents",
3331                "--header",
3332                "--max-count=1",
3333                $commit_id,
3334                "--",
3335                or die_error(500, "Open git-rev-list failed");
3336        %co = parse_commit_text(<$fd>, 1);
3337        close $fd;
3338
3339        return %co;
3340}
3341
3342sub parse_commits {
3343        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
3344        my @cos;
3345
3346        $maxcount ||= 1;
3347        $skip ||= 0;
3348
3349        local $/ = "\0";
3350
3351        open my $fd, "-|", git_cmd(), "rev-list",
3352                "--header",
3353                @args,
3354                ("--max-count=" . $maxcount),
3355                ("--skip=" . $skip),
3356                @extra_options,
3357                $commit_id,
3358                "--",
3359                ($filename ? ($filename) : ())
3360                or die_error(500, "Open git-rev-list failed");
3361        while (my $line = <$fd>) {
3362                my %co = parse_commit_text($line);
3363                push @cos, \%co;
3364        }
3365        close $fd;
3366
3367        return wantarray ? @cos : \@cos;
3368}
3369
3370# parse line of git-diff-tree "raw" output
3371sub parse_difftree_raw_line {
3372        my $line = shift;
3373        my %res;
3374
3375        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
3376        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
3377        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
3378                $res{'from_mode'} = $1;
3379                $res{'to_mode'} = $2;
3380                $res{'from_id'} = $3;
3381                $res{'to_id'} = $4;
3382                $res{'status'} = $5;
3383                $res{'similarity'} = $6;
3384                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
3385                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $7);
3386                } else {
3387                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($7);
3388                }
3389        }
3390        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
3391        # combined diff (for merge commit)
3392        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
3393                $res{'nparents'}  = length($1);
3394                $res{'from_mode'} = [ split(' ', $2) ];
3395                $res{'to_mode'} = pop @{$res{'from_mode'}};
3396                $res{'from_id'} = [ split(' ', $3) ];
3397                $res{'to_id'} = pop @{$res{'from_id'}};
3398                $res{'status'} = [ split('', $4) ];
3399                $res{'to_file'} = unquote($5);
3400        }
3401        # 'c512b523472485aef4fff9e57b229d9d243c967f'
3402        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
3403                $res{'commit'} = $1;
3404        }
3405
3406        return wantarray ? %res : \%res;
3407}
3408
3409# wrapper: return parsed line of git-diff-tree "raw" output
3410# (the argument might be raw line, or parsed info)
3411sub parsed_difftree_line {
3412        my $line_or_ref = shift;
3413
3414        if (ref($line_or_ref) eq "HASH") {
3415                # pre-parsed (or generated by hand)
3416                return $line_or_ref;
3417        } else {
3418                return parse_difftree_raw_line($line_or_ref);
3419        }
3420}
3421
3422# parse line of git-ls-tree output
3423sub parse_ls_tree_line {
3424        my $line = shift;
3425        my %opts = @_;
3426        my %res;
3427
3428        if ($opts{'-l'}) {
3429                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
3430                $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;
3431
3432                $res{'mode'} = $1;
3433                $res{'type'} = $2;
3434                $res{'hash'} = $3;
3435                $res{'size'} = $4;
3436                if ($opts{'-z'}) {
3437                        $res{'name'} = $5;
3438                } else {
3439                        $res{'name'} = unquote($5);
3440                }
3441        } else {
3442                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
3443                $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;
3444
3445                $res{'mode'} = $1;
3446                $res{'type'} = $2;
3447                $res{'hash'} = $3;
3448                if ($opts{'-z'}) {
3449                        $res{'name'} = $4;
3450                } else {
3451                        $res{'name'} = unquote($4);
3452                }
3453        }
3454
3455        return wantarray ? %res : \%res;
3456}
3457
3458# generates _two_ hashes, references to which are passed as 2 and 3 argument
3459sub parse_from_to_diffinfo {
3460        my ($diffinfo, $from, $to, @parents) = @_;
3461
3462        if ($diffinfo->{'nparents'}) {
3463                # combined diff
3464                $from->{'file'} = [];
3465                $from->{'href'} = [];
3466                fill_from_file_info($diffinfo, @parents)
3467                        unless exists $diffinfo->{'from_file'};
3468                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
3469                        $from->{'file'}[$i] =
3470                                defined $diffinfo->{'from_file'}[$i] ?
3471                                        $diffinfo->{'from_file'}[$i] :
3472                                        $diffinfo->{'to_file'};
3473                        if ($diffinfo->{'status'}[$i] ne "A") { # not new (added) file
3474                                $from->{'href'}[$i] = href(action=>"blob",
3475                                                           hash_base=>$parents[$i],
3476                                                           hash=>$diffinfo->{'from_id'}[$i],
3477                                                           file_name=>$from->{'file'}[$i]);
3478                        } else {
3479                                $from->{'href'}[$i] = undef;
3480                        }
3481                }
3482        } else {
3483                # ordinary (not combined) diff
3484                $from->{'file'} = $diffinfo->{'from_file'};
3485                if ($diffinfo->{'status'} ne "A") { # not new (added) file
3486                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
3487                                               hash=>$diffinfo->{'from_id'},
3488                                               file_name=>$from->{'file'});
3489                } else {
3490                        delete $from->{'href'};
3491                }
3492        }
3493
3494        $to->{'file'} = $diffinfo->{'to_file'};
3495        if (!is_deleted($diffinfo)) { # file exists in result
3496                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
3497                                     hash=>$diffinfo->{'to_id'},
3498                                     file_name=>$to->{'file'});
3499        } else {
3500                delete $to->{'href'};
3501        }
3502}
3503
3504## ......................................................................
3505## parse to array of hashes functions
3506
3507sub git_get_heads_list {
3508        my ($limit, @classes) = @_;
3509        @classes = ('heads') unless @classes;
3510        my @patterns = map { "refs/$_" } @classes;
3511        my @headslist;
3512
3513        open my $fd, '-|', git_cmd(), 'for-each-ref',
3514                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
3515                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
3516                @patterns
3517                or return;
3518        while (my $line = <$fd>) {
3519                my %ref_item;
3520
3521                chomp $line;
3522                my ($refinfo, $committerinfo) = split(/\0/, $line);
3523                my ($hash, $name, $title) = split(' ', $refinfo, 3);
3524                my ($committer, $epoch, $tz) =
3525                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
3526                $ref_item{'fullname'}  = $name;
3527                $name =~ s!^refs/(?:head|remote)s/!!;
3528
3529                $ref_item{'name'}  = $name;
3530                $ref_item{'id'}    = $hash;
3531                $ref_item{'title'} = $title || '(no commit message)';
3532                $ref_item{'epoch'} = $epoch;
3533                if ($epoch) {
3534                        $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
3535                } else {
3536                        $ref_item{'age'} = "unknown";
3537                }
3538
3539                push @headslist, \%ref_item;
3540        }
3541        close $fd;
3542
3543        return wantarray ? @headslist : \@headslist;
3544}
3545
3546sub git_get_tags_list {
3547        my $limit = shift;
3548        my @tagslist;
3549
3550        open my $fd, '-|', git_cmd(), 'for-each-ref',
3551                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
3552                '--format=%(objectname) %(objecttype) %(refname) '.
3553                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
3554                'refs/tags'
3555                or return;
3556        while (my $line = <$fd>) {
3557                my %ref_item;
3558
3559                chomp $line;
3560                my ($refinfo, $creatorinfo) = split(/\0/, $line);
3561                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
3562                my ($creator, $epoch, $tz) =
3563                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
3564                $ref_item{'fullname'} = $name;
3565                $name =~ s!^refs/tags/!!;
3566
3567                $ref_item{'type'} = $type;
3568                $ref_item{'id'} = $id;
3569                $ref_item{'name'} = $name;
3570                if ($type eq "tag") {
3571                        $ref_item{'subject'} = $title;
3572                        $ref_item{'reftype'} = $reftype;
3573                        $ref_item{'refid'}   = $refid;
3574                } else {
3575                        $ref_item{'reftype'} = $type;
3576                        $ref_item{'refid'}   = $id;
3577                }
3578
3579                if ($type eq "tag" || $type eq "commit") {
3580                        $ref_item{'epoch'} = $epoch;
3581                        if ($epoch) {
3582                                $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
3583                        } else {
3584                                $ref_item{'age'} = "unknown";
3585                        }
3586                }
3587
3588                push @tagslist, \%ref_item;
3589        }
3590        close $fd;
3591
3592        return wantarray ? @tagslist : \@tagslist;
3593}
3594
3595## ----------------------------------------------------------------------
3596## filesystem-related functions
3597
3598sub get_file_owner {
3599        my $path = shift;
3600
3601        my ($dev, $ino, $mode, $nlink, $st_uid, $st_gid, $rdev, $size) = stat($path);
3602        my ($name, $passwd, $uid, $gid, $quota, $comment, $gcos, $dir, $shell) = getpwuid($st_uid);
3603        if (!defined $gcos) {
3604                return undef;
3605        }
3606        my $owner = $gcos;
3607        $owner =~ s/[,;].*$//;
3608        return to_utf8($owner);
3609}
3610
3611# assume that file exists
3612sub insert_file {
3613        my $filename = shift;
3614
3615        open my $fd, '<', $filename;
3616        print map { to_utf8($_) } <$fd>;
3617        close $fd;
3618}
3619
3620## ......................................................................
3621## mimetype related functions
3622
3623sub mimetype_guess_file {
3624        my $filename = shift;
3625        my $mimemap = shift;
3626        -r $mimemap or return undef;
3627
3628        my %mimemap;
3629        open(my $mh, '<', $mimemap) or return undef;
3630        while (<$mh>) {
3631                next if m/^#/; # skip comments
3632                my ($mimetype, @exts) = split(/\s+/);
3633                foreach my $ext (@exts) {
3634                        $mimemap{$ext} = $mimetype;
3635                }
3636        }
3637        close($mh);
3638
3639        $filename =~ /\.([^.]*)$/;
3640        return $mimemap{$1};
3641}
3642
3643sub mimetype_guess {
3644        my $filename = shift;
3645        my $mime;
3646        $filename =~ /\./ or return undef;
3647
3648        if ($mimetypes_file) {
3649                my $file = $mimetypes_file;
3650                if ($file !~ m!^/!) { # if it is relative path
3651                        # it is relative to project
3652                        $file = "$projectroot/$project/$file";
3653                }
3654                $mime = mimetype_guess_file($filename, $file);
3655        }
3656        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');
3657        return $mime;
3658}
3659
3660sub blob_mimetype {
3661        my $fd = shift;
3662        my $filename = shift;
3663
3664        if ($filename) {
3665                my $mime = mimetype_guess($filename);
3666                $mime and return $mime;
3667        }
3668
3669        # just in case
3670        return $default_blob_plain_mimetype unless $fd;
3671
3672        if (-T $fd) {
3673                return 'text/plain';
3674        } elsif (! $filename) {
3675                return 'application/octet-stream';
3676        } elsif ($filename =~ m/\.png$/i) {
3677                return 'image/png';
3678        } elsif ($filename =~ m/\.gif$/i) {
3679                return 'image/gif';
3680        } elsif ($filename =~ m/\.jpe?g$/i) {
3681                return 'image/jpeg';
3682        } else {
3683                return 'application/octet-stream';
3684        }
3685}
3686
3687sub blob_contenttype {
3688        my ($fd, $file_name, $type) = @_;
3689
3690        $type ||= blob_mimetype($fd, $file_name);
3691        if ($type eq 'text/plain' && defined $default_text_plain_charset) {
3692                $type .= "; charset=$default_text_plain_charset";
3693        }
3694
3695        return $type;
3696}
3697
3698# guess file syntax for syntax highlighting; return undef if no highlighting
3699# the name of syntax can (in the future) depend on syntax highlighter used
3700sub guess_file_syntax {
3701        my ($highlight, $mimetype, $file_name) = @_;
3702        return undef unless ($highlight && defined $file_name);
3703        my $basename = basename($file_name, '.in');
3704        return $highlight_basename{$basename}
3705                if exists $highlight_basename{$basename};
3706
3707        $basename =~ /\.([^.]*)$/;
3708        my $ext = $1 or return undef;
3709        return $highlight_ext{$ext}
3710                if exists $highlight_ext{$ext};
3711
3712        return undef;
3713}
3714
3715# run highlighter and return FD of its output,
3716# or return original FD if no highlighting
3717sub run_highlighter {
3718        my ($fd, $highlight, $syntax) = @_;
3719        return $fd unless ($highlight && defined $syntax);
3720
3721        close $fd;
3722        open $fd, quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
3723                  quote_command($highlight_bin).
3724                  " --replace-tabs=8 --fragment --syntax $syntax |"
3725                or die_error(500, "Couldn't open file or run syntax highlighter");
3726        return $fd;
3727}
3728
3729## ======================================================================
3730## functions printing HTML: header, footer, error page
3731
3732sub get_page_title {
3733        my $title = to_utf8($site_name);
3734
3735        return $title unless (defined $project);
3736        $title .= " - " . to_utf8($project);
3737
3738        return $title unless (defined $action);
3739        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)
3740
3741        return $title unless (defined $file_name);
3742        $title .= " - " . esc_path($file_name);
3743        if ($action eq "tree" && $file_name !~ m|/$|) {
3744                $title .= "/";
3745        }
3746
3747        return $title;
3748}
3749
3750sub get_content_type_html {
3751        # require explicit support from the UA if we are to send the page as
3752        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
3753        # we have to do this because MSIE sometimes globs '*/*', pretending to
3754        # support xhtml+xml but choking when it gets what it asked for.
3755        if (defined $cgi->http('HTTP_ACCEPT') &&
3756            $cgi->http('HTTP_ACCEPT') =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
3757            $cgi->Accept('application/xhtml+xml') != 0) {
3758                return 'application/xhtml+xml';
3759        } else {
3760                return 'text/html';
3761        }
3762}
3763
3764sub print_feed_meta {
3765        if (defined $project) {
3766                my %href_params = get_feed_info();
3767                if (!exists $href_params{'-title'}) {
3768                        $href_params{'-title'} = 'log';
3769                }
3770
3771                foreach my $format (qw(RSS Atom)) {
3772                        my $type = lc($format);
3773                        my %link_attr = (
3774                                '-rel' => 'alternate',
3775                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
3776                                '-type' => "application/$type+xml"
3777                        );
3778
3779                        $href_params{'action'} = $type;
3780                        $link_attr{'-href'} = href(%href_params);
3781                        print "<link ".
3782                              "rel=\"$link_attr{'-rel'}\" ".
3783                              "title=\"$link_attr{'-title'}\" ".
3784                              "href=\"$link_attr{'-href'}\" ".
3785                              "type=\"$link_attr{'-type'}\" ".
3786                              "/>\n";
3787
3788                        $href_params{'extra_options'} = '--no-merges';
3789                        $link_attr{'-href'} = href(%href_params);
3790                        $link_attr{'-title'} .= ' (no merges)';
3791                        print "<link ".
3792                              "rel=\"$link_attr{'-rel'}\" ".
3793                              "title=\"$link_attr{'-title'}\" ".
3794                              "href=\"$link_attr{'-href'}\" ".
3795                              "type=\"$link_attr{'-type'}\" ".
3796                              "/>\n";
3797                }
3798
3799        } else {
3800                printf('<link rel="alternate" title="%s projects list" '.
3801                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
3802                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
3803                printf('<link rel="alternate" title="%s projects feeds" '.
3804                       'href="%s" type="text/x-opml" />'."\n",
3805                       esc_attr($site_name), href(project=>undef, action=>"opml"));
3806        }
3807}
3808
3809sub print_header_links {
3810        my $status = shift;
3811
3812        # print out each stylesheet that exist, providing backwards capability
3813        # for those people who defined $stylesheet in a config file
3814        if (defined $stylesheet) {
3815                print '<link rel="stylesheet" type="text/css" href="'.esc_url($stylesheet).'"/>'."\n";
3816        } else {
3817                foreach my $stylesheet (@stylesheets) {
3818                        next unless $stylesheet;
3819                        print '<link rel="stylesheet" type="text/css" href="'.esc_url($stylesheet).'"/>'."\n";
3820                }
3821        }
3822        print_feed_meta()
3823                if ($status eq '200 OK');
3824        if (defined $favicon) {
3825                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
3826        }
3827}
3828
3829sub print_nav_breadcrumbs {
3830        my %opts = @_;
3831
3832        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
3833        if (defined $project) {
3834                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
3835                if (defined $action) {
3836                        my $action_print = $action ;
3837                        if (defined $opts{-action_extra}) {
3838                                $action_print = $cgi->a({-href => href(action=>$action)},
3839                                        $action);
3840                        }
3841                        print " / $action_print";
3842                }
3843                if (defined $opts{-action_extra}) {
3844                        print " / $opts{-action_extra}";
3845                }
3846                print "\n";
3847        }
3848}
3849
3850sub print_search_form {
3851        if (!defined $searchtext) {
3852                $searchtext = "";
3853        }
3854        my $search_hash;
3855        if (defined $hash_base) {
3856                $search_hash = $hash_base;
3857        } elsif (defined $hash) {
3858                $search_hash = $hash;
3859        } else {
3860                $search_hash = "HEAD";
3861        }
3862        my $action = $my_uri;
3863        my $use_pathinfo = gitweb_check_feature('pathinfo');
3864        if ($use_pathinfo) {
3865                $action .= "/".esc_url($project);
3866        }
3867        print $cgi->startform(-method => "get", -action => $action) .
3868              "<div class=\"search\">\n" .
3869              (!$use_pathinfo &&
3870              $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
3871              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
3872              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
3873              $cgi->popup_menu(-name => 'st', -default => 'commit',
3874                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
3875              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
3876              " search:\n",
3877              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
3878              "<span title=\"Extended regular expression\">" .
3879              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
3880                             -checked => $search_use_regexp) .
3881              "</span>" .
3882              "</div>" .
3883              $cgi->end_form() . "\n";
3884}
3885
3886sub git_header_html {
3887        my $status = shift || "200 OK";
3888        my $expires = shift;
3889        my %opts = @_;
3890
3891        my $title = get_page_title();
3892        my $content_type = get_content_type_html();
3893        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
3894                           -status=> $status, -expires => $expires)
3895                unless ($opts{'-no_http_header'});
3896        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
3897        print <<EOF;
3898<?xml version="1.0" encoding="utf-8"?>
3899<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
3900<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
3901<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
3902<!-- git core binaries version $git_version -->
3903<head>
3904<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
3905<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
3906<meta name="robots" content="index, nofollow"/>
3907<title>$title</title>
3908EOF
3909        # the stylesheet, favicon etc urls won't work correctly with path_info
3910        # unless we set the appropriate base URL
3911        if ($ENV{'PATH_INFO'}) {
3912                print "<base href=\"".esc_url($base_url)."\" />\n";
3913        }
3914        print_header_links($status);
3915
3916        if (defined $site_html_head_string) {
3917                print to_utf8($site_html_head_string);
3918        }
3919
3920        print "</head>\n" .
3921              "<body>\n";
3922
3923        if (defined $site_header && -f $site_header) {
3924                insert_file($site_header);
3925        }
3926
3927        print "<div class=\"page_header\">\n";
3928        if (defined $logo) {
3929                print $cgi->a({-href => esc_url($logo_url),
3930                               -title => $logo_label},
3931                              $cgi->img({-src => esc_url($logo),
3932                                         -width => 72, -height => 27,
3933                                         -alt => "git",
3934                                         -class => "logo"}));
3935        }
3936        print_nav_breadcrumbs(%opts);
3937        print "</div>\n";
3938
3939        my $have_search = gitweb_check_feature('search');
3940        if (defined $project && $have_search) {
3941                print_search_form();
3942        }
3943}
3944
3945sub git_footer_html {
3946        my $feed_class = 'rss_logo';
3947
3948        print "<div class=\"page_footer\">\n";
3949        if (defined $project) {
3950                my $descr = git_get_project_description($project);
3951                if (defined $descr) {
3952                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
3953                }
3954
3955                my %href_params = get_feed_info();
3956                if (!%href_params) {
3957                        $feed_class .= ' generic';
3958                }
3959                $href_params{'-title'} ||= 'log';
3960
3961                foreach my $format (qw(RSS Atom)) {
3962                        $href_params{'action'} = lc($format);
3963                        print $cgi->a({-href => href(%href_params),
3964                                      -title => "$href_params{'-title'} $format feed",
3965                                      -class => $feed_class}, $format)."\n";
3966                }
3967
3968        } else {
3969                print $cgi->a({-href => href(project=>undef, action=>"opml"),
3970                              -class => $feed_class}, "OPML") . " ";
3971                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
3972                              -class => $feed_class}, "TXT") . "\n";
3973        }
3974        print "</div>\n"; # class="page_footer"
3975
3976        if (defined $t0 && gitweb_check_feature('timed')) {
3977                print "<div id=\"generating_info\">\n";
3978                print 'This page took '.
3979                      '<span id="generating_time" class="time_span">'.
3980                      tv_interval($t0, [ gettimeofday() ]).
3981                      ' seconds </span>'.
3982                      ' and '.
3983                      '<span id="generating_cmd">'.
3984                      $number_of_git_cmds.
3985                      '</span> git commands '.
3986                      " to generate.\n";
3987                print "</div>\n"; # class="page_footer"
3988        }
3989
3990        if (defined $site_footer && -f $site_footer) {
3991                insert_file($site_footer);
3992        }
3993
3994        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
3995        if (defined $action &&
3996            $action eq 'blame_incremental') {
3997                print qq!<script type="text/javascript">\n!.
3998                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
3999                      qq!           "!. href() .qq!");\n!.
4000                      qq!</script>\n!;
4001        } else {
4002                my ($jstimezone, $tz_cookie, $datetime_class) =
4003                        gitweb_get_feature('javascript-timezone');
4004
4005                print qq!<script type="text/javascript">\n!.
4006                      qq!window.onload = function () {\n!;
4007                if (gitweb_check_feature('javascript-actions')) {
4008                        print qq!       fixLinks();\n!;
4009                }
4010                if ($jstimezone && $tz_cookie && $datetime_class) {
4011                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
4012                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
4013                }
4014                print qq!};\n!.
4015                      qq!</script>\n!;
4016        }
4017
4018        print "</body>\n" .
4019              "</html>";
4020}
4021
4022# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
4023# Example: die_error(404, 'Hash not found')
4024# By convention, use the following status codes (as defined in RFC 2616):
4025# 400: Invalid or missing CGI parameters, or
4026#      requested object exists but has wrong type.
4027# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
4028#      this server or project.
4029# 404: Requested object/revision/project doesn't exist.
4030# 500: The server isn't configured properly, or
4031#      an internal error occurred (e.g. failed assertions caused by bugs), or
4032#      an unknown error occurred (e.g. the git binary died unexpectedly).
4033# 503: The server is currently unavailable (because it is overloaded,
4034#      or down for maintenance).  Generally, this is a temporary state.
4035sub die_error {
4036        my $status = shift || 500;
4037        my $error = esc_html(shift) || "Internal Server Error";
4038        my $extra = shift;
4039        my %opts = @_;
4040
4041        my %http_responses = (
4042                400 => '400 Bad Request',
4043                403 => '403 Forbidden',
4044                404 => '404 Not Found',
4045                500 => '500 Internal Server Error',
4046                503 => '503 Service Unavailable',
4047        );
4048        git_header_html($http_responses{$status}, undef, %opts);
4049        print <<EOF;
4050<div class="page_body">
4051<br /><br />
4052$status - $error
4053<br />
4054EOF
4055        if (defined $extra) {
4056                print "<hr />\n" .
4057                      "$extra\n";
4058        }
4059        print "</div>\n";
4060
4061        git_footer_html();
4062        goto DONE_GITWEB
4063                unless ($opts{'-error_handler'});
4064}
4065
4066## ----------------------------------------------------------------------
4067## functions printing or outputting HTML: navigation
4068
4069sub git_print_page_nav {
4070        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
4071        $extra = '' if !defined $extra; # pager or formats
4072
4073        my @navs = qw(summary shortlog log commit commitdiff tree);
4074        if ($suppress) {
4075                @navs = grep { $_ ne $suppress } @navs;
4076        }
4077
4078        my %arg = map { $_ => {action=>$_} } @navs;
4079        if (defined $head) {
4080                for (qw(commit commitdiff)) {
4081                        $arg{$_}{'hash'} = $head;
4082                }
4083                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
4084                        for (qw(shortlog log)) {
4085                                $arg{$_}{'hash'} = $head;
4086                        }
4087                }
4088        }
4089
4090        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
4091        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;
4092
4093        my @actions = gitweb_get_feature('actions');
4094        my %repl = (
4095                '%' => '%',
4096                'n' => $project,         # project name
4097                'f' => $git_dir,         # project path within filesystem
4098                'h' => $treehead || '',  # current hash ('h' parameter)
4099                'b' => $treebase || '',  # hash base ('hb' parameter)
4100        );
4101        while (@actions) {
4102                my ($label, $link, $pos) = splice(@actions,0,3);
4103                # insert
4104                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
4105                # munch munch
4106                $link =~ s/%([%nfhb])/$repl{$1}/g;
4107                $arg{$label}{'_href'} = $link;
4108        }
4109
4110        print "<div class=\"page_nav\">\n" .
4111                (join " | ",
4112                 map { $_ eq $current ?
4113                       $_ : $cgi->a({-href => ($arg{$_}{_href} ? $arg{$_}{_href} : href(%{$arg{$_}}))}, "$_")
4114                 } @navs);
4115        print "<br/>\n$extra<br/>\n" .
4116              "</div>\n";
4117}
4118
4119# returns a submenu for the nagivation of the refs views (tags, heads,
4120# remotes) with the current view disabled and the remotes view only
4121# available if the feature is enabled
4122sub format_ref_views {
4123        my ($current) = @_;
4124        my @ref_views = qw{tags heads};
4125        push @ref_views, 'remotes' if gitweb_check_feature('remote_heads');
4126        return join " | ", map {
4127                $_ eq $current ? $_ :
4128                $cgi->a({-href => href(action=>$_)}, $_)
4129        } @ref_views
4130}
4131
4132sub format_paging_nav {
4133        my ($action, $page, $has_next_link) = @_;
4134        my $paging_nav;
4135
4136
4137        if ($page > 0) {
4138                $paging_nav .=
4139                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
4140                        " &sdot; " .
4141                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
4142                                 -accesskey => "p", -title => "Alt-p"}, "prev");
4143        } else {
4144                $paging_nav .= "first &sdot; prev";
4145        }
4146
4147        if ($has_next_link) {
4148                $paging_nav .= " &sdot; " .
4149                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
4150                                 -accesskey => "n", -title => "Alt-n"}, "next");
4151        } else {
4152                $paging_nav .= " &sdot; next";
4153        }
4154
4155        return $paging_nav;
4156}
4157
4158## ......................................................................
4159## functions printing or outputting HTML: div
4160
4161sub git_print_header_div {
4162        my ($action, $title, $hash, $hash_base) = @_;
4163        my %args = ();
4164
4165        $args{'action'} = $action;
4166        $args{'hash'} = $hash if $hash;
4167        $args{'hash_base'} = $hash_base if $hash_base;
4168
4169        print "<div class=\"header\">\n" .
4170              $cgi->a({-href => href(%args), -class => "title"},
4171              $title ? $title : $action) .
4172              "\n</div>\n";
4173}
4174
4175sub format_repo_url {
4176        my ($name, $url) = @_;
4177        return "<tr class=\"metadata_url\"><td>$name</td><td>$url</td></tr>\n";
4178}
4179
4180# Group output by placing it in a DIV element and adding a header.
4181# Options for start_div() can be provided by passing a hash reference as the
4182# first parameter to the function.
4183# Options to git_print_header_div() can be provided by passing an array
4184# reference. This must follow the options to start_div if they are present.
4185# The content can be a scalar, which is output as-is, a scalar reference, which
4186# is output after html escaping, an IO handle passed either as *handle or
4187# *handle{IO}, or a function reference. In the latter case all following
4188# parameters will be taken as argument to the content function call.
4189sub git_print_section {
4190        my ($div_args, $header_args, $content);
4191        my $arg = shift;
4192        if (ref($arg) eq 'HASH') {
4193                $div_args = $arg;
4194                $arg = shift;
4195        }
4196        if (ref($arg) eq 'ARRAY') {
4197                $header_args = $arg;
4198                $arg = shift;
4199        }
4200        $content = $arg;
4201
4202        print $cgi->start_div($div_args);
4203        git_print_header_div(@$header_args);
4204
4205        if (ref($content) eq 'CODE') {
4206                $content->(@_);
4207        } elsif (ref($content) eq 'SCALAR') {
4208                print esc_html($$content);
4209        } elsif (ref($content) eq 'GLOB' or ref($content) eq 'IO::Handle') {
4210                print <$content>;
4211        } elsif (!ref($content) && defined($content)) {
4212                print $content;
4213        }
4214
4215        print $cgi->end_div;
4216}
4217
4218sub format_timestamp_html {
4219        my $date = shift;
4220        my $strtime = $date->{'rfc2822'};
4221
4222        my (undef, undef, $datetime_class) =
4223                gitweb_get_feature('javascript-timezone');
4224        if ($datetime_class) {
4225                $strtime = qq!<span class="$datetime_class">$strtime</span>!;
4226        }
4227
4228        my $localtime_format = '(%02d:%02d %s)';
4229        if ($date->{'hour_local'} < 6) {
4230                $localtime_format = '(<span class="atnight">%02d:%02d</span> %s)';
4231        }
4232        $strtime .= ' ' .
4233                    sprintf($localtime_format,
4234                            $date->{'hour_local'}, $date->{'minute_local'}, $date->{'tz_local'});
4235
4236        return $strtime;
4237}
4238
4239# Outputs the author name and date in long form
4240sub git_print_authorship {
4241        my $co = shift;
4242        my %opts = @_;
4243        my $tag = $opts{-tag} || 'div';
4244        my $author = $co->{'author_name'};
4245
4246        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
4247        print "<$tag class=\"author_date\">" .
4248              format_search_author($author, "author", esc_html($author)) .
4249              " [".format_timestamp_html(\%ad)."]".
4250              git_get_avatar($co->{'author_email'}, -pad_before => 1) .
4251              "</$tag>\n";
4252}
4253
4254# Outputs table rows containing the full author or committer information,
4255# in the format expected for 'commit' view (& similar).
4256# Parameters are a commit hash reference, followed by the list of people
4257# to output information for. If the list is empty it defaults to both
4258# author and committer.
4259sub git_print_authorship_rows {
4260        my $co = shift;
4261        # too bad we can't use @people = @_ || ('author', 'committer')
4262        my @people = @_;
4263        @people = ('author', 'committer') unless @people;
4264        foreach my $who (@people) {
4265                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});
4266                print "<tr><td>$who</td><td>" .
4267                      format_search_author($co->{"${who}_name"}, $who,
4268                                           esc_html($co->{"${who}_name"})) . " " .
4269                      format_search_author($co->{"${who}_email"}, $who,
4270                                           esc_html("<" . $co->{"${who}_email"} . ">")) .
4271                      "</td><td rowspan=\"2\">" .
4272                      git_get_avatar($co->{"${who}_email"}, -size => 'double') .
4273                      "</td></tr>\n" .
4274                      "<tr>" .
4275                      "<td></td><td>" .
4276                      format_timestamp_html(\%wd) .
4277                      "</td>" .
4278                      "</tr>\n";
4279        }
4280}
4281
4282sub git_print_page_path {
4283        my $name = shift;
4284        my $type = shift;
4285        my $hb = shift;
4286
4287
4288        print "<div class=\"page_path\">";
4289        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
4290                      -title => 'tree root'}, to_utf8("[$project]"));
4291        print " / ";
4292        if (defined $name) {
4293                my @dirname = split '/', $name;
4294                my $basename = pop @dirname;
4295                my $fullname = '';
4296
4297                foreach my $dir (@dirname) {
4298                        $fullname .= ($fullname ? '/' : '') . $dir;
4299                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
4300                                                     hash_base=>$hb),
4301                                      -title => $fullname}, esc_path($dir));
4302                        print " / ";
4303                }
4304                if (defined $type && $type eq 'blob') {
4305                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$file_name,
4306                                                     hash_base=>$hb),
4307                                      -title => $name}, esc_path($basename));
4308                } elsif (defined $type && $type eq 'tree') {
4309                        print $cgi->a({-href => href(action=>"tree", file_name=>$file_name,
4310                                                     hash_base=>$hb),
4311                                      -title => $name}, esc_path($basename));
4312                        print " / ";
4313                } else {
4314                        print esc_path($basename);
4315                }
4316        }
4317        print "<br/></div>\n";
4318}
4319
4320sub git_print_log {
4321        my $log = shift;
4322        my %opts = @_;
4323
4324        if ($opts{'-remove_title'}) {
4325                # remove title, i.e. first line of log
4326                shift @$log;
4327        }
4328        # remove leading empty lines
4329        while (defined $log->[0] && $log->[0] eq "") {
4330                shift @$log;
4331        }
4332
4333        # print log
4334        my $signoff = 0;
4335        my $empty = 0;
4336        foreach my $line (@$log) {
4337                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
4338                        $signoff = 1;
4339                        $empty = 0;
4340                        if (! $opts{'-remove_signoff'}) {
4341                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
4342                                next;
4343                        } else {
4344                                # remove signoff lines
4345                                next;
4346                        }
4347                } else {
4348                        $signoff = 0;
4349                }
4350
4351                # print only one empty line
4352                # do not print empty line after signoff
4353                if ($line eq "") {
4354                        next if ($empty || $signoff);
4355                        $empty = 1;
4356                } else {
4357                        $empty = 0;
4358                }
4359
4360                print format_log_line_html($line) . "<br/>\n";
4361        }
4362
4363        if ($opts{'-final_empty_line'}) {
4364                # end with single empty line
4365                print "<br/>\n" unless $empty;
4366        }
4367}
4368
4369# return link target (what link points to)
4370sub git_get_link_target {
4371        my $hash = shift;
4372        my $link_target;
4373
4374        # read link
4375        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
4376                or return;
4377        {
4378                local $/ = undef;
4379                $link_target = <$fd>;
4380        }
4381        close $fd
4382                or return;
4383
4384        return $link_target;
4385}
4386
4387# given link target, and the directory (basedir) the link is in,
4388# return target of link relative to top directory (top tree);
4389# return undef if it is not possible (including absolute links).
4390sub normalize_link_target {
4391        my ($link_target, $basedir) = @_;
4392
4393        # absolute symlinks (beginning with '/') cannot be normalized
4394        return if (substr($link_target, 0, 1) eq '/');
4395
4396        # normalize link target to path from top (root) tree (dir)
4397        my $path;
4398        if ($basedir) {
4399                $path = $basedir . '/' . $link_target;
4400        } else {
4401                # we are in top (root) tree (dir)
4402                $path = $link_target;
4403        }
4404
4405        # remove //, /./, and /../
4406        my @path_parts;
4407        foreach my $part (split('/', $path)) {
4408                # discard '.' and ''
4409                next if (!$part || $part eq '.');
4410                # handle '..'
4411                if ($part eq '..') {
4412                        if (@path_parts) {
4413                                pop @path_parts;
4414                        } else {
4415                                # link leads outside repository (outside top dir)
4416                                return;
4417                        }
4418                } else {
4419                        push @path_parts, $part;
4420                }
4421        }
4422        $path = join('/', @path_parts);
4423
4424        return $path;
4425}
4426
4427# print tree entry (row of git_tree), but without encompassing <tr> element
4428sub git_print_tree_entry {
4429        my ($t, $basedir, $hash_base, $have_blame) = @_;
4430
4431        my %base_key = ();
4432        $base_key{'hash_base'} = $hash_base if defined $hash_base;
4433
4434        # The format of a table row is: mode list link.  Where mode is
4435        # the mode of the entry, list is the name of the entry, an href,
4436        # and link is the action links of the entry.
4437
4438        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
4439        if (exists $t->{'size'}) {
4440                print "<td class=\"size\">$t->{'size'}</td>\n";
4441        }
4442        if ($t->{'type'} eq "blob") {
4443                print "<td class=\"list\">" .
4444                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
4445                                               file_name=>"$basedir$t->{'name'}", %base_key),
4446                                -class => "list"}, esc_path($t->{'name'}));
4447                if (S_ISLNK(oct $t->{'mode'})) {
4448                        my $link_target = git_get_link_target($t->{'hash'});
4449                        if ($link_target) {
4450                                my $norm_target = normalize_link_target($link_target, $basedir);
4451                                if (defined $norm_target) {
4452                                        print " -> " .
4453                                              $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
4454                                                                     file_name=>$norm_target),
4455                                                       -title => $norm_target}, esc_path($link_target));
4456                                } else {
4457                                        print " -> " . esc_path($link_target);
4458                                }
4459                        }
4460                }
4461                print "</td>\n";
4462                print "<td class=\"link\">";
4463                print $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
4464                                             file_name=>"$basedir$t->{'name'}", %base_key)},
4465                              "blob");
4466                if ($have_blame) {
4467                        print " | " .
4468                              $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
4469                                                     file_name=>"$basedir$t->{'name'}", %base_key)},
4470                                      "blame");
4471                }
4472                if (defined $hash_base) {
4473                        print " | " .
4474                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
4475                                                     hash=>$t->{'hash'}, file_name=>"$basedir$t->{'name'}")},
4476                                      "history");
4477                }
4478                print " | " .
4479                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
4480                                               file_name=>"$basedir$t->{'name'}")},
4481                                "raw");
4482                print "</td>\n";
4483
4484        } elsif ($t->{'type'} eq "tree") {
4485                print "<td class=\"list\">";
4486                print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
4487                                             file_name=>"$basedir$t->{'name'}",
4488                                             %base_key)},
4489                              esc_path($t->{'name'}));
4490                print "</td>\n";
4491                print "<td class=\"link\">";
4492                print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
4493                                             file_name=>"$basedir$t->{'name'}",
4494                                             %base_key)},
4495                              "tree");
4496                if (defined $hash_base) {
4497                        print " | " .
4498                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
4499                                                     file_name=>"$basedir$t->{'name'}")},
4500                                      "history");
4501                }
4502                print "</td>\n";
4503        } else {
4504                # unknown object: we can only present history for it
4505                # (this includes 'commit' object, i.e. submodule support)
4506                print "<td class=\"list\">" .
4507                      esc_path($t->{'name'}) .
4508                      "</td>\n";
4509                print "<td class=\"link\">";
4510                if (defined $hash_base) {
4511                        print $cgi->a({-href => href(action=>"history",
4512                                                     hash_base=>$hash_base,
4513                                                     file_name=>"$basedir$t->{'name'}")},
4514                                      "history");
4515                }
4516                print "</td>\n";
4517        }
4518}
4519
4520## ......................................................................
4521## functions printing large fragments of HTML
4522
4523# get pre-image filenames for merge (combined) diff
4524sub fill_from_file_info {
4525        my ($diff, @parents) = @_;
4526
4527        $diff->{'from_file'} = [ ];
4528        $diff->{'from_file'}[$diff->{'nparents'} - 1] = undef;
4529        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
4530                if ($diff->{'status'}[$i] eq 'R' ||
4531                    $diff->{'status'}[$i] eq 'C') {
4532                        $diff->{'from_file'}[$i] =
4533                                git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
4534                }
4535        }
4536
4537        return $diff;
4538}
4539
4540# is current raw difftree line of file deletion
4541sub is_deleted {
4542        my $diffinfo = shift;
4543
4544        return $diffinfo->{'to_id'} eq ('0' x 40);
4545}
4546
4547# does patch correspond to [previous] difftree raw line
4548# $diffinfo  - hashref of parsed raw diff format
4549# $patchinfo - hashref of parsed patch diff format
4550#              (the same keys as in $diffinfo)
4551sub is_patch_split {
4552        my ($diffinfo, $patchinfo) = @_;
4553
4554        return defined $diffinfo && defined $patchinfo
4555                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
4556}
4557
4558
4559sub git_difftree_body {
4560        my ($difftree, $hash, @parents) = @_;
4561        my ($parent) = $parents[0];
4562        my $have_blame = gitweb_check_feature('blame');
4563        print "<div class=\"list_head\">\n";
4564        if ($#{$difftree} > 10) {
4565                print(($#{$difftree} + 1) . " files changed:\n");
4566        }
4567        print "</div>\n";
4568
4569        print "<table class=\"" .
4570              (@parents > 1 ? "combined " : "") .
4571              "diff_tree\">\n";
4572
4573        # header only for combined diff in 'commitdiff' view
4574        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
4575        if ($has_header) {
4576                # table header
4577                print "<thead><tr>\n" .
4578                       "<th></th><th></th>\n"; # filename, patchN link
4579                for (my $i = 0; $i < @parents; $i++) {
4580                        my $par = $parents[$i];
4581                        print "<th>" .
4582                              $cgi->a({-href => href(action=>"commitdiff",
4583                                                     hash=>$hash, hash_parent=>$par),
4584                                       -title => 'commitdiff to parent number ' .
4585                                                  ($i+1) . ': ' . substr($par,0,7)},
4586                                      $i+1) .
4587                              "&nbsp;</th>\n";
4588                }
4589                print "</tr></thead>\n<tbody>\n";
4590        }
4591
4592        my $alternate = 1;
4593        my $patchno = 0;
4594        foreach my $line (@{$difftree}) {
4595                my $diff = parsed_difftree_line($line);
4596
4597                if ($alternate) {
4598                        print "<tr class=\"dark\">\n";
4599                } else {
4600                        print "<tr class=\"light\">\n";
4601                }
4602                $alternate ^= 1;
4603
4604                if (exists $diff->{'nparents'}) { # combined diff
4605
4606                        fill_from_file_info($diff, @parents)
4607                                unless exists $diff->{'from_file'};
4608
4609                        if (!is_deleted($diff)) {
4610                                # file exists in the result (child) commit
4611                                print "<td>" .
4612                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4613                                                             file_name=>$diff->{'to_file'},
4614                                                             hash_base=>$hash),
4615                                              -class => "list"}, esc_path($diff->{'to_file'})) .
4616                                      "</td>\n";
4617                        } else {
4618                                print "<td>" .
4619                                      esc_path($diff->{'to_file'}) .
4620                                      "</td>\n";
4621                        }
4622
4623                        if ($action eq 'commitdiff') {
4624                                # link to patch
4625                                $patchno++;
4626                                print "<td class=\"link\">" .
4627                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
4628                                              "patch") .
4629                                      " | " .
4630                                      "</td>\n";
4631                        }
4632
4633                        my $has_history = 0;
4634                        my $not_deleted = 0;
4635                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
4636                                my $hash_parent = $parents[$i];
4637                                my $from_hash = $diff->{'from_id'}[$i];
4638                                my $from_path = $diff->{'from_file'}[$i];
4639                                my $status = $diff->{'status'}[$i];
4640
4641                                $has_history ||= ($status ne 'A');
4642                                $not_deleted ||= ($status ne 'D');
4643
4644                                if ($status eq 'A') {
4645                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
4646                                } elsif ($status eq 'D') {
4647                                        print "<td class=\"link\">" .
4648                                              $cgi->a({-href => href(action=>"blob",
4649                                                                     hash_base=>$hash,
4650                                                                     hash=>$from_hash,
4651                                                                     file_name=>$from_path)},
4652                                                      "blob" . ($i+1)) .
4653                                              " | </td>\n";
4654                                } else {
4655                                        if ($diff->{'to_id'} eq $from_hash) {
4656                                                print "<td class=\"link nochange\">";
4657                                        } else {
4658                                                print "<td class=\"link\">";
4659                                        }
4660                                        print $cgi->a({-href => href(action=>"blobdiff",
4661                                                                     hash=>$diff->{'to_id'},
4662                                                                     hash_parent=>$from_hash,
4663                                                                     hash_base=>$hash,
4664                                                                     hash_parent_base=>$hash_parent,
4665                                                                     file_name=>$diff->{'to_file'},
4666                                                                     file_parent=>$from_path)},
4667                                                      "diff" . ($i+1)) .
4668                                              " | </td>\n";
4669                                }
4670                        }
4671
4672                        print "<td class=\"link\">";
4673                        if ($not_deleted) {
4674                                print $cgi->a({-href => href(action=>"blob",
4675                                                             hash=>$diff->{'to_id'},
4676                                                             file_name=>$diff->{'to_file'},
4677                                                             hash_base=>$hash)},
4678                                              "blob");
4679                                print " | " if ($has_history);
4680                        }
4681                        if ($has_history) {
4682                                print $cgi->a({-href => href(action=>"history",
4683                                                             file_name=>$diff->{'to_file'},
4684                                                             hash_base=>$hash)},
4685                                              "history");
4686                        }
4687                        print "</td>\n";
4688
4689                        print "</tr>\n";
4690                        next; # instead of 'else' clause, to avoid extra indent
4691                }
4692                # else ordinary diff
4693
4694                my ($to_mode_oct, $to_mode_str, $to_file_type);
4695                my ($from_mode_oct, $from_mode_str, $from_file_type);
4696                if ($diff->{'to_mode'} ne ('0' x 6)) {
4697                        $to_mode_oct = oct $diff->{'to_mode'};
4698                        if (S_ISREG($to_mode_oct)) { # only for regular file
4699                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
4700                        }
4701                        $to_file_type = file_type($diff->{'to_mode'});
4702                }
4703                if ($diff->{'from_mode'} ne ('0' x 6)) {
4704                        $from_mode_oct = oct $diff->{'from_mode'};
4705                        if (S_ISREG($from_mode_oct)) { # only for regular file
4706                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
4707                        }
4708                        $from_file_type = file_type($diff->{'from_mode'});
4709                }
4710
4711                if ($diff->{'status'} eq "A") { # created
4712                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
4713                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
4714                        $mode_chng   .= "]</span>";
4715                        print "<td>";
4716                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4717                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
4718                                      -class => "list"}, esc_path($diff->{'file'}));
4719                        print "</td>\n";
4720                        print "<td>$mode_chng</td>\n";
4721                        print "<td class=\"link\">";
4722                        if ($action eq 'commitdiff') {
4723                                # link to patch
4724                                $patchno++;
4725                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4726                                              "patch") .
4727                                      " | ";
4728                        }
4729                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4730                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
4731                                      "blob");
4732                        print "</td>\n";
4733
4734                } elsif ($diff->{'status'} eq "D") { # deleted
4735                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
4736                        print "<td>";
4737                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4738                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
4739                                       -class => "list"}, esc_path($diff->{'file'}));
4740                        print "</td>\n";
4741                        print "<td>$mode_chng</td>\n";
4742                        print "<td class=\"link\">";
4743                        if ($action eq 'commitdiff') {
4744                                # link to patch
4745                                $patchno++;
4746                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4747                                              "patch") .
4748                                      " | ";
4749                        }
4750                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4751                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
4752                                      "blob") . " | ";
4753                        if ($have_blame) {
4754                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
4755                                                             file_name=>$diff->{'file'})},
4756                                              "blame") . " | ";
4757                        }
4758                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
4759                                                     file_name=>$diff->{'file'})},
4760                                      "history");
4761                        print "</td>\n";
4762
4763                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
4764                        my $mode_chnge = "";
4765                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4766                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
4767                                if ($from_file_type ne $to_file_type) {
4768                                        $mode_chnge .= " from $from_file_type to $to_file_type";
4769                                }
4770                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
4771                                        if ($from_mode_str && $to_mode_str) {
4772                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
4773                                        } elsif ($to_mode_str) {
4774                                                $mode_chnge .= " mode: $to_mode_str";
4775                                        }
4776                                }
4777                                $mode_chnge .= "]</span>\n";
4778                        }
4779                        print "<td>";
4780                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4781                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
4782                                      -class => "list"}, esc_path($diff->{'file'}));
4783                        print "</td>\n";
4784                        print "<td>$mode_chnge</td>\n";
4785                        print "<td class=\"link\">";
4786                        if ($action eq 'commitdiff') {
4787                                # link to patch
4788                                $patchno++;
4789                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4790                                              "patch") .
4791                                      " | ";
4792                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4793                                # "commit" view and modified file (not onlu mode changed)
4794                                print $cgi->a({-href => href(action=>"blobdiff",
4795                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4796                                                             hash_base=>$hash, hash_parent_base=>$parent,
4797                                                             file_name=>$diff->{'file'})},
4798                                              "diff") .
4799                                      " | ";
4800                        }
4801                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4802                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
4803                                       "blob") . " | ";
4804                        if ($have_blame) {
4805                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4806                                                             file_name=>$diff->{'file'})},
4807                                              "blame") . " | ";
4808                        }
4809                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4810                                                     file_name=>$diff->{'file'})},
4811                                      "history");
4812                        print "</td>\n";
4813
4814                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
4815                        my %status_name = ('R' => 'moved', 'C' => 'copied');
4816                        my $nstatus = $status_name{$diff->{'status'}};
4817                        my $mode_chng = "";
4818                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4819                                # mode also for directories, so we cannot use $to_mode_str
4820                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
4821                        }
4822                        print "<td>" .
4823                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
4824                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
4825                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
4826                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
4827                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
4828                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
4829                                      -class => "list"}, esc_path($diff->{'from_file'})) .
4830                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
4831                              "<td class=\"link\">";
4832                        if ($action eq 'commitdiff') {
4833                                # link to patch
4834                                $patchno++;
4835                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4836                                              "patch") .
4837                                      " | ";
4838                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4839                                # "commit" view and modified file (not only pure rename or copy)
4840                                print $cgi->a({-href => href(action=>"blobdiff",
4841                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4842                                                             hash_base=>$hash, hash_parent_base=>$parent,
4843                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
4844                                              "diff") .
4845                                      " | ";
4846                        }
4847                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4848                                                     hash_base=>$parent, file_name=>$diff->{'to_file'})},
4849                                      "blob") . " | ";
4850                        if ($have_blame) {
4851                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4852                                                             file_name=>$diff->{'to_file'})},
4853                                              "blame") . " | ";
4854                        }
4855                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4856                                                    file_name=>$diff->{'to_file'})},
4857                                      "history");
4858                        print "</td>\n";
4859
4860                } # we should not encounter Unmerged (U) or Unknown (X) status
4861                print "</tr>\n";
4862        }
4863        print "</tbody>" if $has_header;
4864        print "</table>\n";
4865}
4866
4867sub print_sidebyside_diff_chunk {
4868        my @chunk = @_;
4869        my (@ctx, @rem, @add);
4870
4871        return unless @chunk;
4872
4873        # incomplete last line might be among removed or added lines,
4874        # or both, or among context lines: find which
4875        for (my $i = 1; $i < @chunk; $i++) {
4876                if ($chunk[$i][0] eq 'incomplete') {
4877                        $chunk[$i][0] = $chunk[$i-1][0];
4878                }
4879        }
4880
4881        # guardian
4882        push @chunk, ["", ""];
4883
4884        foreach my $line_info (@chunk) {
4885                my ($class, $line) = @$line_info;
4886
4887                # print chunk headers
4888                if ($class && $class eq 'chunk_header') {
4889                        print $line;
4890                        next;
4891                }
4892
4893                ## print from accumulator when type of class of lines change
4894                # empty contents block on start rem/add block, or end of chunk
4895                if (@ctx && (!$class || $class eq 'rem' || $class eq 'add')) {
4896                        print join '',
4897                                '<div class="chunk_block ctx">',
4898                                        '<div class="old">',
4899                                        @ctx,
4900                                        '</div>',
4901                                        '<div class="new">',
4902                                        @ctx,
4903                                        '</div>',
4904                                '</div>';
4905                        @ctx = ();
4906                }
4907                # empty add/rem block on start context block, or end of chunk
4908                if ((@rem || @add) && (!$class || $class eq 'ctx')) {
4909                        if (!@add) {
4910                                # pure removal
4911                                print join '',
4912                                        '<div class="chunk_block rem">',
4913                                                '<div class="old">',
4914                                                @rem,
4915                                                '</div>',
4916                                        '</div>';
4917                        } elsif (!@rem) {
4918                                # pure addition
4919                                print join '',
4920                                        '<div class="chunk_block add">',
4921                                                '<div class="new">',
4922                                                @add,
4923                                                '</div>',
4924                                        '</div>';
4925                        } else {
4926                                # assume that it is change
4927                                print join '',
4928                                        '<div class="chunk_block chg">',
4929                                                '<div class="old">',
4930                                                @rem,
4931                                                '</div>',
4932                                                '<div class="new">',
4933                                                @add,
4934                                                '</div>',
4935                                        '</div>';
4936                        }
4937                        @rem = @add = ();
4938                }
4939
4940                ## adding lines to accumulator
4941                # guardian value
4942                last unless $line;
4943                # rem, add or change
4944                if ($class eq 'rem') {
4945                        push @rem, $line;
4946                } elsif ($class eq 'add') {
4947                        push @add, $line;
4948                }
4949                # context line
4950                if ($class eq 'ctx') {
4951                        push @ctx, $line;
4952                }
4953        }
4954}
4955
4956sub git_patchset_body {
4957        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;
4958        my ($hash_parent) = $hash_parents[0];
4959
4960        my $is_combined = (@hash_parents > 1);
4961        my $patch_idx = 0;
4962        my $patch_number = 0;
4963        my $patch_line;
4964        my $diffinfo;
4965        my $to_name;
4966        my (%from, %to);
4967        my @chunk; # for side-by-side diff
4968
4969        print "<div class=\"patchset\">\n";
4970
4971        # skip to first patch
4972        while ($patch_line = <$fd>) {
4973                chomp $patch_line;
4974
4975                last if ($patch_line =~ m/^diff /);
4976        }
4977
4978 PATCH:
4979        while ($patch_line) {
4980
4981                # parse "git diff" header line
4982                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
4983                        # $1 is from_name, which we do not use
4984                        $to_name = unquote($2);
4985                        $to_name =~ s!^b/!!;
4986                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
4987                        # $1 is 'cc' or 'combined', which we do not use
4988                        $to_name = unquote($2);
4989                } else {
4990                        $to_name = undef;
4991                }
4992
4993                # check if current patch belong to current raw line
4994                # and parse raw git-diff line if needed
4995                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
4996                        # this is continuation of a split patch
4997                        print "<div class=\"patch cont\">\n";
4998                } else {
4999                        # advance raw git-diff output if needed
5000                        $patch_idx++ if defined $diffinfo;
5001
5002                        # read and prepare patch information
5003                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5004
5005                        # compact combined diff output can have some patches skipped
5006                        # find which patch (using pathname of result) we are at now;
5007                        if ($is_combined) {
5008                                while ($to_name ne $diffinfo->{'to_file'}) {
5009                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5010                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
5011                                              "</div>\n";  # class="patch"
5012
5013                                        $patch_idx++;
5014                                        $patch_number++;
5015
5016                                        last if $patch_idx > $#$difftree;
5017                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5018                                }
5019                        }
5020
5021                        # modifies %from, %to hashes
5022                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);
5023
5024                        # this is first patch for raw difftree line with $patch_idx index
5025                        # we index @$difftree array from 0, but number patches from 1
5026                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
5027                }
5028
5029                # git diff header
5030                #assert($patch_line =~ m/^diff /) if DEBUG;
5031                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
5032                $patch_number++;
5033                # print "git diff" header
5034                print format_git_diff_header_line($patch_line, $diffinfo,
5035                                                  \%from, \%to);
5036
5037                # print extended diff header
5038                print "<div class=\"diff extended_header\">\n";
5039        EXTENDED_HEADER:
5040                while ($patch_line = <$fd>) {
5041                        chomp $patch_line;
5042
5043                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);
5044
5045                        print format_extended_diff_header_line($patch_line, $diffinfo,
5046                                                               \%from, \%to);
5047                }
5048                print "</div>\n"; # class="diff extended_header"
5049
5050                # from-file/to-file diff header
5051                if (! $patch_line) {
5052                        print "</div>\n"; # class="patch"
5053                        last PATCH;
5054                }
5055                next PATCH if ($patch_line =~ m/^diff /);
5056                #assert($patch_line =~ m/^---/) if DEBUG;
5057
5058                my $last_patch_line = $patch_line;
5059                $patch_line = <$fd>;
5060                chomp $patch_line;
5061                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;
5062
5063                print format_diff_from_to_header($last_patch_line, $patch_line,
5064                                                 $diffinfo, \%from, \%to,
5065                                                 @hash_parents);
5066
5067                # the patch itself
5068        LINE:
5069                while ($patch_line = <$fd>) {
5070                        chomp $patch_line;
5071
5072                        next PATCH if ($patch_line =~ m/^diff /);
5073
5074                        my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
5075                        my $diff_classes = "diff";
5076                        $diff_classes .= " $class" if ($class);
5077                        $line = "<div class=\"$diff_classes\">$line</div>\n";
5078
5079                        if ($diff_style eq 'sidebyside' && !$is_combined) {
5080                                if ($class eq 'chunk_header') {
5081                                        print_sidebyside_diff_chunk(@chunk);
5082                                        @chunk = ( [ $class, $line ] );
5083                                } else {
5084                                        push @chunk, [ $class, $line ];
5085                                }
5086                        } else {
5087                                # default 'inline' style and unknown styles
5088                                print $line;
5089                        }
5090                }
5091
5092        } continue {
5093                if (@chunk) {
5094                        print_sidebyside_diff_chunk(@chunk);
5095                        @chunk = ();
5096                }
5097                print "</div>\n"; # class="patch"
5098        }
5099
5100        # for compact combined (--cc) format, with chunk and patch simplification
5101        # the patchset might be empty, but there might be unprocessed raw lines
5102        for (++$patch_idx if $patch_number > 0;
5103             $patch_idx < @$difftree;
5104             ++$patch_idx) {
5105                # read and prepare patch information
5106                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5107
5108                # generate anchor for "patch" links in difftree / whatchanged part
5109                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5110                      format_diff_cc_simplified($diffinfo, @hash_parents) .
5111                      "</div>\n";  # class="patch"
5112
5113                $patch_number++;
5114        }
5115
5116        if ($patch_number == 0) {
5117                if (@hash_parents > 1) {
5118                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
5119                } else {
5120                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
5121                }
5122        }
5123
5124        print "</div>\n"; # class="patchset"
5125}
5126
5127# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5128
5129# fills project list info (age, description, owner, category, forks)
5130# for each project in the list, removing invalid projects from
5131# returned list
5132# NOTE: modifies $projlist, but does not remove entries from it
5133sub fill_project_list_info {
5134        my $projlist = shift;
5135        my @projects;
5136
5137        my $show_ctags = gitweb_check_feature('ctags');
5138 PROJECT:
5139        foreach my $pr (@$projlist) {
5140                my (@activity) = git_get_last_activity($pr->{'path'});
5141                unless (@activity) {
5142                        next PROJECT;
5143                }
5144                ($pr->{'age'}, $pr->{'age_string'}) = @activity;
5145                if (!defined $pr->{'descr'}) {
5146                        my $descr = git_get_project_description($pr->{'path'}) || "";
5147                        $descr = to_utf8($descr);
5148                        $pr->{'descr_long'} = $descr;
5149                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
5150                }
5151                if (!defined $pr->{'owner'}) {
5152                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
5153                }
5154                if ($show_ctags) {
5155                        $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
5156                }
5157                if ($projects_list_group_categories && !defined $pr->{'category'}) {
5158                        my $cat = git_get_project_category($pr->{'path'}) ||
5159                                                           $project_list_default_category;
5160                        $pr->{'category'} = to_utf8($cat);
5161                }
5162
5163                push @projects, $pr;
5164        }
5165
5166        return @projects;
5167}
5168
5169sub sort_projects_list {
5170        my ($projlist, $order) = @_;
5171        my @projects;
5172
5173        my %order_info = (
5174                project => { key => 'path', type => 'str' },
5175                descr => { key => 'descr_long', type => 'str' },
5176                owner => { key => 'owner', type => 'str' },
5177                age => { key => 'age', type => 'num' }
5178        );
5179        my $oi = $order_info{$order};
5180        return @$projlist unless defined $oi;
5181        if ($oi->{'type'} eq 'str') {
5182                @projects = sort {$a->{$oi->{'key'}} cmp $b->{$oi->{'key'}}} @$projlist;
5183        } else {
5184                @projects = sort {$a->{$oi->{'key'}} <=> $b->{$oi->{'key'}}} @$projlist;
5185        }
5186
5187        return @projects;
5188}
5189
5190# returns a hash of categories, containing the list of project
5191# belonging to each category
5192sub build_projlist_by_category {
5193        my ($projlist, $from, $to) = @_;
5194        my %categories;
5195
5196        $from = 0 unless defined $from;
5197        $to = $#$projlist if (!defined $to || $#$projlist < $to);
5198
5199        for (my $i = $from; $i <= $to; $i++) {
5200                my $pr = $projlist->[$i];
5201                push @{$categories{ $pr->{'category'} }}, $pr;
5202        }
5203
5204        return wantarray ? %categories : \%categories;
5205}
5206
5207# print 'sort by' <th> element, generating 'sort by $name' replay link
5208# if that order is not selected
5209sub print_sort_th {
5210        print format_sort_th(@_);
5211}
5212
5213sub format_sort_th {
5214        my ($name, $order, $header) = @_;
5215        my $sort_th = "";
5216        $header ||= ucfirst($name);
5217
5218        if ($order eq $name) {
5219                $sort_th .= "<th>$header</th>\n";
5220        } else {
5221                $sort_th .= "<th>" .
5222                            $cgi->a({-href => href(-replay=>1, order=>$name),
5223                                     -class => "header"}, $header) .
5224                            "</th>\n";
5225        }
5226
5227        return $sort_th;
5228}
5229
5230sub git_project_list_rows {
5231        my ($projlist, $from, $to, $check_forks) = @_;
5232
5233        $from = 0 unless defined $from;
5234        $to = $#$projlist if (!defined $to || $#$projlist < $to);
5235
5236        my $alternate = 1;
5237        for (my $i = $from; $i <= $to; $i++) {
5238                my $pr = $projlist->[$i];
5239
5240                if ($alternate) {
5241                        print "<tr class=\"dark\">\n";
5242                } else {
5243                        print "<tr class=\"light\">\n";
5244                }
5245                $alternate ^= 1;
5246
5247                if ($check_forks) {
5248                        print "<td>";
5249                        if ($pr->{'forks'}) {
5250                                my $nforks = scalar @{$pr->{'forks'}};
5251                                if ($nforks > 0) {
5252                                        print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
5253                                                       -title => "$nforks forks"}, "+");
5254                                } else {
5255                                        print $cgi->span({-title => "$nforks forks"}, "+");
5256                                }
5257                        }
5258                        print "</td>\n";
5259                }
5260                print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
5261                                        -class => "list"}, esc_html($pr->{'path'})) . "</td>\n" .
5262                      "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
5263                                        -class => "list", -title => $pr->{'descr_long'}},
5264                                        esc_html($pr->{'descr'})) . "</td>\n" .
5265                      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
5266                print "<td class=\"". age_class($pr->{'age'}) . "\">" .
5267                      (defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits") . "</td>\n" .
5268                      "<td class=\"link\">" .
5269                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary")}, "summary")   . " | " .
5270                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"shortlog")}, "shortlog") . " | " .
5271                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"log")}, "log") . " | " .
5272                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"tree")}, "tree") .
5273                      ($pr->{'forks'} ? " | " . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks") : '') .
5274                      "</td>\n" .
5275                      "</tr>\n";
5276        }
5277}
5278
5279sub git_project_list_body {
5280        # actually uses global variable $project
5281        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
5282        my @projects = @$projlist;
5283
5284        my $check_forks = gitweb_check_feature('forks');
5285        my $show_ctags  = gitweb_check_feature('ctags');
5286        my $tagfilter = $show_ctags ? $cgi->param('by_tag') : undef;
5287        $check_forks = undef
5288                if ($tagfilter || $searchtext);
5289
5290        # filtering out forks before filling info allows to do less work
5291        @projects = filter_forks_from_projects_list(\@projects)
5292                if ($check_forks);
5293        @projects = fill_project_list_info(\@projects);
5294        # searching projects require filling to be run before it
5295        @projects = search_projects_list(\@projects,
5296                                         'searchtext' => $searchtext,
5297                                         'tagfilter'  => $tagfilter)
5298                if ($tagfilter || $searchtext);
5299
5300        $order ||= $default_projects_order;
5301        $from = 0 unless defined $from;
5302        $to = $#projects if (!defined $to || $#projects < $to);
5303
5304        # short circuit
5305        if ($from > $to) {
5306                print "<center>\n".
5307                      "<b>No such projects found</b><br />\n".
5308                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
5309                      "</center>\n<br />\n";
5310                return;
5311        }
5312
5313        @projects = sort_projects_list(\@projects, $order);
5314
5315        if ($show_ctags) {
5316                my $ctags = git_gather_all_ctags(\@projects);
5317                my $cloud = git_populate_project_tagcloud($ctags);
5318                print git_show_project_tagcloud($cloud, 64);
5319        }
5320
5321        print "<table class=\"project_list\">\n";
5322        unless ($no_header) {
5323                print "<tr>\n";
5324                if ($check_forks) {
5325                        print "<th></th>\n";
5326                }
5327                print_sort_th('project', $order, 'Project');
5328                print_sort_th('descr', $order, 'Description');
5329                print_sort_th('owner', $order, 'Owner');
5330                print_sort_th('age', $order, 'Last Change');
5331                print "<th></th>\n" . # for links
5332                      "</tr>\n";
5333        }
5334
5335        if ($projects_list_group_categories) {
5336                # only display categories with projects in the $from-$to window
5337                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
5338                my %categories = build_projlist_by_category(\@projects, $from, $to);
5339                foreach my $cat (sort keys %categories) {
5340                        unless ($cat eq "") {
5341                                print "<tr>\n";
5342                                if ($check_forks) {
5343                                        print "<td></td>\n";
5344                                }
5345                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
5346                                print "</tr>\n";
5347                        }
5348
5349                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
5350                }
5351        } else {
5352                git_project_list_rows(\@projects, $from, $to, $check_forks);
5353        }
5354
5355        if (defined $extra) {
5356                print "<tr>\n";
5357                if ($check_forks) {
5358                        print "<td></td>\n";
5359                }
5360                print "<td colspan=\"5\">$extra</td>\n" .
5361                      "</tr>\n";
5362        }
5363        print "</table>\n";
5364}
5365
5366sub git_log_body {
5367        # uses global variable $project
5368        my ($commitlist, $from, $to, $refs, $extra) = @_;
5369
5370        $from = 0 unless defined $from;
5371        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);
5372
5373        for (my $i = 0; $i <= $to; $i++) {
5374                my %co = %{$commitlist->[$i]};
5375                next if !%co;
5376                my $commit = $co{'id'};
5377                my $ref = format_ref_marker($refs, $commit);
5378                git_print_header_div('commit',
5379                               "<span class=\"age\">$co{'age_string'}</span>" .
5380                               esc_html($co{'title'}) . $ref,
5381                               $commit);
5382                print "<div class=\"title_text\">\n" .
5383                      "<div class=\"log_link\">\n" .
5384                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
5385                      " | " .
5386                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
5387                      " | " .
5388                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
5389                      "<br/>\n" .
5390                      "</div>\n";
5391                      git_print_authorship(\%co, -tag => 'span');
5392                      print "<br/>\n</div>\n";
5393
5394                print "<div class=\"log_body\">\n";
5395                git_print_log($co{'comment'}, -final_empty_line=> 1);
5396                print "</div>\n";
5397        }
5398        if ($extra) {
5399                print "<div class=\"page_nav\">\n";
5400                print "$extra\n";
5401                print "</div>\n";
5402        }
5403}
5404
5405sub git_shortlog_body {
5406        # uses global variable $project
5407        my ($commitlist, $from, $to, $refs, $extra) = @_;
5408
5409        $from = 0 unless defined $from;
5410        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);
5411
5412        print "<table class=\"shortlog\">\n";
5413        my $alternate = 1;
5414        for (my $i = $from; $i <= $to; $i++) {
5415                my %co = %{$commitlist->[$i]};
5416                my $commit = $co{'id'};
5417                my $ref = format_ref_marker($refs, $commit);
5418                if ($alternate) {
5419                        print "<tr class=\"dark\">\n";
5420                } else {
5421                        print "<tr class=\"light\">\n";
5422                }
5423                $alternate ^= 1;
5424                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
5425                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
5426                      format_author_html('td', \%co, 10) . "<td>";
5427                print format_subject_html($co{'title'}, $co{'title_short'},
5428                                          href(action=>"commit", hash=>$commit), $ref);
5429                print "</td>\n" .
5430                      "<td class=\"link\">" .
5431                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") . " | " .
5432                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") . " | " .
5433                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
5434                my $snapshot_links = format_snapshot_links($commit);
5435                if (defined $snapshot_links) {
5436                        print " | " . $snapshot_links;
5437                }
5438                print "</td>\n" .
5439                      "</tr>\n";
5440        }
5441        if (defined $extra) {
5442                print "<tr>\n" .
5443                      "<td colspan=\"4\">$extra</td>\n" .
5444                      "</tr>\n";
5445        }
5446        print "</table>\n";
5447}
5448
5449sub git_history_body {
5450        # Warning: assumes constant type (blob or tree) during history
5451        my ($commitlist, $from, $to, $refs, $extra,
5452            $file_name, $file_hash, $ftype) = @_;
5453
5454        $from = 0 unless defined $from;
5455        $to = $#{$commitlist} unless (defined $to && $to <= $#{$commitlist});
5456
5457        print "<table class=\"history\">\n";
5458        my $alternate = 1;
5459        for (my $i = $from; $i <= $to; $i++) {
5460                my %co = %{$commitlist->[$i]};
5461                if (!%co) {
5462                        next;
5463                }
5464                my $commit = $co{'id'};
5465
5466                my $ref = format_ref_marker($refs, $commit);
5467
5468                if ($alternate) {
5469                        print "<tr class=\"dark\">\n";
5470                } else {
5471                        print "<tr class=\"light\">\n";
5472                }
5473                $alternate ^= 1;
5474                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
5475        # shortlog:   format_author_html('td', \%co, 10)
5476                      format_author_html('td', \%co, 15, 3) . "<td>";
5477                # originally git_history used chop_str($co{'title'}, 50)
5478                print format_subject_html($co{'title'}, $co{'title_short'},
5479                                          href(action=>"commit", hash=>$commit), $ref);
5480                print "</td>\n" .
5481                      "<td class=\"link\">" .
5482                      $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype) . " | " .
5483                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
5484
5485                if ($ftype eq 'blob') {
5486                        my $blob_current = $file_hash;
5487                        my $blob_parent  = git_get_hash_by_path($commit, $file_name);
5488                        if (defined $blob_current && defined $blob_parent &&
5489                                        $blob_current ne $blob_parent) {
5490                                print " | " .
5491                                        $cgi->a({-href => href(action=>"blobdiff",
5492                                                               hash=>$blob_current, hash_parent=>$blob_parent,
5493                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
5494                                                               file_name=>$file_name)},
5495                                                "diff to current");
5496                        }
5497                }
5498                print "</td>\n" .
5499                      "</tr>\n";
5500        }
5501        if (defined $extra) {
5502                print "<tr>\n" .
5503                      "<td colspan=\"4\">$extra</td>\n" .
5504                      "</tr>\n";
5505        }
5506        print "</table>\n";
5507}
5508
5509sub git_tags_body {
5510        # uses global variable $project
5511        my ($taglist, $from, $to, $extra) = @_;
5512        $from = 0 unless defined $from;
5513        $to = $#{$taglist} if (!defined $to || $#{$taglist} < $to);
5514
5515        print "<table class=\"tags\">\n";
5516        my $alternate = 1;
5517        for (my $i = $from; $i <= $to; $i++) {
5518                my $entry = $taglist->[$i];
5519                my %tag = %$entry;
5520                my $comment = $tag{'subject'};
5521                my $comment_short;
5522                if (defined $comment) {
5523                        $comment_short = chop_str($comment, 30, 5);
5524                }
5525                if ($alternate) {
5526                        print "<tr class=\"dark\">\n";
5527                } else {
5528                        print "<tr class=\"light\">\n";
5529                }
5530                $alternate ^= 1;
5531                if (defined $tag{'age'}) {
5532                        print "<td><i>$tag{'age'}</i></td>\n";
5533                } else {
5534                        print "<td></td>\n";
5535                }
5536                print "<td>" .
5537                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
5538                               -class => "list name"}, esc_html($tag{'name'})) .
5539                      "</td>\n" .
5540                      "<td>";
5541                if (defined $comment) {
5542                        print format_subject_html($comment, $comment_short,
5543                                                  href(action=>"tag", hash=>$tag{'id'}));
5544                }
5545                print "</td>\n" .
5546                      "<td class=\"selflink\">";
5547                if ($tag{'type'} eq "tag") {
5548                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
5549                } else {
5550                        print "&nbsp;";
5551                }
5552                print "</td>\n" .
5553                      "<td class=\"link\">" . " | " .
5554                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
5555                if ($tag{'reftype'} eq "commit") {
5556                        print " | " . $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog") .
5557                              " | " . $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
5558                } elsif ($tag{'reftype'} eq "blob") {
5559                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
5560                }
5561                print "</td>\n" .
5562                      "</tr>";
5563        }
5564        if (defined $extra) {
5565                print "<tr>\n" .
5566                      "<td colspan=\"5\">$extra</td>\n" .
5567                      "</tr>\n";
5568        }
5569        print "</table>\n";
5570}
5571
5572sub git_heads_body {
5573        # uses global variable $project
5574        my ($headlist, $head, $from, $to, $extra) = @_;
5575        $from = 0 unless defined $from;
5576        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);
5577
5578        print "<table class=\"heads\">\n";
5579        my $alternate = 1;
5580        for (my $i = $from; $i <= $to; $i++) {
5581                my $entry = $headlist->[$i];
5582                my %ref = %$entry;
5583                my $curr = $ref{'id'} eq $head;
5584                if ($alternate) {
5585                        print "<tr class=\"dark\">\n";
5586                } else {
5587                        print "<tr class=\"light\">\n";
5588                }
5589                $alternate ^= 1;
5590                print "<td><i>$ref{'age'}</i></td>\n" .
5591                      ($curr ? "<td class=\"current_head\">" : "<td>") .
5592                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
5593                               -class => "list name"},esc_html($ref{'name'})) .
5594                      "</td>\n" .
5595                      "<td class=\"link\">" .
5596                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
5597                      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
5598                      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
5599                      "</td>\n" .
5600                      "</tr>";
5601        }
5602        if (defined $extra) {
5603                print "<tr>\n" .
5604                      "<td colspan=\"3\">$extra</td>\n" .
5605                      "</tr>\n";
5606        }
5607        print "</table>\n";
5608}
5609
5610# Display a single remote block
5611sub git_remote_block {
5612        my ($remote, $rdata, $limit, $head) = @_;
5613
5614        my $heads = $rdata->{'heads'};
5615        my $fetch = $rdata->{'fetch'};
5616        my $push = $rdata->{'push'};
5617
5618        my $urls_table = "<table class=\"projects_list\">\n" ;
5619
5620        if (defined $fetch) {
5621                if ($fetch eq $push) {
5622                        $urls_table .= format_repo_url("URL", $fetch);
5623                } else {
5624                        $urls_table .= format_repo_url("Fetch URL", $fetch);
5625                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
5626                }
5627        } elsif (defined $push) {
5628                $urls_table .= format_repo_url("Push URL", $push);
5629        } else {
5630                $urls_table .= format_repo_url("", "No remote URL");
5631        }
5632
5633        $urls_table .= "</table>\n";
5634
5635        my $dots;
5636        if (defined $limit && $limit < @$heads) {
5637                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
5638        }
5639
5640        print $urls_table;
5641        git_heads_body($heads, $head, 0, $limit, $dots);
5642}
5643
5644# Display a list of remote names with the respective fetch and push URLs
5645sub git_remotes_list {
5646        my ($remotedata, $limit) = @_;
5647        print "<table class=\"heads\">\n";
5648        my $alternate = 1;
5649        my @remotes = sort keys %$remotedata;
5650
5651        my $limited = $limit && $limit < @remotes;
5652
5653        $#remotes = $limit - 1 if $limited;
5654
5655        while (my $remote = shift @remotes) {
5656                my $rdata = $remotedata->{$remote};
5657                my $fetch = $rdata->{'fetch'};
5658                my $push = $rdata->{'push'};
5659                if ($alternate) {
5660                        print "<tr class=\"dark\">\n";
5661                } else {
5662                        print "<tr class=\"light\">\n";
5663                }
5664                $alternate ^= 1;
5665                print "<td>" .
5666                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
5667                               -class=> "list name"},esc_html($remote)) .
5668                      "</td>";
5669                print "<td class=\"link\">" .
5670                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
5671                      " | " .
5672                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
5673                      "</td>";
5674
5675                print "</tr>\n";
5676        }
5677
5678        if ($limited) {
5679                print "<tr>\n" .
5680                      "<td colspan=\"3\">" .
5681                      $cgi->a({-href => href(action=>"remotes")}, "...") .
5682                      "</td>\n" . "</tr>\n";
5683        }
5684
5685        print "</table>";
5686}
5687
5688# Display remote heads grouped by remote, unless there are too many
5689# remotes, in which case we only display the remote names
5690sub git_remotes_body {
5691        my ($remotedata, $limit, $head) = @_;
5692        if ($limit and $limit < keys %$remotedata) {
5693                git_remotes_list($remotedata, $limit);
5694        } else {
5695                fill_remote_heads($remotedata);
5696                while (my ($remote, $rdata) = each %$remotedata) {
5697                        git_print_section({-class=>"remote", -id=>$remote},
5698                                ["remotes", $remote, $remote], sub {
5699                                        git_remote_block($remote, $rdata, $limit, $head);
5700                                });
5701                }
5702        }
5703}
5704
5705sub git_search_message {
5706        my %co = @_;
5707
5708        my $greptype;
5709        if ($searchtype eq 'commit') {
5710                $greptype = "--grep=";
5711        } elsif ($searchtype eq 'author') {
5712                $greptype = "--author=";
5713        } elsif ($searchtype eq 'committer') {
5714                $greptype = "--committer=";
5715        }
5716        $greptype .= $searchtext;
5717        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
5718                                       $greptype, '--regexp-ignore-case',
5719                                       $search_use_regexp ? '--extended-regexp' : '--fixed-strings');
5720
5721        my $paging_nav = '';
5722        if ($page > 0) {
5723                $paging_nav .=
5724                        $cgi->a({-href => href(-replay=>1, page=>undef)},
5725                                "first") .
5726                        " &sdot; " .
5727                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
5728                                 -accesskey => "p", -title => "Alt-p"}, "prev");
5729        } else {
5730                $paging_nav .= "first &sdot; prev";
5731        }
5732        my $next_link = '';
5733        if ($#commitlist >= 100) {
5734                $next_link =
5735                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
5736                                 -accesskey => "n", -title => "Alt-n"}, "next");
5737                $paging_nav .= " &sdot; $next_link";
5738        } else {
5739                $paging_nav .= " &sdot; next";
5740        }
5741
5742        git_header_html();
5743
5744        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
5745        git_print_header_div('commit', esc_html($co{'title'}), $hash);
5746        if ($page == 0 && !@commitlist) {
5747                print "<p>No match.</p>\n";
5748        } else {
5749                git_search_grep_body(\@commitlist, 0, 99, $next_link);
5750        }
5751
5752        git_footer_html();
5753}
5754
5755sub git_search_changes {
5756        my %co = @_;
5757
5758        local $/ = "\n";
5759        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
5760                '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
5761                ($search_use_regexp ? '--pickaxe-regex' : ())
5762                        or die_error(500, "Open git-log failed");
5763
5764        git_header_html();
5765
5766        git_print_page_nav('','', $hash,$co{'tree'},$hash);
5767        git_print_header_div('commit', esc_html($co{'title'}), $hash);
5768
5769        print "<table class=\"pickaxe search\">\n";
5770        my $alternate = 1;
5771        undef %co;
5772        my @files;
5773        while (my $line = <$fd>) {
5774                chomp $line;
5775                next unless $line;
5776
5777                my %set = parse_difftree_raw_line($line);
5778                if (defined $set{'commit'}) {
5779                        # finish previous commit
5780                        if (%co) {
5781                                print "</td>\n" .
5782                                      "<td class=\"link\">" .
5783                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
5784                                              "commit") .
5785                                      " | " .
5786                                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
5787                                                             hash_base=>$co{'id'})},
5788                                              "tree") .
5789                                      "</td>\n" .
5790                                      "</tr>\n";
5791                        }
5792
5793                        if ($alternate) {
5794                                print "<tr class=\"dark\">\n";
5795                        } else {
5796                                print "<tr class=\"light\">\n";
5797                        }
5798                        $alternate ^= 1;
5799                        %co = parse_commit($set{'commit'});
5800                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
5801                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
5802                              "<td><i>$author</i></td>\n" .
5803                              "<td>" .
5804                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
5805                                      -class => "list subject"},
5806                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
5807                } elsif (defined $set{'to_id'}) {
5808                        next if ($set{'to_id'} =~ m/^0{40}$/);
5809
5810                        print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
5811                                                     hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
5812                                      -class => "list"},
5813                                      "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
5814                              "<br/>\n";
5815                }
5816        }
5817        close $fd;
5818
5819        # finish last commit (warning: repetition!)
5820        if (%co) {
5821                print "</td>\n" .
5822                      "<td class=\"link\">" .
5823                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
5824                              "commit") .
5825                      " | " .
5826                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
5827                                             hash_base=>$co{'id'})},
5828                              "tree") .
5829                      "</td>\n" .
5830                      "</tr>\n";
5831        }
5832
5833        print "</table>\n";
5834
5835        git_footer_html();
5836}
5837
5838sub git_search_files {
5839        my %co = @_;
5840
5841        local $/ = "\n";
5842        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
5843                $search_use_regexp ? ('-E', '-i') : '-F',
5844                $searchtext, $co{'tree'}
5845                        or die_error(500, "Open git-grep failed");
5846
5847        git_header_html();
5848
5849        git_print_page_nav('','', $hash,$co{'tree'},$hash);
5850        git_print_header_div('commit', esc_html($co{'title'}), $hash);
5851
5852        print "<table class=\"grep_search\">\n";
5853        my $alternate = 1;
5854        my $matches = 0;
5855        my $lastfile = '';
5856        while (my $line = <$fd>) {
5857                chomp $line;
5858                my ($file, $file_href, $lno, $ltext, $binary);
5859                last if ($matches++ > 1000);
5860                if ($line =~ /^Binary file (.+) matches$/) {
5861                        $file = $1;
5862                        $binary = 1;
5863                } else {
5864                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
5865                        $file =~ s/^$co{'tree'}://;
5866                }
5867                if ($file ne $lastfile) {
5868                        $lastfile and print "</td></tr>\n";
5869                        if ($alternate++) {
5870                                print "<tr class=\"dark\">\n";
5871                        } else {
5872                                print "<tr class=\"light\">\n";
5873                        }
5874                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
5875                                          file_name=>$file);
5876                        print "<td class=\"list\">".
5877                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
5878                        print "</td><td>\n";
5879                        $lastfile = $file;
5880                }
5881                if ($binary) {
5882                        print "<div class=\"binary\">Binary file</div>\n";
5883                } else {
5884                        $ltext = untabify($ltext);
5885                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
5886                                $ltext = esc_html($1, -nbsp=>1);
5887                                $ltext .= '<span class="match">';
5888                                $ltext .= esc_html($2, -nbsp=>1);
5889                                $ltext .= '</span>';
5890                                $ltext .= esc_html($3, -nbsp=>1);
5891                        } else {
5892                                $ltext = esc_html($ltext, -nbsp=>1);
5893                        }
5894                        print "<div class=\"pre\">" .
5895                                $cgi->a({-href => $file_href.'#l'.$lno,
5896                                        -class => "linenr"}, sprintf('%4i', $lno)) .
5897                                ' ' .  $ltext . "</div>\n";
5898                }
5899        }
5900        if ($lastfile) {
5901                print "</td></tr>\n";
5902                if ($matches > 1000) {
5903                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
5904                }
5905        } else {
5906                print "<div class=\"diff nodifferences\">No matches found</div>\n";
5907        }
5908        close $fd;
5909
5910        print "</table>\n";
5911
5912        git_footer_html();
5913}
5914
5915sub git_search_grep_body {
5916        my ($commitlist, $from, $to, $extra) = @_;
5917        $from = 0 unless defined $from;
5918        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);
5919
5920        print "<table class=\"commit_search\">\n";
5921        my $alternate = 1;
5922        for (my $i = $from; $i <= $to; $i++) {
5923                my %co = %{$commitlist->[$i]};
5924                if (!%co) {
5925                        next;
5926                }
5927                my $commit = $co{'id'};
5928                if ($alternate) {
5929                        print "<tr class=\"dark\">\n";
5930                } else {
5931                        print "<tr class=\"light\">\n";
5932                }
5933                $alternate ^= 1;
5934                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
5935                      format_author_html('td', \%co, 15, 5) .
5936                      "<td>" .
5937                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
5938                               -class => "list subject"},
5939                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
5940                my $comment = $co{'comment'};
5941                foreach my $line (@$comment) {
5942                        if ($line =~ m/^(.*?)($search_regexp)(.*)$/i) {
5943                                my ($lead, $match, $trail) = ($1, $2, $3);
5944                                $match = chop_str($match, 70, 5, 'center');
5945                                my $contextlen = int((80 - length($match))/2);
5946                                $contextlen = 30 if ($contextlen > 30);
5947                                $lead  = chop_str($lead,  $contextlen, 10, 'left');
5948                                $trail = chop_str($trail, $contextlen, 10, 'right');
5949
5950                                $lead  = esc_html($lead);
5951                                $match = esc_html($match);
5952                                $trail = esc_html($trail);
5953
5954                                print "$lead<span class=\"match\">$match</span>$trail<br />";
5955                        }
5956                }
5957                print "</td>\n" .
5958                      "<td class=\"link\">" .
5959                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
5960                      " | " .
5961                      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
5962                      " | " .
5963                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
5964                print "</td>\n" .
5965                      "</tr>\n";
5966        }
5967        if (defined $extra) {
5968                print "<tr>\n" .
5969                      "<td colspan=\"3\">$extra</td>\n" .
5970                      "</tr>\n";
5971        }
5972        print "</table>\n";
5973}
5974
5975## ======================================================================
5976## ======================================================================
5977## actions
5978
5979sub git_project_list {
5980        my $order = $input_params{'order'};
5981        if (defined $order && $order !~ m/none|project|descr|owner|age/) {
5982                die_error(400, "Unknown order parameter");
5983        }
5984
5985        my @list = git_get_projects_list();
5986        if (!@list) {
5987                die_error(404, "No projects found");
5988        }
5989
5990        git_header_html();
5991        if (defined $home_text && -f $home_text) {
5992                print "<div class=\"index_include\">\n";
5993                insert_file($home_text);
5994                print "</div>\n";
5995        }
5996        print $cgi->startform(-method => "get") .
5997              "<p class=\"projsearch\">Search:\n" .
5998              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
5999              "</p>" .
6000              $cgi->end_form() . "\n";
6001        git_project_list_body(\@list, $order);
6002        git_footer_html();
6003}
6004
6005sub git_forks {
6006        my $order = $input_params{'order'};
6007        if (defined $order && $order !~ m/none|project|descr|owner|age/) {
6008                die_error(400, "Unknown order parameter");
6009        }
6010
6011        my $filter = $project;
6012        $filter =~ s/\.git$//;
6013        my @list = git_get_projects_list($filter);
6014        if (!@list) {
6015                die_error(404, "No forks found");
6016        }
6017
6018        git_header_html();
6019        git_print_page_nav('','');
6020        git_print_header_div('summary', "$project forks");
6021        git_project_list_body(\@list, $order);
6022        git_footer_html();
6023}
6024
6025sub git_project_index {
6026        my @projects = git_get_projects_list();
6027        if (!@projects) {
6028                die_error(404, "No projects found");
6029        }
6030
6031        print $cgi->header(
6032                -type => 'text/plain',
6033                -charset => 'utf-8',
6034                -content_disposition => 'inline; filename="index.aux"');
6035
6036        foreach my $pr (@projects) {
6037                if (!exists $pr->{'owner'}) {
6038                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}");
6039                }
6040
6041                my ($path, $owner) = ($pr->{'path'}, $pr->{'owner'});
6042                # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
6043                $path  =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
6044                $owner =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
6045                $path  =~ s/ /\+/g;
6046                $owner =~ s/ /\+/g;
6047
6048                print "$path $owner\n";
6049        }
6050}
6051
6052sub git_summary {
6053        my $descr = git_get_project_description($project) || "none";
6054        my %co = parse_commit("HEAD");
6055        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
6056        my $head = $co{'id'};
6057        my $remote_heads = gitweb_check_feature('remote_heads');
6058
6059        my $owner = git_get_project_owner($project);
6060
6061        my $refs = git_get_references();
6062        # These get_*_list functions return one more to allow us to see if
6063        # there are more ...
6064        my @taglist  = git_get_tags_list(16);
6065        my @headlist = git_get_heads_list(16);
6066        my %remotedata = $remote_heads ? git_get_remotes_list() : ();
6067        my @forklist;
6068        my $check_forks = gitweb_check_feature('forks');
6069
6070        if ($check_forks) {
6071                # find forks of a project
6072                my $filter = $project;
6073                $filter =~ s/\.git$//;
6074                @forklist = git_get_projects_list($filter);
6075                # filter out forks of forks
6076                @forklist = filter_forks_from_projects_list(\@forklist)
6077                        if (@forklist);
6078        }
6079
6080        git_header_html();
6081        git_print_page_nav('summary','', $head);
6082
6083        print "<div class=\"title\">&nbsp;</div>\n";
6084        print "<table class=\"projects_list\">\n" .
6085              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
6086              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
6087        if (defined $cd{'rfc2822'}) {
6088                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
6089                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
6090        }
6091
6092        # use per project git URL list in $projectroot/$project/cloneurl
6093        # or make project git URL from git base URL and project name
6094        my $url_tag = "URL";
6095        my @url_list = git_get_project_url_list($project);
6096        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
6097        foreach my $git_url (@url_list) {
6098                next unless $git_url;
6099                print format_repo_url($url_tag, $git_url);
6100                $url_tag = "";
6101        }
6102
6103        # Tag cloud
6104        my $show_ctags = gitweb_check_feature('ctags');
6105        if ($show_ctags) {
6106                my $ctags = git_get_project_ctags($project);
6107                if (%$ctags) {
6108                        # without ability to add tags, don't show if there are none
6109                        my $cloud = git_populate_project_tagcloud($ctags);
6110                        print "<tr id=\"metadata_ctags\">" .
6111                              "<td>content tags</td>" .
6112                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
6113                              "</tr>\n";
6114                }
6115        }
6116
6117        print "</table>\n";
6118
6119        # If XSS prevention is on, we don't include README.html.
6120        # TODO: Allow a readme in some safe format.
6121        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
6122                print "<div class=\"title\">readme</div>\n" .
6123                      "<div class=\"readme\">\n";
6124                insert_file("$projectroot/$project/README.html");
6125                print "\n</div>\n"; # class="readme"
6126        }
6127
6128        # we need to request one more than 16 (0..15) to check if
6129        # those 16 are all
6130        my @commitlist = $head ? parse_commits($head, 17) : ();
6131        if (@commitlist) {
6132                git_print_header_div('shortlog');
6133                git_shortlog_body(\@commitlist, 0, 15, $refs,
6134                                  $#commitlist <=  15 ? undef :
6135                                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
6136        }
6137
6138        if (@taglist) {
6139                git_print_header_div('tags');
6140                git_tags_body(\@taglist, 0, 15,
6141                              $#taglist <=  15 ? undef :
6142                              $cgi->a({-href => href(action=>"tags")}, "..."));
6143        }
6144
6145        if (@headlist) {
6146                git_print_header_div('heads');
6147                git_heads_body(\@headlist, $head, 0, 15,
6148                               $#headlist <= 15 ? undef :
6149                               $cgi->a({-href => href(action=>"heads")}, "..."));
6150        }
6151
6152        if (%remotedata) {
6153                git_print_header_div('remotes');
6154                git_remotes_body(\%remotedata, 15, $head);
6155        }
6156
6157        if (@forklist) {
6158                git_print_header_div('forks');
6159                git_project_list_body(\@forklist, 'age', 0, 15,
6160                                      $#forklist <= 15 ? undef :
6161                                      $cgi->a({-href => href(action=>"forks")}, "..."),
6162                                      'no_header');
6163        }
6164
6165        git_footer_html();
6166}
6167
6168sub git_tag {
6169        my %tag = parse_tag($hash);
6170
6171        if (! %tag) {
6172                die_error(404, "Unknown tag object");
6173        }
6174
6175        my $head = git_get_head_hash($project);
6176        git_header_html();
6177        git_print_page_nav('','', $head,undef,$head);
6178        git_print_header_div('commit', esc_html($tag{'name'}), $hash);
6179        print "<div class=\"title_text\">\n" .
6180              "<table class=\"object_header\">\n" .
6181              "<tr>\n" .
6182              "<td>object</td>\n" .
6183              "<td>" . $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
6184                               $tag{'object'}) . "</td>\n" .
6185              "<td class=\"link\">" . $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
6186                                              $tag{'type'}) . "</td>\n" .
6187              "</tr>\n";
6188        if (defined($tag{'author'})) {
6189                git_print_authorship_rows(\%tag, 'author');
6190        }
6191        print "</table>\n\n" .
6192              "</div>\n";
6193        print "<div class=\"page_body\">";
6194        my $comment = $tag{'comment'};
6195        foreach my $line (@$comment) {
6196                chomp $line;
6197                print esc_html($line, -nbsp=>1) . "<br/>\n";
6198        }
6199        print "</div>\n";
6200        git_footer_html();
6201}
6202
6203sub git_blame_common {
6204        my $format = shift || 'porcelain';
6205        if ($format eq 'porcelain' && $cgi->param('js')) {
6206                $format = 'incremental';
6207                $action = 'blame_incremental'; # for page title etc
6208        }
6209
6210        # permissions
6211        gitweb_check_feature('blame')
6212                or die_error(403, "Blame view not allowed");
6213
6214        # error checking
6215        die_error(400, "No file name given") unless $file_name;
6216        $hash_base ||= git_get_head_hash($project);
6217        die_error(404, "Couldn't find base commit") unless $hash_base;
6218        my %co = parse_commit($hash_base)
6219                or die_error(404, "Commit not found");
6220        my $ftype = "blob";
6221        if (!defined $hash) {
6222                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
6223                        or die_error(404, "Error looking up file");
6224        } else {
6225                $ftype = git_get_type($hash);
6226                if ($ftype !~ "blob") {
6227                        die_error(400, "Object is not a blob");
6228                }
6229        }
6230
6231        my $fd;
6232        if ($format eq 'incremental') {
6233                # get file contents (as base)
6234                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
6235                        or die_error(500, "Open git-cat-file failed");
6236        } elsif ($format eq 'data') {
6237                # run git-blame --incremental
6238                open $fd, "-|", git_cmd(), "blame", "--incremental",
6239                        $hash_base, "--", $file_name
6240                        or die_error(500, "Open git-blame --incremental failed");
6241        } else {
6242                # run git-blame --porcelain
6243                open $fd, "-|", git_cmd(), "blame", '-p',
6244                        $hash_base, '--', $file_name
6245                        or die_error(500, "Open git-blame --porcelain failed");
6246        }
6247
6248        # incremental blame data returns early
6249        if ($format eq 'data') {
6250                print $cgi->header(
6251                        -type=>"text/plain", -charset => "utf-8",
6252                        -status=> "200 OK");
6253                local $| = 1; # output autoflush
6254                while (my $line = <$fd>) {
6255                        print to_utf8($line);
6256                }
6257                close $fd
6258                        or print "ERROR $!\n";
6259
6260                print 'END';
6261                if (defined $t0 && gitweb_check_feature('timed')) {
6262                        print ' '.
6263                              tv_interval($t0, [ gettimeofday() ]).
6264                              ' '.$number_of_git_cmds;
6265                }
6266                print "\n";
6267
6268                return;
6269        }
6270
6271        # page header
6272        git_header_html();
6273        my $formats_nav =
6274                $cgi->a({-href => href(action=>"blob", -replay=>1)},
6275                        "blob") .
6276                " | ";
6277        if ($format eq 'incremental') {
6278                $formats_nav .=
6279                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
6280                                "blame") . " (non-incremental)";
6281        } else {
6282                $formats_nav .=
6283                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
6284                                "blame") . " (incremental)";
6285        }
6286        $formats_nav .=
6287                " | " .
6288                $cgi->a({-href => href(action=>"history", -replay=>1)},
6289                        "history") .
6290                " | " .
6291                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
6292                        "HEAD");
6293        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
6294        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
6295        git_print_page_path($file_name, $ftype, $hash_base);
6296
6297        # page body
6298        if ($format eq 'incremental') {
6299                print "<noscript>\n<div class=\"error\"><center><b>\n".
6300                      "This page requires JavaScript to run.\n Use ".
6301                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
6302                              'this page').
6303                      " instead.\n".
6304                      "</b></center></div>\n</noscript>\n";
6305
6306                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
6307        }
6308
6309        print qq!<div class="page_body">\n!;
6310        print qq!<div id="progress_info">... / ...</div>\n!
6311                if ($format eq 'incremental');
6312        print qq!<table id="blame_table" class="blame" width="100%">\n!.
6313              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
6314              qq!<thead>\n!.
6315              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
6316              qq!</thead>\n!.
6317              qq!<tbody>\n!;
6318
6319        my @rev_color = qw(light dark);
6320        my $num_colors = scalar(@rev_color);
6321        my $current_color = 0;
6322
6323        if ($format eq 'incremental') {
6324                my $color_class = $rev_color[$current_color];
6325
6326                #contents of a file
6327                my $linenr = 0;
6328        LINE:
6329                while (my $line = <$fd>) {
6330                        chomp $line;
6331                        $linenr++;
6332
6333                        print qq!<tr id="l$linenr" class="$color_class">!.
6334                              qq!<td class="sha1"><a href=""> </a></td>!.
6335                              qq!<td class="linenr">!.
6336                              qq!<a class="linenr" href="">$linenr</a></td>!;
6337                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
6338                        print qq!</tr>\n!;
6339                }
6340
6341        } else { # porcelain, i.e. ordinary blame
6342                my %metainfo = (); # saves information about commits
6343
6344                # blame data
6345        LINE:
6346                while (my $line = <$fd>) {
6347                        chomp $line;
6348                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
6349                        # no <lines in group> for subsequent lines in group of lines
6350                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
6351                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
6352                        if (!exists $metainfo{$full_rev}) {
6353                                $metainfo{$full_rev} = { 'nprevious' => 0 };
6354                        }
6355                        my $meta = $metainfo{$full_rev};
6356                        my $data;
6357                        while ($data = <$fd>) {
6358                                chomp $data;
6359                                last if ($data =~ s/^\t//); # contents of line
6360                                if ($data =~ /^(\S+)(?: (.*))?$/) {
6361                                        $meta->{$1} = $2 unless exists $meta->{$1};
6362                                }
6363                                if ($data =~ /^previous /) {
6364                                        $meta->{'nprevious'}++;
6365                                }
6366                        }
6367                        my $short_rev = substr($full_rev, 0, 8);
6368                        my $author = $meta->{'author'};
6369                        my %date =
6370                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
6371                        my $date = $date{'iso-tz'};
6372                        if ($group_size) {
6373                                $current_color = ($current_color + 1) % $num_colors;
6374                        }
6375                        my $tr_class = $rev_color[$current_color];
6376                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
6377                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
6378                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
6379                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
6380                        if ($group_size) {
6381                                print "<td class=\"sha1\"";
6382                                print " title=\"". esc_html($author) . ", $date\"";
6383                                print " rowspan=\"$group_size\"" if ($group_size > 1);
6384                                print ">";
6385                                print $cgi->a({-href => href(action=>"commit",
6386                                                             hash=>$full_rev,
6387                                                             file_name=>$file_name)},
6388                                              esc_html($short_rev));
6389                                if ($group_size >= 2) {
6390                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
6391                                        if (@author_initials) {
6392                                                print "<br />" .
6393                                                      esc_html(join('', @author_initials));
6394                                                #           or join('.', ...)
6395                                        }
6396                                }
6397                                print "</td>\n";
6398                        }
6399                        # 'previous' <sha1 of parent commit> <filename at commit>
6400                        if (exists $meta->{'previous'} &&
6401                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
6402                                $meta->{'parent'} = $1;
6403                                $meta->{'file_parent'} = unquote($2);
6404                        }
6405                        my $linenr_commit =
6406                                exists($meta->{'parent'}) ?
6407                                $meta->{'parent'} : $full_rev;
6408                        my $linenr_filename =
6409                                exists($meta->{'file_parent'}) ?
6410                                $meta->{'file_parent'} : unquote($meta->{'filename'});
6411                        my $blamed = href(action => 'blame',
6412                                          file_name => $linenr_filename,
6413                                          hash_base => $linenr_commit);
6414                        print "<td class=\"linenr\">";
6415                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
6416                                        -class => "linenr" },
6417                                      esc_html($lineno));
6418                        print "</td>";
6419                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
6420                        print "</tr>\n";
6421                } # end while
6422
6423        }
6424
6425        # footer
6426        print "</tbody>\n".
6427              "</table>\n"; # class="blame"
6428        print "</div>\n";   # class="blame_body"
6429        close $fd
6430                or print "Reading blob failed\n";
6431
6432        git_footer_html();
6433}
6434
6435sub git_blame {
6436        git_blame_common();
6437}
6438
6439sub git_blame_incremental {
6440        git_blame_common('incremental');
6441}
6442
6443sub git_blame_data {
6444        git_blame_common('data');
6445}
6446
6447sub git_tags {
6448        my $head = git_get_head_hash($project);
6449        git_header_html();
6450        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
6451        git_print_header_div('summary', $project);
6452
6453        my @tagslist = git_get_tags_list();
6454        if (@tagslist) {
6455                git_tags_body(\@tagslist);
6456        }
6457        git_footer_html();
6458}
6459
6460sub git_heads {
6461        my $head = git_get_head_hash($project);
6462        git_header_html();
6463        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
6464        git_print_header_div('summary', $project);
6465
6466        my @headslist = git_get_heads_list();
6467        if (@headslist) {
6468                git_heads_body(\@headslist, $head);
6469        }
6470        git_footer_html();
6471}
6472
6473# used both for single remote view and for list of all the remotes
6474sub git_remotes {
6475        gitweb_check_feature('remote_heads')
6476                or die_error(403, "Remote heads view is disabled");
6477
6478        my $head = git_get_head_hash($project);
6479        my $remote = $input_params{'hash'};
6480
6481        my $remotedata = git_get_remotes_list($remote);
6482        die_error(500, "Unable to get remote information") unless defined $remotedata;
6483
6484        unless (%$remotedata) {
6485                die_error(404, defined $remote ?
6486                        "Remote $remote not found" :
6487                        "No remotes found");
6488        }
6489
6490        git_header_html(undef, undef, -action_extra => $remote);
6491        git_print_page_nav('', '',  $head, undef, $head,
6492                format_ref_views($remote ? '' : 'remotes'));
6493
6494        fill_remote_heads($remotedata);
6495        if (defined $remote) {
6496                git_print_header_div('remotes', "$remote remote for $project");
6497                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
6498        } else {
6499                git_print_header_div('summary', "$project remotes");
6500                git_remotes_body($remotedata, undef, $head);
6501        }
6502
6503        git_footer_html();
6504}
6505
6506sub git_blob_plain {
6507        my $type = shift;
6508        my $expires;
6509
6510        if (!defined $hash) {
6511                if (defined $file_name) {
6512                        my $base = $hash_base || git_get_head_hash($project);
6513                        $hash = git_get_hash_by_path($base, $file_name, "blob")
6514                                or die_error(404, "Cannot find file");
6515                } else {
6516                        die_error(400, "No file name defined");
6517                }
6518        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
6519                # blobs defined by non-textual hash id's can be cached
6520                $expires = "+1d";
6521        }
6522
6523        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
6524                or die_error(500, "Open git-cat-file blob '$hash' failed");
6525
6526        # content-type (can include charset)
6527        $type = blob_contenttype($fd, $file_name, $type);
6528
6529        # "save as" filename, even when no $file_name is given
6530        my $save_as = "$hash";
6531        if (defined $file_name) {
6532                $save_as = $file_name;
6533        } elsif ($type =~ m/^text\//) {
6534                $save_as .= '.txt';
6535        }
6536
6537        # With XSS prevention on, blobs of all types except a few known safe
6538        # ones are served with "Content-Disposition: attachment" to make sure
6539        # they don't run in our security domain.  For certain image types,
6540        # blob view writes an <img> tag referring to blob_plain view, and we
6541        # want to be sure not to break that by serving the image as an
6542        # attachment (though Firefox 3 doesn't seem to care).
6543        my $sandbox = $prevent_xss &&
6544                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;
6545
6546        # serve text/* as text/plain
6547        if ($prevent_xss &&
6548            ($type =~ m!^text/[a-z]+\b(.*)$! ||
6549             ($type =~ m!^[a-z]+/[a-z]\+xml\b(.*)$! && -T $fd))) {
6550                my $rest = $1;
6551                $rest = defined $rest ? $rest : '';
6552                $type = "text/plain$rest";
6553        }
6554
6555        print $cgi->header(
6556                -type => $type,
6557                -expires => $expires,
6558                -content_disposition =>
6559                        ($sandbox ? 'attachment' : 'inline')
6560                        . '; filename="' . $save_as . '"');
6561        local $/ = undef;
6562        binmode STDOUT, ':raw';
6563        print <$fd>;
6564        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
6565        close $fd;
6566}
6567
6568sub git_blob {
6569        my $expires;
6570
6571        if (!defined $hash) {
6572                if (defined $file_name) {
6573                        my $base = $hash_base || git_get_head_hash($project);
6574                        $hash = git_get_hash_by_path($base, $file_name, "blob")
6575                                or die_error(404, "Cannot find file");
6576                } else {
6577                        die_error(400, "No file name defined");
6578                }
6579        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
6580                # blobs defined by non-textual hash id's can be cached
6581                $expires = "+1d";
6582        }
6583
6584        my $have_blame = gitweb_check_feature('blame');
6585        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
6586                or die_error(500, "Couldn't cat $file_name, $hash");
6587        my $mimetype = blob_mimetype($fd, $file_name);
6588        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
6589        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
6590                close $fd;
6591                return git_blob_plain($mimetype);
6592        }
6593        # we can have blame only for text/* mimetype
6594        $have_blame &&= ($mimetype =~ m!^text/!);
6595
6596        my $highlight = gitweb_check_feature('highlight');
6597        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
6598        $fd = run_highlighter($fd, $highlight, $syntax)
6599                if $syntax;
6600
6601        git_header_html(undef, $expires);
6602        my $formats_nav = '';
6603        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
6604                if (defined $file_name) {
6605                        if ($have_blame) {
6606                                $formats_nav .=
6607                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
6608                                                "blame") .
6609                                        " | ";
6610                        }
6611                        $formats_nav .=
6612                                $cgi->a({-href => href(action=>"history", -replay=>1)},
6613                                        "history") .
6614                                " | " .
6615                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
6616                                        "raw") .
6617                                " | " .
6618                                $cgi->a({-href => href(action=>"blob",
6619                                                       hash_base=>"HEAD", file_name=>$file_name)},
6620                                        "HEAD");
6621                } else {
6622                        $formats_nav .=
6623                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
6624                                        "raw");
6625                }
6626                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
6627                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
6628        } else {
6629                print "<div class=\"page_nav\">\n" .
6630                      "<br/><br/></div>\n" .
6631                      "<div class=\"title\">".esc_html($hash)."</div>\n";
6632        }
6633        git_print_page_path($file_name, "blob", $hash_base);
6634        print "<div class=\"page_body\">\n";
6635        if ($mimetype =~ m!^image/!) {
6636                print qq!<img type="!.esc_attr($mimetype).qq!"!;
6637                if ($file_name) {
6638                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
6639                }
6640                print qq! src="! .
6641                      href(action=>"blob_plain", hash=>$hash,
6642                           hash_base=>$hash_base, file_name=>$file_name) .
6643                      qq!" />\n!;
6644        } else {
6645                my $nr;
6646                while (my $line = <$fd>) {
6647                        chomp $line;
6648                        $nr++;
6649                        $line = untabify($line);
6650                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
6651                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
6652                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
6653                }
6654        }
6655        close $fd
6656                or print "Reading blob failed.\n";
6657        print "</div>";
6658        git_footer_html();
6659}
6660
6661sub git_tree {
6662        if (!defined $hash_base) {
6663                $hash_base = "HEAD";
6664        }
6665        if (!defined $hash) {
6666                if (defined $file_name) {
6667                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
6668                } else {
6669                        $hash = $hash_base;
6670                }
6671        }
6672        die_error(404, "No such tree") unless defined($hash);
6673
6674        my $show_sizes = gitweb_check_feature('show-sizes');
6675        my $have_blame = gitweb_check_feature('blame');
6676
6677        my @entries = ();
6678        {
6679                local $/ = "\0";
6680                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
6681                        ($show_sizes ? '-l' : ()), @extra_options, $hash
6682                        or die_error(500, "Open git-ls-tree failed");
6683                @entries = map { chomp; $_ } <$fd>;
6684                close $fd
6685                        or die_error(404, "Reading tree failed");
6686        }
6687
6688        my $refs = git_get_references();
6689        my $ref = format_ref_marker($refs, $hash_base);
6690        git_header_html();
6691        my $basedir = '';
6692        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
6693                my @views_nav = ();
6694                if (defined $file_name) {
6695                        push @views_nav,
6696                                $cgi->a({-href => href(action=>"history", -replay=>1)},
6697                                        "history"),
6698                                $cgi->a({-href => href(action=>"tree",
6699                                                       hash_base=>"HEAD", file_name=>$file_name)},
6700                                        "HEAD"),
6701                }
6702                my $snapshot_links = format_snapshot_links($hash);
6703                if (defined $snapshot_links) {
6704                        # FIXME: Should be available when we have no hash base as well.
6705                        push @views_nav, $snapshot_links;
6706                }
6707                git_print_page_nav('tree','', $hash_base, undef, undef,
6708                                   join(' | ', @views_nav));
6709                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
6710        } else {
6711                undef $hash_base;
6712                print "<div class=\"page_nav\">\n";
6713                print "<br/><br/></div>\n";
6714                print "<div class=\"title\">".esc_html($hash)."</div>\n";
6715        }
6716        if (defined $file_name) {
6717                $basedir = $file_name;
6718                if ($basedir ne '' && substr($basedir, -1) ne '/') {
6719                        $basedir .= '/';
6720                }
6721                git_print_page_path($file_name, 'tree', $hash_base);
6722        }
6723        print "<div class=\"page_body\">\n";
6724        print "<table class=\"tree\">\n";
6725        my $alternate = 1;
6726        # '..' (top directory) link if possible
6727        if (defined $hash_base &&
6728            defined $file_name && $file_name =~ m![^/]+$!) {
6729                if ($alternate) {
6730                        print "<tr class=\"dark\">\n";
6731                } else {
6732                        print "<tr class=\"light\">\n";
6733                }
6734                $alternate ^= 1;
6735
6736                my $up = $file_name;
6737                $up =~ s!/?[^/]+$!!;
6738                undef $up unless $up;
6739                # based on git_print_tree_entry
6740                print '<td class="mode">' . mode_str('040000') . "</td>\n";
6741                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
6742                print '<td class="list">';
6743                print $cgi->a({-href => href(action=>"tree",
6744                                             hash_base=>$hash_base,
6745                                             file_name=>$up)},
6746                              "..");
6747                print "</td>\n";
6748                print "<td class=\"link\"></td>\n";
6749
6750                print "</tr>\n";
6751        }
6752        foreach my $line (@entries) {
6753                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);
6754
6755                if ($alternate) {
6756                        print "<tr class=\"dark\">\n";
6757                } else {
6758                        print "<tr class=\"light\">\n";
6759                }
6760                $alternate ^= 1;
6761
6762                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);
6763
6764                print "</tr>\n";
6765        }
6766        print "</table>\n" .
6767              "</div>";
6768        git_footer_html();
6769}
6770
6771sub snapshot_name {
6772        my ($project, $hash) = @_;
6773
6774        # path/to/project.git  -> project
6775        # path/to/project/.git -> project
6776        my $name = to_utf8($project);
6777        $name =~ s,([^/])/*\.git$,$1,;
6778        $name = basename($name);
6779        # sanitize name
6780        $name =~ s/[[:cntrl:]]/?/g;
6781
6782        my $ver = $hash;
6783        if ($hash =~ /^[0-9a-fA-F]+$/) {
6784                # shorten SHA-1 hash
6785                my $full_hash = git_get_full_hash($project, $hash);
6786                if ($full_hash =~ /^$hash/ && length($hash) > 7) {
6787                        $ver = git_get_short_hash($project, $hash);
6788                }
6789        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
6790                # tags don't need shortened SHA-1 hash
6791                $ver = $1;
6792        } else {
6793                # branches and other need shortened SHA-1 hash
6794                if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!) {
6795                        $ver = $1;
6796                }
6797                $ver .= '-' . git_get_short_hash($project, $hash);
6798        }
6799        # in case of hierarchical branch names
6800        $ver =~ s!/!.!g;
6801
6802        # name = project-version_string
6803        $name = "$name-$ver";
6804
6805        return wantarray ? ($name, $name) : $name;
6806}
6807
6808sub git_snapshot {
6809        my $format = $input_params{'snapshot_format'};
6810        if (!@snapshot_fmts) {
6811                die_error(403, "Snapshots not allowed");
6812        }
6813        # default to first supported snapshot format
6814        $format ||= $snapshot_fmts[0];
6815        if ($format !~ m/^[a-z0-9]+$/) {
6816                die_error(400, "Invalid snapshot format parameter");
6817        } elsif (!exists($known_snapshot_formats{$format})) {
6818                die_error(400, "Unknown snapshot format");
6819        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
6820                die_error(403, "Snapshot format not allowed");
6821        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
6822                die_error(403, "Unsupported snapshot format");
6823        }
6824
6825        my $type = git_get_type("$hash^{}");
6826        if (!$type) {
6827                die_error(404, 'Object does not exist');
6828        }  elsif ($type eq 'blob') {
6829                die_error(400, 'Object is not a tree-ish');
6830        }
6831
6832        my ($name, $prefix) = snapshot_name($project, $hash);
6833        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
6834        my $cmd = quote_command(
6835                git_cmd(), 'archive',
6836                "--format=$known_snapshot_formats{$format}{'format'}",
6837                "--prefix=$prefix/", $hash);
6838        if (exists $known_snapshot_formats{$format}{'compressor'}) {
6839                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
6840        }
6841
6842        $filename =~ s/(["\\])/\\$1/g;
6843        print $cgi->header(
6844                -type => $known_snapshot_formats{$format}{'type'},
6845                -content_disposition => 'inline; filename="' . $filename . '"',
6846                -status => '200 OK');
6847
6848        open my $fd, "-|", $cmd
6849                or die_error(500, "Execute git-archive failed");
6850        binmode STDOUT, ':raw';
6851        print <$fd>;
6852        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
6853        close $fd;
6854}
6855
6856sub git_log_generic {
6857        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;
6858
6859        my $head = git_get_head_hash($project);
6860        if (!defined $base) {
6861                $base = $head;
6862        }
6863        if (!defined $page) {
6864                $page = 0;
6865        }
6866        my $refs = git_get_references();
6867
6868        my $commit_hash = $base;
6869        if (defined $parent) {
6870                $commit_hash = "$parent..$base";
6871        }
6872        my @commitlist =
6873                parse_commits($commit_hash, 101, (100 * $page),
6874                              defined $file_name ? ($file_name, "--full-history") : ());
6875
6876        my $ftype;
6877        if (!defined $file_hash && defined $file_name) {
6878                # some commits could have deleted file in question,
6879                # and not have it in tree, but one of them has to have it
6880                for (my $i = 0; $i < @commitlist; $i++) {
6881                        $file_hash = git_get_hash_by_path($commitlist[$i]{'id'}, $file_name);
6882                        last if defined $file_hash;
6883                }
6884        }
6885        if (defined $file_hash) {
6886                $ftype = git_get_type($file_hash);
6887        }
6888        if (defined $file_name && !defined $ftype) {
6889                die_error(500, "Unknown type of object");
6890        }
6891        my %co;
6892        if (defined $file_name) {
6893                %co = parse_commit($base)
6894                        or die_error(404, "Unknown commit object");
6895        }
6896
6897
6898        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
6899        my $next_link = '';
6900        if ($#commitlist >= 100) {
6901                $next_link =
6902                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
6903                                 -accesskey => "n", -title => "Alt-n"}, "next");
6904        }
6905        my $patch_max = gitweb_get_feature('patches');
6906        if ($patch_max && !defined $file_name) {
6907                if ($patch_max < 0 || @commitlist <= $patch_max) {
6908                        $paging_nav .= " &sdot; " .
6909                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
6910                                        "patches");
6911                }
6912        }
6913
6914        git_header_html();
6915        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
6916        if (defined $file_name) {
6917                git_print_header_div('commit', esc_html($co{'title'}), $base);
6918        } else {
6919                git_print_header_div('summary', $project)
6920        }
6921        git_print_page_path($file_name, $ftype, $hash_base)
6922                if (defined $file_name);
6923
6924        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
6925                     $file_name, $file_hash, $ftype);
6926
6927        git_footer_html();
6928}
6929
6930sub git_log {
6931        git_log_generic('log', \&git_log_body,
6932                        $hash, $hash_parent);
6933}
6934
6935sub git_commit {
6936        $hash ||= $hash_base || "HEAD";
6937        my %co = parse_commit($hash)
6938            or die_error(404, "Unknown commit object");
6939
6940        my $parent  = $co{'parent'};
6941        my $parents = $co{'parents'}; # listref
6942
6943        # we need to prepare $formats_nav before any parameter munging
6944        my $formats_nav;
6945        if (!defined $parent) {
6946                # --root commitdiff
6947                $formats_nav .= '(initial)';
6948        } elsif (@$parents == 1) {
6949                # single parent commit
6950                $formats_nav .=
6951                        '(parent: ' .
6952                        $cgi->a({-href => href(action=>"commit",
6953                                               hash=>$parent)},
6954                                esc_html(substr($parent, 0, 7))) .
6955                        ')';
6956        } else {
6957                # merge commit
6958                $formats_nav .=
6959                        '(merge: ' .
6960                        join(' ', map {
6961                                $cgi->a({-href => href(action=>"commit",
6962                                                       hash=>$_)},
6963                                        esc_html(substr($_, 0, 7)));
6964                        } @$parents ) .
6965                        ')';
6966        }
6967        if (gitweb_check_feature('patches') && @$parents <= 1) {
6968                $formats_nav .= " | " .
6969                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
6970                                "patch");
6971        }
6972
6973        if (!defined $parent) {
6974                $parent = "--root";
6975        }
6976        my @difftree;
6977        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
6978                @diff_opts,
6979                (@$parents <= 1 ? $parent : '-c'),
6980                $hash, "--"
6981                or die_error(500, "Open git-diff-tree failed");
6982        @difftree = map { chomp; $_ } <$fd>;
6983        close $fd or die_error(404, "Reading git-diff-tree failed");
6984
6985        # non-textual hash id's can be cached
6986        my $expires;
6987        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
6988                $expires = "+1d";
6989        }
6990        my $refs = git_get_references();
6991        my $ref = format_ref_marker($refs, $co{'id'});
6992
6993        git_header_html(undef, $expires);
6994        git_print_page_nav('commit', '',
6995                           $hash, $co{'tree'}, $hash,
6996                           $formats_nav);
6997
6998        if (defined $co{'parent'}) {
6999                git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
7000        } else {
7001                git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
7002        }
7003        print "<div class=\"title_text\">\n" .
7004              "<table class=\"object_header\">\n";
7005        git_print_authorship_rows(\%co);
7006        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";
7007        print "<tr>" .
7008              "<td>tree</td>" .
7009              "<td class=\"sha1\">" .
7010              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
7011                       class => "list"}, $co{'tree'}) .
7012              "</td>" .
7013              "<td class=\"link\">" .
7014              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
7015                      "tree");
7016        my $snapshot_links = format_snapshot_links($hash);
7017        if (defined $snapshot_links) {
7018                print " | " . $snapshot_links;
7019        }
7020        print "</td>" .
7021              "</tr>\n";
7022
7023        foreach my $par (@$parents) {
7024                print "<tr>" .
7025                      "<td>parent</td>" .
7026                      "<td class=\"sha1\">" .
7027                      $cgi->a({-href => href(action=>"commit", hash=>$par),
7028                               class => "list"}, $par) .
7029                      "</td>" .
7030                      "<td class=\"link\">" .
7031                      $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit") .
7032                      " | " .
7033                      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
7034                      "</td>" .
7035                      "</tr>\n";
7036        }
7037        print "</table>".
7038              "</div>\n";
7039
7040        print "<div class=\"page_body\">\n";
7041        git_print_log($co{'comment'});
7042        print "</div>\n";
7043
7044        git_difftree_body(\@difftree, $hash, @$parents);
7045
7046        git_footer_html();
7047}
7048
7049sub git_object {
7050        # object is defined by:
7051        # - hash or hash_base alone
7052        # - hash_base and file_name
7053        my $type;
7054
7055        # - hash or hash_base alone
7056        if ($hash || ($hash_base && !defined $file_name)) {
7057                my $object_id = $hash || $hash_base;
7058
7059                open my $fd, "-|", quote_command(
7060                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
7061                        or die_error(404, "Object does not exist");
7062                $type = <$fd>;
7063                chomp $type;
7064                close $fd
7065                        or die_error(404, "Object does not exist");
7066
7067        # - hash_base and file_name
7068        } elsif ($hash_base && defined $file_name) {
7069                $file_name =~ s,/+$,,;
7070
7071                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
7072                        or die_error(404, "Base object does not exist");
7073
7074                # here errors should not hapen
7075                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
7076                        or die_error(500, "Open git-ls-tree failed");
7077                my $line = <$fd>;
7078                close $fd;
7079
7080                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
7081                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
7082                        die_error(404, "File or directory for given base does not exist");
7083                }
7084                $type = $2;
7085                $hash = $3;
7086        } else {
7087                die_error(400, "Not enough information to find object");
7088        }
7089
7090        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
7091                                          hash=>$hash, hash_base=>$hash_base,
7092                                          file_name=>$file_name),
7093                             -status => '302 Found');
7094}
7095
7096sub git_blobdiff {
7097        my $format = shift || 'html';
7098        my $diff_style = $input_params{'diff_style'} || 'inline';
7099
7100        my $fd;
7101        my @difftree;
7102        my %diffinfo;
7103        my $expires;
7104
7105        # preparing $fd and %diffinfo for git_patchset_body
7106        # new style URI
7107        if (defined $hash_base && defined $hash_parent_base) {
7108                if (defined $file_name) {
7109                        # read raw output
7110                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7111                                $hash_parent_base, $hash_base,
7112                                "--", (defined $file_parent ? $file_parent : ()), $file_name
7113                                or die_error(500, "Open git-diff-tree failed");
7114                        @difftree = map { chomp; $_ } <$fd>;
7115                        close $fd
7116                                or die_error(404, "Reading git-diff-tree failed");
7117                        @difftree
7118                                or die_error(404, "Blob diff not found");
7119
7120                } elsif (defined $hash &&
7121                         $hash =~ /[0-9a-fA-F]{40}/) {
7122                        # try to find filename from $hash
7123
7124                        # read filtered raw output
7125                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7126                                $hash_parent_base, $hash_base, "--"
7127                                or die_error(500, "Open git-diff-tree failed");
7128                        @difftree =
7129                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
7130                                # $hash == to_id
7131                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
7132                                map { chomp; $_ } <$fd>;
7133                        close $fd
7134                                or die_error(404, "Reading git-diff-tree failed");
7135                        @difftree
7136                                or die_error(404, "Blob diff not found");
7137
7138                } else {
7139                        die_error(400, "Missing one of the blob diff parameters");
7140                }
7141
7142                if (@difftree > 1) {
7143                        die_error(400, "Ambiguous blob diff specification");
7144                }
7145
7146                %diffinfo = parse_difftree_raw_line($difftree[0]);
7147                $file_parent ||= $diffinfo{'from_file'} || $file_name;
7148                $file_name   ||= $diffinfo{'to_file'};
7149
7150                $hash_parent ||= $diffinfo{'from_id'};
7151                $hash        ||= $diffinfo{'to_id'};
7152
7153                # non-textual hash id's can be cached
7154                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
7155                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
7156                        $expires = '+1d';
7157                }
7158
7159                # open patch output
7160                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7161                        '-p', ($format eq 'html' ? "--full-index" : ()),
7162                        $hash_parent_base, $hash_base,
7163                        "--", (defined $file_parent ? $file_parent : ()), $file_name
7164                        or die_error(500, "Open git-diff-tree failed");
7165        }
7166
7167        # old/legacy style URI -- not generated anymore since 1.4.3.
7168        if (!%diffinfo) {
7169                die_error('404 Not Found', "Missing one of the blob diff parameters")
7170        }
7171
7172        # header
7173        if ($format eq 'html') {
7174                my $formats_nav =
7175                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
7176                                "raw");
7177                $formats_nav .= diff_style_nav($diff_style);
7178                git_header_html(undef, $expires);
7179                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
7180                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
7181                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
7182                } else {
7183                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
7184                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
7185                }
7186                if (defined $file_name) {
7187                        git_print_page_path($file_name, "blob", $hash_base);
7188                } else {
7189                        print "<div class=\"page_path\"></div>\n";
7190                }
7191
7192        } elsif ($format eq 'plain') {
7193                print $cgi->header(
7194                        -type => 'text/plain',
7195                        -charset => 'utf-8',
7196                        -expires => $expires,
7197                        -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');
7198
7199                print "X-Git-Url: " . $cgi->self_url() . "\n\n";
7200
7201        } else {
7202                die_error(400, "Unknown blobdiff format");
7203        }
7204
7205        # patch
7206        if ($format eq 'html') {
7207                print "<div class=\"page_body\">\n";
7208
7209                git_patchset_body($fd, $diff_style,
7210                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
7211                close $fd;
7212
7213                print "</div>\n"; # class="page_body"
7214                git_footer_html();
7215
7216        } else {
7217                while (my $line = <$fd>) {
7218                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
7219                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;
7220
7221                        print $line;
7222
7223                        last if $line =~ m!^\+\+\+!;
7224                }
7225                local $/ = undef;
7226                print <$fd>;
7227                close $fd;
7228        }
7229}
7230
7231sub git_blobdiff_plain {
7232        git_blobdiff('plain');
7233}
7234
7235# assumes that it is added as later part of already existing navigation,
7236# so it returns "| foo | bar" rather than just "foo | bar"
7237sub diff_style_nav {
7238        my ($diff_style, $is_combined) = @_;
7239        $diff_style ||= 'inline';
7240
7241        return "" if ($is_combined);
7242
7243        my @styles = (inline => 'inline', 'sidebyside' => 'side by side');
7244        my %styles = @styles;
7245        @styles =
7246                @styles[ map { $_ * 2 } 0..$#styles/2 ];
7247
7248        return join '',
7249                map { " | ".$_ }
7250                map {
7251                        $_ eq $diff_style ? $styles{$_} :
7252                        $cgi->a({-href => href(-replay=>1, diff_style => $_)}, $styles{$_})
7253                } @styles;
7254}
7255
7256sub git_commitdiff {
7257        my %params = @_;
7258        my $format = $params{-format} || 'html';
7259        my $diff_style = $input_params{'diff_style'} || 'inline';
7260
7261        my ($patch_max) = gitweb_get_feature('patches');
7262        if ($format eq 'patch') {
7263                die_error(403, "Patch view not allowed") unless $patch_max;
7264        }
7265
7266        $hash ||= $hash_base || "HEAD";
7267        my %co = parse_commit($hash)
7268            or die_error(404, "Unknown commit object");
7269
7270        # choose format for commitdiff for merge
7271        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
7272                $hash_parent = '--cc';
7273        }
7274        # we need to prepare $formats_nav before almost any parameter munging
7275        my $formats_nav;
7276        if ($format eq 'html') {
7277                $formats_nav =
7278                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
7279                                "raw");
7280                if ($patch_max && @{$co{'parents'}} <= 1) {
7281                        $formats_nav .= " | " .
7282                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
7283                                        "patch");
7284                }
7285                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);
7286
7287                if (defined $hash_parent &&
7288                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
7289                        # commitdiff with two commits given
7290                        my $hash_parent_short = $hash_parent;
7291                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
7292                                $hash_parent_short = substr($hash_parent, 0, 7);
7293                        }
7294                        $formats_nav .=
7295                                ' (from';
7296                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
7297                                if ($co{'parents'}[$i] eq $hash_parent) {
7298                                        $formats_nav .= ' parent ' . ($i+1);
7299                                        last;
7300                                }
7301                        }
7302                        $formats_nav .= ': ' .
7303                                $cgi->a({-href => href(-replay=>1,
7304                                                       hash=>$hash_parent, hash_base=>undef)},
7305                                        esc_html($hash_parent_short)) .
7306                                ')';
7307                } elsif (!$co{'parent'}) {
7308                        # --root commitdiff
7309                        $formats_nav .= ' (initial)';
7310                } elsif (scalar @{$co{'parents'}} == 1) {
7311                        # single parent commit
7312                        $formats_nav .=
7313                                ' (parent: ' .
7314                                $cgi->a({-href => href(-replay=>1,
7315                                                       hash=>$co{'parent'}, hash_base=>undef)},
7316                                        esc_html(substr($co{'parent'}, 0, 7))) .
7317                                ')';
7318                } else {
7319                        # merge commit
7320                        if ($hash_parent eq '--cc') {
7321                                $formats_nav .= ' | ' .
7322                                        $cgi->a({-href => href(-replay=>1,
7323                                                               hash=>$hash, hash_parent=>'-c')},
7324                                                'combined');
7325                        } else { # $hash_parent eq '-c'
7326                                $formats_nav .= ' | ' .
7327                                        $cgi->a({-href => href(-replay=>1,
7328                                                               hash=>$hash, hash_parent=>'--cc')},
7329                                                'compact');
7330                        }
7331                        $formats_nav .=
7332                                ' (merge: ' .
7333                                join(' ', map {
7334                                        $cgi->a({-href => href(-replay=>1,
7335                                                               hash=>$_, hash_base=>undef)},
7336                                                esc_html(substr($_, 0, 7)));
7337                                } @{$co{'parents'}} ) .
7338                                ')';
7339                }
7340        }
7341
7342        my $hash_parent_param = $hash_parent;
7343        if (!defined $hash_parent_param) {
7344                # --cc for multiple parents, --root for parentless
7345                $hash_parent_param =
7346                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
7347        }
7348
7349        # read commitdiff
7350        my $fd;
7351        my @difftree;
7352        if ($format eq 'html') {
7353                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7354                        "--no-commit-id", "--patch-with-raw", "--full-index",
7355                        $hash_parent_param, $hash, "--"
7356                        or die_error(500, "Open git-diff-tree failed");
7357
7358                while (my $line = <$fd>) {
7359                        chomp $line;
7360                        # empty line ends raw part of diff-tree output
7361                        last unless $line;
7362                        push @difftree, scalar parse_difftree_raw_line($line);
7363                }
7364
7365        } elsif ($format eq 'plain') {
7366                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7367                        '-p', $hash_parent_param, $hash, "--"
7368                        or die_error(500, "Open git-diff-tree failed");
7369        } elsif ($format eq 'patch') {
7370                # For commit ranges, we limit the output to the number of
7371                # patches specified in the 'patches' feature.
7372                # For single commits, we limit the output to a single patch,
7373                # diverging from the git-format-patch default.
7374                my @commit_spec = ();
7375                if ($hash_parent) {
7376                        if ($patch_max > 0) {
7377                                push @commit_spec, "-$patch_max";
7378                        }
7379                        push @commit_spec, '-n', "$hash_parent..$hash";
7380                } else {
7381                        if ($params{-single}) {
7382                                push @commit_spec, '-1';
7383                        } else {
7384                                if ($patch_max > 0) {
7385                                        push @commit_spec, "-$patch_max";
7386                                }
7387                                push @commit_spec, "-n";
7388                        }
7389                        push @commit_spec, '--root', $hash;
7390                }
7391                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
7392                        '--encoding=utf8', '--stdout', @commit_spec
7393                        or die_error(500, "Open git-format-patch failed");
7394        } else {
7395                die_error(400, "Unknown commitdiff format");
7396        }
7397
7398        # non-textual hash id's can be cached
7399        my $expires;
7400        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
7401                $expires = "+1d";
7402        }
7403
7404        # write commit message
7405        if ($format eq 'html') {
7406                my $refs = git_get_references();
7407                my $ref = format_ref_marker($refs, $co{'id'});
7408
7409                git_header_html(undef, $expires);
7410                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
7411                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
7412                print "<div class=\"title_text\">\n" .
7413                      "<table class=\"object_header\">\n";
7414                git_print_authorship_rows(\%co);
7415                print "</table>".
7416                      "</div>\n";
7417                print "<div class=\"page_body\">\n";
7418                if (@{$co{'comment'}} > 1) {
7419                        print "<div class=\"log\">\n";
7420                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
7421                        print "</div>\n"; # class="log"
7422                }
7423
7424        } elsif ($format eq 'plain') {
7425                my $refs = git_get_references("tags");
7426                my $tagname = git_get_rev_name_tags($hash);
7427                my $filename = basename($project) . "-$hash.patch";
7428
7429                print $cgi->header(
7430                        -type => 'text/plain',
7431                        -charset => 'utf-8',
7432                        -expires => $expires,
7433                        -content_disposition => 'inline; filename="' . "$filename" . '"');
7434                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
7435                print "From: " . to_utf8($co{'author'}) . "\n";
7436                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
7437                print "Subject: " . to_utf8($co{'title'}) . "\n";
7438
7439                print "X-Git-Tag: $tagname\n" if $tagname;
7440                print "X-Git-Url: " . $cgi->self_url() . "\n\n";
7441
7442                foreach my $line (@{$co{'comment'}}) {
7443                        print to_utf8($line) . "\n";
7444                }
7445                print "---\n\n";
7446        } elsif ($format eq 'patch') {
7447                my $filename = basename($project) . "-$hash.patch";
7448
7449                print $cgi->header(
7450                        -type => 'text/plain',
7451                        -charset => 'utf-8',
7452                        -expires => $expires,
7453                        -content_disposition => 'inline; filename="' . "$filename" . '"');
7454        }
7455
7456        # write patch
7457        if ($format eq 'html') {
7458                my $use_parents = !defined $hash_parent ||
7459                        $hash_parent eq '-c' || $hash_parent eq '--cc';
7460                git_difftree_body(\@difftree, $hash,
7461                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
7462                print "<br/>\n";
7463
7464                git_patchset_body($fd, $diff_style,
7465                                  \@difftree, $hash,
7466                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
7467                close $fd;
7468                print "</div>\n"; # class="page_body"
7469                git_footer_html();
7470
7471        } elsif ($format eq 'plain') {
7472                local $/ = undef;
7473                print <$fd>;
7474                close $fd
7475                        or print "Reading git-diff-tree failed\n";
7476        } elsif ($format eq 'patch') {
7477                local $/ = undef;
7478                print <$fd>;
7479                close $fd
7480                        or print "Reading git-format-patch failed\n";
7481        }
7482}
7483
7484sub git_commitdiff_plain {
7485        git_commitdiff(-format => 'plain');
7486}
7487
7488# format-patch-style patches
7489sub git_patch {
7490        git_commitdiff(-format => 'patch', -single => 1);
7491}
7492
7493sub git_patches {
7494        git_commitdiff(-format => 'patch');
7495}
7496
7497sub git_history {
7498        git_log_generic('history', \&git_history_body,
7499                        $hash_base, $hash_parent_base,
7500                        $file_name, $hash);
7501}
7502
7503sub git_search {
7504        $searchtype ||= 'commit';
7505
7506        # check if appropriate features are enabled
7507        gitweb_check_feature('search')
7508                or die_error(403, "Search is disabled");
7509        if ($searchtype eq 'pickaxe') {
7510                # pickaxe may take all resources of your box and run for several minutes
7511                # with every query - so decide by yourself how public you make this feature
7512                gitweb_check_feature('pickaxe')
7513                        or die_error(403, "Pickaxe search is disabled");
7514        }
7515        if ($searchtype eq 'grep') {
7516                # grep search might be potentially CPU-intensive, too
7517                gitweb_check_feature('grep')
7518                        or die_error(403, "Grep search is disabled");
7519        }
7520
7521        if (!defined $searchtext) {
7522                die_error(400, "Text field is empty");
7523        }
7524        if (!defined $hash) {
7525                $hash = git_get_head_hash($project);
7526        }
7527        my %co = parse_commit($hash);
7528        if (!%co) {
7529                die_error(404, "Unknown commit object");
7530        }
7531        if (!defined $page) {
7532                $page = 0;
7533        }
7534
7535        if ($searchtype eq 'commit' ||
7536            $searchtype eq 'author' ||
7537            $searchtype eq 'committer') {
7538                git_search_message(%co);
7539        } elsif ($searchtype eq 'pickaxe') {
7540                git_search_changes(%co);
7541        } elsif ($searchtype eq 'grep') {
7542                git_search_files(%co);
7543        } else {
7544                die_error(400, "Unknown search type");
7545        }
7546}
7547
7548sub git_search_help {
7549        git_header_html();
7550        git_print_page_nav('','', $hash,$hash,$hash);
7551        print <<EOT;
7552<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
7553regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
7554the pattern entered is recognized as the POSIX extended
7555<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
7556insensitive).</p>
7557<dl>
7558<dt><b>commit</b></dt>
7559<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
7560EOT
7561        my $have_grep = gitweb_check_feature('grep');
7562        if ($have_grep) {
7563                print <<EOT;
7564<dt><b>grep</b></dt>
7565<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
7566    a different one) are searched for the given pattern. On large trees, this search can take
7567a while and put some strain on the server, so please use it with some consideration. Note that
7568due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
7569case-sensitive.</dd>
7570EOT
7571        }
7572        print <<EOT;
7573<dt><b>author</b></dt>
7574<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
7575<dt><b>committer</b></dt>
7576<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
7577EOT
7578        my $have_pickaxe = gitweb_check_feature('pickaxe');
7579        if ($have_pickaxe) {
7580                print <<EOT;
7581<dt><b>pickaxe</b></dt>
7582<dd>All commits that caused the string to appear or disappear from any file (changes that
7583added, removed or "modified" the string) will be listed. This search can take a while and
7584takes a lot of strain on the server, so please use it wisely. Note that since you may be
7585interested even in changes just changing the case as well, this search is case sensitive.</dd>
7586EOT
7587        }
7588        print "</dl>\n";
7589        git_footer_html();
7590}
7591
7592sub git_shortlog {
7593        git_log_generic('shortlog', \&git_shortlog_body,
7594                        $hash, $hash_parent);
7595}
7596
7597## ......................................................................
7598## feeds (RSS, Atom; OPML)
7599
7600sub git_feed {
7601        my $format = shift || 'atom';
7602        my $have_blame = gitweb_check_feature('blame');
7603
7604        # Atom: http://www.atomenabled.org/developers/syndication/
7605        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
7606        if ($format ne 'rss' && $format ne 'atom') {
7607                die_error(400, "Unknown web feed format");
7608        }
7609
7610        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
7611        my $head = $hash || 'HEAD';
7612        my @commitlist = parse_commits($head, 150, 0, $file_name);
7613
7614        my %latest_commit;
7615        my %latest_date;
7616        my $content_type = "application/$format+xml";
7617        if (defined $cgi->http('HTTP_ACCEPT') &&
7618                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
7619                # browser (feed reader) prefers text/xml
7620                $content_type = 'text/xml';
7621        }
7622        if (defined($commitlist[0])) {
7623                %latest_commit = %{$commitlist[0]};
7624                my $latest_epoch = $latest_commit{'committer_epoch'};
7625                %latest_date   = parse_date($latest_epoch, $latest_commit{'comitter_tz'});
7626                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
7627                if (defined $if_modified) {
7628                        my $since;
7629                        if (eval { require HTTP::Date; 1; }) {
7630                                $since = HTTP::Date::str2time($if_modified);
7631                        } elsif (eval { require Time::ParseDate; 1; }) {
7632                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
7633                        }
7634                        if (defined $since && $latest_epoch <= $since) {
7635                                print $cgi->header(
7636                                        -type => $content_type,
7637                                        -charset => 'utf-8',
7638                                        -last_modified => $latest_date{'rfc2822'},
7639                                        -status => '304 Not Modified');
7640                                return;
7641                        }
7642                }
7643                print $cgi->header(
7644                        -type => $content_type,
7645                        -charset => 'utf-8',
7646                        -last_modified => $latest_date{'rfc2822'});
7647        } else {
7648                print $cgi->header(
7649                        -type => $content_type,
7650                        -charset => 'utf-8');
7651        }
7652
7653        # Optimization: skip generating the body if client asks only
7654        # for Last-Modified date.
7655        return if ($cgi->request_method() eq 'HEAD');
7656
7657        # header variables
7658        my $title = "$site_name - $project/$action";
7659        my $feed_type = 'log';
7660        if (defined $hash) {
7661                $title .= " - '$hash'";
7662                $feed_type = 'branch log';
7663                if (defined $file_name) {
7664                        $title .= " :: $file_name";
7665                        $feed_type = 'history';
7666                }
7667        } elsif (defined $file_name) {
7668                $title .= " - $file_name";
7669                $feed_type = 'history';
7670        }
7671        $title .= " $feed_type";
7672        my $descr = git_get_project_description($project);
7673        if (defined $descr) {
7674                $descr = esc_html($descr);
7675        } else {
7676                $descr = "$project " .
7677                         ($format eq 'rss' ? 'RSS' : 'Atom') .
7678                         " feed";
7679        }
7680        my $owner = git_get_project_owner($project);
7681        $owner = esc_html($owner);
7682
7683        #header
7684        my $alt_url;
7685        if (defined $file_name) {
7686                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
7687        } elsif (defined $hash) {
7688                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
7689        } else {
7690                $alt_url = href(-full=>1, action=>"summary");
7691        }
7692        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
7693        if ($format eq 'rss') {
7694                print <<XML;
7695<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
7696<channel>
7697XML
7698                print "<title>$title</title>\n" .
7699                      "<link>$alt_url</link>\n" .
7700                      "<description>$descr</description>\n" .
7701                      "<language>en</language>\n" .
7702                      # project owner is responsible for 'editorial' content
7703                      "<managingEditor>$owner</managingEditor>\n";
7704                if (defined $logo || defined $favicon) {
7705                        # prefer the logo to the favicon, since RSS
7706                        # doesn't allow both
7707                        my $img = esc_url($logo || $favicon);
7708                        print "<image>\n" .
7709                              "<url>$img</url>\n" .
7710                              "<title>$title</title>\n" .
7711                              "<link>$alt_url</link>\n" .
7712                              "</image>\n";
7713                }
7714                if (%latest_date) {
7715                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
7716                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
7717                }
7718                print "<generator>gitweb v.$version/$git_version</generator>\n";
7719        } elsif ($format eq 'atom') {
7720                print <<XML;
7721<feed xmlns="http://www.w3.org/2005/Atom">
7722XML
7723                print "<title>$title</title>\n" .
7724                      "<subtitle>$descr</subtitle>\n" .
7725                      '<link rel="alternate" type="text/html" href="' .
7726                      $alt_url . '" />' . "\n" .
7727                      '<link rel="self" type="' . $content_type . '" href="' .
7728                      $cgi->self_url() . '" />' . "\n" .
7729                      "<id>" . href(-full=>1) . "</id>\n" .
7730                      # use project owner for feed author
7731                      "<author><name>$owner</name></author>\n";
7732                if (defined $favicon) {
7733                        print "<icon>" . esc_url($favicon) . "</icon>\n";
7734                }
7735                if (defined $logo) {
7736                        # not twice as wide as tall: 72 x 27 pixels
7737                        print "<logo>" . esc_url($logo) . "</logo>\n";
7738                }
7739                if (! %latest_date) {
7740                        # dummy date to keep the feed valid until commits trickle in:
7741                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
7742                } else {
7743                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
7744                }
7745                print "<generator version='$version/$git_version'>gitweb</generator>\n";
7746        }
7747
7748        # contents
7749        for (my $i = 0; $i <= $#commitlist; $i++) {
7750                my %co = %{$commitlist[$i]};
7751                my $commit = $co{'id'};
7752                # we read 150, we always show 30 and the ones more recent than 48 hours
7753                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
7754                        last;
7755                }
7756                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});
7757
7758                # get list of changed files
7759                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7760                        $co{'parent'} || "--root",
7761                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
7762                        or next;
7763                my @difftree = map { chomp; $_ } <$fd>;
7764                close $fd
7765                        or next;
7766
7767                # print element (entry, item)
7768                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
7769                if ($format eq 'rss') {
7770                        print "<item>\n" .
7771                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
7772                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
7773                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
7774                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
7775                              "<link>$co_url</link>\n" .
7776                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
7777                              "<content:encoded>" .
7778                              "<![CDATA[\n";
7779                } elsif ($format eq 'atom') {
7780                        print "<entry>\n" .
7781                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
7782                              "<updated>$cd{'iso-8601'}</updated>\n" .
7783                              "<author>\n" .
7784                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
7785                        if ($co{'author_email'}) {
7786                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
7787                        }
7788                        print "</author>\n" .
7789                              # use committer for contributor
7790                              "<contributor>\n" .
7791                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
7792                        if ($co{'committer_email'}) {
7793                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
7794                        }
7795                        print "</contributor>\n" .
7796                              "<published>$cd{'iso-8601'}</published>\n" .
7797                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
7798                              "<id>$co_url</id>\n" .
7799                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
7800                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
7801                }
7802                my $comment = $co{'comment'};
7803                print "<pre>\n";
7804                foreach my $line (@$comment) {
7805                        $line = esc_html($line);
7806                        print "$line\n";
7807                }
7808                print "</pre><ul>\n";
7809                foreach my $difftree_line (@difftree) {
7810                        my %difftree = parse_difftree_raw_line($difftree_line);
7811                        next if !$difftree{'from_id'};
7812
7813                        my $file = $difftree{'file'} || $difftree{'to_file'};
7814
7815                        print "<li>" .
7816                              "[" .
7817                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
7818                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
7819                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
7820                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
7821                                      -title => "diff"}, 'D');
7822                        if ($have_blame) {
7823                                print $cgi->a({-href => href(-full=>1, action=>"blame",
7824                                                             file_name=>$file, hash_base=>$commit),
7825                                              -title => "blame"}, 'B');
7826                        }
7827                        # if this is not a feed of a file history
7828                        if (!defined $file_name || $file_name ne $file) {
7829                                print $cgi->a({-href => href(-full=>1, action=>"history",
7830                                                             file_name=>$file, hash=>$commit),
7831                                              -title => "history"}, 'H');
7832                        }
7833                        $file = esc_path($file);
7834                        print "] ".
7835                              "$file</li>\n";
7836                }
7837                if ($format eq 'rss') {
7838                        print "</ul>]]>\n" .
7839                              "</content:encoded>\n" .
7840                              "</item>\n";
7841                } elsif ($format eq 'atom') {
7842                        print "</ul>\n</div>\n" .
7843                              "</content>\n" .
7844                              "</entry>\n";
7845                }
7846        }
7847
7848        # end of feed
7849        if ($format eq 'rss') {
7850                print "</channel>\n</rss>\n";
7851        } elsif ($format eq 'atom') {
7852                print "</feed>\n";
7853        }
7854}
7855
7856sub git_rss {
7857        git_feed('rss');
7858}
7859
7860sub git_atom {
7861        git_feed('atom');
7862}
7863
7864sub git_opml {
7865        my @list = git_get_projects_list();
7866        if (!@list) {
7867                die_error(404, "No projects found");
7868        }
7869
7870        print $cgi->header(
7871                -type => 'text/xml',
7872                -charset => 'utf-8',
7873                -content_disposition => 'inline; filename="opml.xml"');
7874
7875        my $title = esc_html($site_name);
7876        print <<XML;
7877<?xml version="1.0" encoding="utf-8"?>
7878<opml version="1.0">
7879<head>
7880  <title>$title OPML Export</title>
7881</head>
7882<body>
7883<outline text="git RSS feeds">
7884XML
7885
7886        foreach my $pr (@list) {
7887                my %proj = %$pr;
7888                my $head = git_get_head_hash($proj{'path'});
7889                if (!defined $head) {
7890                        next;
7891                }
7892                $git_dir = "$projectroot/$proj{'path'}";
7893                my %co = parse_commit($head);
7894                if (!%co) {
7895                        next;
7896                }
7897
7898                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
7899                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
7900                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
7901                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
7902        }
7903        print <<XML;
7904</outline>
7905</body>
7906</opml>
7907XML
7908}