gitweb / gitweb.perl on commit gitweb: place links to parent directories in page header (4426ba2)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
  23our $t0 = [ gettimeofday() ];
  24our $number_of_git_cmds = 0;
  25
  26BEGIN {
  27        CGI->compile() if $ENV{'MOD_PERL'};
  28}
  29
  30our $version = "++GIT_VERSION++";
  31
  32our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  33sub evaluate_uri {
  34        our $cgi;
  35
  36        our $my_url = $cgi->url();
  37        our $my_uri = $cgi->url(-absolute => 1);
  38
  39        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  40        # needed and used only for URLs with nonempty PATH_INFO
  41        our $base_url = $my_url;
  42
  43        # When the script is used as DirectoryIndex, the URL does not contain the name
  44        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  45        # have to do it ourselves. We make $path_info global because it's also used
  46        # later on.
  47        #
  48        # Another issue with the script being the DirectoryIndex is that the resulting
  49        # $my_url data is not the full script URL: this is good, because we want
  50        # generated links to keep implying the script name if it wasn't explicitly
  51        # indicated in the URL we're handling, but it means that $my_url cannot be used
  52        # as base URL.
  53        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  54        # to build the base URL ourselves:
  55        our $path_info = $ENV{"PATH_INFO"};
  56        if ($path_info) {
  57                if ($my_url =~ s,\Q$path_info\E$,, &&
  58                    $my_uri =~ s,\Q$path_info\E$,, &&
  59                    defined $ENV{'SCRIPT_NAME'}) {
  60                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  61                }
  62        }
  63
  64        # target of the home link on top of all pages
  65        our $home_link = $my_uri || "/";
  66}
  67
  68# core git executable to use
  69# this can just be "git" if your webserver has a sensible PATH
  70our $GIT = "++GIT_BINDIR++/git";
  71
  72# absolute fs-path which will be prepended to the project path
  73#our $projectroot = "/pub/scm";
  74our $projectroot = "++GITWEB_PROJECTROOT++";
  75
  76# fs traversing limit for getting project list
  77# the number is relative to the projectroot
  78our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  79
  80# string of the home link on top of all pages
  81our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  82
  83# name of your site or organization to appear in page titles
  84# replace this with something more descriptive for clearer bookmarks
  85our $site_name = "++GITWEB_SITENAME++"
  86                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  87
  88# html snippet to include in the <head> section of each page
  89our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
  90# filename of html text to include at top of each page
  91our $site_header = "++GITWEB_SITE_HEADER++";
  92# html text to include at home page
  93our $home_text = "++GITWEB_HOMETEXT++";
  94# filename of html text to include at bottom of each page
  95our $site_footer = "++GITWEB_SITE_FOOTER++";
  96
  97# URI of stylesheets
  98our @stylesheets = ("++GITWEB_CSS++");
  99# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 100our $stylesheet = undef;
 101# URI of GIT logo (72x27 size)
 102our $logo = "++GITWEB_LOGO++";
 103# URI of GIT favicon, assumed to be image/png type
 104our $favicon = "++GITWEB_FAVICON++";
 105# URI of gitweb.js (JavaScript code for gitweb)
 106our $javascript = "++GITWEB_JS++";
 107
 108# URI and label (title) of GIT logo link
 109#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 110#our $logo_label = "git documentation";
 111our $logo_url = "http://git-scm.com/";
 112our $logo_label = "git homepage";
 113
 114# source of projects list
 115our $projects_list = "++GITWEB_LIST++";
 116
 117# the width (in characters) of the projects list "Description" column
 118our $projects_list_description_width = 25;
 119
 120# group projects by category on the projects list
 121# (enabled if this variable evaluates to true)
 122our $projects_list_group_categories = 0;
 123
 124# default category if none specified
 125# (leave the empty string for no category)
 126our $project_list_default_category = "";
 127
 128# default order of projects list
 129# valid values are none, project, descr, owner, and age
 130our $default_projects_order = "project";
 131
 132# show repository only if this file exists
 133# (only effective if this variable evaluates to true)
 134our $export_ok = "++GITWEB_EXPORT_OK++";
 135
 136# show repository only if this subroutine returns true
 137# when given the path to the project, for example:
 138#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 139our $export_auth_hook = undef;
 140
 141# only allow viewing of repositories also shown on the overview page
 142our $strict_export = "++GITWEB_STRICT_EXPORT++";
 143
 144# list of git base URLs used for URL to where fetch project from,
 145# i.e. full URL is "$git_base_url/$project"
 146our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 147
 148# default blob_plain mimetype and default charset for text/plain blob
 149our $default_blob_plain_mimetype = 'text/plain';
 150our $default_text_plain_charset  = undef;
 151
 152# file to use for guessing MIME types before trying /etc/mime.types
 153# (relative to the current git repository)
 154our $mimetypes_file = undef;
 155
 156# assume this charset if line contains non-UTF-8 characters;
 157# it should be a valid encoding (see Encode::Supported(3pm) for the list)
 158# in which all byte sequences are valid, for example
 159# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 160# could be even 'utf-8' for the old behavior)
 161our $fallback_encoding = 'latin1';
 162
 163# rename detection options for git-diff and git-diff-tree
 164# - default is '-M', with the cost proportional to
 165#   (number of removed files) * (number of new files).
 166# - more costly is '-C' (which implies '-M'), with the cost proportional to
 167#   (number of changed files + number of removed files) * (number of new files)
 168# - even more costly is '-C', '--find-copies-harder' with cost
 169#   (number of files in the original tree) * (number of new files)
 170# - one might want to include '-B' option, e.g. '-B', '-M'
 171our @diff_opts = ('-M'); # taken from git_commit
 172
 173# Disables features that would allow repository owners to inject script into
 174# the gitweb domain.
 175our $prevent_xss = 0;
 176
 177# Path to the highlight executable to use (must be the one from
 178# http://www.andre-simon.de due to assumptions about parameters and output).
 179# Useful if highlight is not installed on your webserver's PATH.
 180# [Default: highlight]
 181our $highlight_bin = "++HIGHLIGHT_BIN++";
 182
 183# information about snapshot formats that gitweb is capable of serving
 184our %known_snapshot_formats = (
 185        # name => {
 186        #       'display' => display name,
 187        #       'type' => mime type,
 188        #       'suffix' => filename suffix,
 189        #       'format' => --format for git-archive,
 190        #       'compressor' => [compressor command and arguments]
 191        #                       (array reference, optional)
 192        #       'disabled' => boolean (optional)}
 193        #
 194        'tgz' => {
 195                'display' => 'tar.gz',
 196                'type' => 'application/x-gzip',
 197                'suffix' => '.tar.gz',
 198                'format' => 'tar',
 199                'compressor' => ['gzip', '-n']},
 200
 201        'tbz2' => {
 202                'display' => 'tar.bz2',
 203                'type' => 'application/x-bzip2',
 204                'suffix' => '.tar.bz2',
 205                'format' => 'tar',
 206                'compressor' => ['bzip2']},
 207
 208        'txz' => {
 209                'display' => 'tar.xz',
 210                'type' => 'application/x-xz',
 211                'suffix' => '.tar.xz',
 212                'format' => 'tar',
 213                'compressor' => ['xz'],
 214                'disabled' => 1},
 215
 216        'zip' => {
 217                'display' => 'zip',
 218                'type' => 'application/x-zip',
 219                'suffix' => '.zip',
 220                'format' => 'zip'},
 221);
 222
 223# Aliases so we understand old gitweb.snapshot values in repository
 224# configuration.
 225our %known_snapshot_format_aliases = (
 226        'gzip'  => 'tgz',
 227        'bzip2' => 'tbz2',
 228        'xz'    => 'txz',
 229
 230        # backward compatibility: legacy gitweb config support
 231        'x-gzip' => undef, 'gz' => undef,
 232        'x-bzip2' => undef, 'bz2' => undef,
 233        'x-zip' => undef, '' => undef,
 234);
 235
 236# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 237# are changed, it may be appropriate to change these values too via
 238# $GITWEB_CONFIG.
 239our %avatar_size = (
 240        'default' => 16,
 241        'double'  => 32
 242);
 243
 244# Used to set the maximum load that we will still respond to gitweb queries.
 245# If the server load exceeds this value then return a "503 server busy" error.
 246# If gitweb cannot determine the server load, it is taken to be 0.
 247# Leave it undefined (or set to 'undef') to turn off load checking.
 248our $maxload = 300;
 249
 250# configuration for 'highlight' (http://www.andre-simon.de/)
 251# match by basename
 252our %highlight_basename = (
 253        #'Program' => 'py',
 254        #'Library' => 'py',
 255        'SConstruct' => 'py', # SCons equivalent of Makefile
 256        'Makefile' => 'make',
 257);
 258# match by extension
 259our %highlight_ext = (
 260        # main extensions, defining name of syntax;
 261        # see files in /usr/share/highlight/langDefs/ directory
 262        map { $_ => $_ }
 263                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
 264        # alternate extensions, see /etc/highlight/filetypes.conf
 265        'h' => 'c',
 266        map { $_ => 'sh'  } qw(bash zsh ksh),
 267        map { $_ => 'cpp' } qw(cxx c++ cc),
 268        map { $_ => 'php' } qw(php3 php4 php5 phps),
 269        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
 270        map { $_ => 'make'} qw(mak mk),
 271        map { $_ => 'xml' } qw(xhtml html htm),
 272);
 273
 274# You define site-wide feature defaults here; override them with
 275# $GITWEB_CONFIG as necessary.
 276our %feature = (
 277        # feature => {
 278        #       'sub' => feature-sub (subroutine),
 279        #       'override' => allow-override (boolean),
 280        #       'default' => [ default options...] (array reference)}
 281        #
 282        # if feature is overridable (it means that allow-override has true value),
 283        # then feature-sub will be called with default options as parameters;
 284        # return value of feature-sub indicates if to enable specified feature
 285        #
 286        # if there is no 'sub' key (no feature-sub), then feature cannot be
 287        # overridden
 288        #
 289        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 290        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 291        # is enabled
 292
 293        # Enable the 'blame' blob view, showing the last commit that modified
 294        # each line in the file. This can be very CPU-intensive.
 295
 296        # To enable system wide have in $GITWEB_CONFIG
 297        # $feature{'blame'}{'default'} = [1];
 298        # To have project specific config enable override in $GITWEB_CONFIG
 299        # $feature{'blame'}{'override'} = 1;
 300        # and in project config gitweb.blame = 0|1;
 301        'blame' => {
 302                'sub' => sub { feature_bool('blame', @_) },
 303                'override' => 0,
 304                'default' => [0]},
 305
 306        # Enable the 'snapshot' link, providing a compressed archive of any
 307        # tree. This can potentially generate high traffic if you have large
 308        # project.
 309
 310        # Value is a list of formats defined in %known_snapshot_formats that
 311        # you wish to offer.
 312        # To disable system wide have in $GITWEB_CONFIG
 313        # $feature{'snapshot'}{'default'} = [];
 314        # To have project specific config enable override in $GITWEB_CONFIG
 315        # $feature{'snapshot'}{'override'} = 1;
 316        # and in project config, a comma-separated list of formats or "none"
 317        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 318        'snapshot' => {
 319                'sub' => \&feature_snapshot,
 320                'override' => 0,
 321                'default' => ['tgz']},
 322
 323        # Enable text search, which will list the commits which match author,
 324        # committer or commit text to a given string.  Enabled by default.
 325        # Project specific override is not supported.
 326        #
 327        # Note that this controls all search features, which means that if
 328        # it is disabled, then 'grep' and 'pickaxe' search would also be
 329        # disabled.
 330        'search' => {
 331                'override' => 0,
 332                'default' => [1]},
 333
 334        # Enable grep search, which will list the files in currently selected
 335        # tree containing the given string. Enabled by default. This can be
 336        # potentially CPU-intensive, of course.
 337        # Note that you need to have 'search' feature enabled too.
 338
 339        # To enable system wide have in $GITWEB_CONFIG
 340        # $feature{'grep'}{'default'} = [1];
 341        # To have project specific config enable override in $GITWEB_CONFIG
 342        # $feature{'grep'}{'override'} = 1;
 343        # and in project config gitweb.grep = 0|1;
 344        'grep' => {
 345                'sub' => sub { feature_bool('grep', @_) },
 346                'override' => 0,
 347                'default' => [1]},
 348
 349        # Enable the pickaxe search, which will list the commits that modified
 350        # a given string in a file. This can be practical and quite faster
 351        # alternative to 'blame', but still potentially CPU-intensive.
 352        # Note that you need to have 'search' feature enabled too.
 353
 354        # To enable system wide have in $GITWEB_CONFIG
 355        # $feature{'pickaxe'}{'default'} = [1];
 356        # To have project specific config enable override in $GITWEB_CONFIG
 357        # $feature{'pickaxe'}{'override'} = 1;
 358        # and in project config gitweb.pickaxe = 0|1;
 359        'pickaxe' => {
 360                'sub' => sub { feature_bool('pickaxe', @_) },
 361                'override' => 0,
 362                'default' => [1]},
 363
 364        # Enable showing size of blobs in a 'tree' view, in a separate
 365        # column, similar to what 'ls -l' does.  This costs a bit of IO.
 366
 367        # To disable system wide have in $GITWEB_CONFIG
 368        # $feature{'show-sizes'}{'default'} = [0];
 369        # To have project specific config enable override in $GITWEB_CONFIG
 370        # $feature{'show-sizes'}{'override'} = 1;
 371        # and in project config gitweb.showsizes = 0|1;
 372        'show-sizes' => {
 373                'sub' => sub { feature_bool('showsizes', @_) },
 374                'override' => 0,
 375                'default' => [1]},
 376
 377        # Make gitweb use an alternative format of the URLs which can be
 378        # more readable and natural-looking: project name is embedded
 379        # directly in the path and the query string contains other
 380        # auxiliary information. All gitweb installations recognize
 381        # URL in either format; this configures in which formats gitweb
 382        # generates links.
 383
 384        # To enable system wide have in $GITWEB_CONFIG
 385        # $feature{'pathinfo'}{'default'} = [1];
 386        # Project specific override is not supported.
 387
 388        # Note that you will need to change the default location of CSS,
 389        # favicon, logo and possibly other files to an absolute URL. Also,
 390        # if gitweb.cgi serves as your indexfile, you will need to force
 391        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 392        'pathinfo' => {
 393                'override' => 0,
 394                'default' => [0]},
 395
 396        # Make gitweb consider projects in project root subdirectories
 397        # to be forks of existing projects. Given project $projname.git,
 398        # projects matching $projname/*.git will not be shown in the main
 399        # projects list, instead a '+' mark will be added to $projname
 400        # there and a 'forks' view will be enabled for the project, listing
 401        # all the forks. If project list is taken from a file, forks have
 402        # to be listed after the main project.
 403
 404        # To enable system wide have in $GITWEB_CONFIG
 405        # $feature{'forks'}{'default'} = [1];
 406        # Project specific override is not supported.
 407        'forks' => {
 408                'override' => 0,
 409                'default' => [0]},
 410
 411        # Insert custom links to the action bar of all project pages.
 412        # This enables you mainly to link to third-party scripts integrating
 413        # into gitweb; e.g. git-browser for graphical history representation
 414        # or custom web-based repository administration interface.
 415
 416        # The 'default' value consists of a list of triplets in the form
 417        # (label, link, position) where position is the label after which
 418        # to insert the link and link is a format string where %n expands
 419        # to the project name, %f to the project path within the filesystem,
 420        # %h to the current hash (h gitweb parameter) and %b to the current
 421        # hash base (hb gitweb parameter); %% expands to %.
 422
 423        # To enable system wide have in $GITWEB_CONFIG e.g.
 424        # $feature{'actions'}{'default'} = [('graphiclog',
 425        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 426        # Project specific override is not supported.
 427        'actions' => {
 428                'override' => 0,
 429                'default' => []},
 430
 431        # Allow gitweb to scan project content tags of the project repository,
 432        # and display the popular Web 2.0-ish "tag cloud" near the projects
 433        # list.  Note that this is something COMPLETELY different from the
 434        # normal Git tags.
 435
 436        # gitweb by itself can show existing tags, but it does not handle
 437        # tagging itself; you need to do it externally, outside gitweb.
 438        # The format is described in git_get_project_ctags() subroutine.
 439        # You may want to install the HTML::TagCloud Perl module to get
 440        # a pretty tag cloud instead of just a list of tags.
 441
 442        # To enable system wide have in $GITWEB_CONFIG
 443        # $feature{'ctags'}{'default'} = [1];
 444        # Project specific override is not supported.
 445
 446        # In the future whether ctags editing is enabled might depend
 447        # on the value, but using 1 should always mean no editing of ctags.
 448        'ctags' => {
 449                'override' => 0,
 450                'default' => [0]},
 451
 452        # The maximum number of patches in a patchset generated in patch
 453        # view. Set this to 0 or undef to disable patch view, or to a
 454        # negative number to remove any limit.
 455
 456        # To disable system wide have in $GITWEB_CONFIG
 457        # $feature{'patches'}{'default'} = [0];
 458        # To have project specific config enable override in $GITWEB_CONFIG
 459        # $feature{'patches'}{'override'} = 1;
 460        # and in project config gitweb.patches = 0|n;
 461        # where n is the maximum number of patches allowed in a patchset.
 462        'patches' => {
 463                'sub' => \&feature_patches,
 464                'override' => 0,
 465                'default' => [16]},
 466
 467        # Avatar support. When this feature is enabled, views such as
 468        # shortlog or commit will display an avatar associated with
 469        # the email of the committer(s) and/or author(s).
 470
 471        # Currently available providers are gravatar and picon.
 472        # If an unknown provider is specified, the feature is disabled.
 473
 474        # Gravatar depends on Digest::MD5.
 475        # Picon currently relies on the indiana.edu database.
 476
 477        # To enable system wide have in $GITWEB_CONFIG
 478        # $feature{'avatar'}{'default'} = ['<provider>'];
 479        # where <provider> is either gravatar or picon.
 480        # To have project specific config enable override in $GITWEB_CONFIG
 481        # $feature{'avatar'}{'override'} = 1;
 482        # and in project config gitweb.avatar = <provider>;
 483        'avatar' => {
 484                'sub' => \&feature_avatar,
 485                'override' => 0,
 486                'default' => ['']},
 487
 488        # Enable displaying how much time and how many git commands
 489        # it took to generate and display page.  Disabled by default.
 490        # Project specific override is not supported.
 491        'timed' => {
 492                'override' => 0,
 493                'default' => [0]},
 494
 495        # Enable turning some links into links to actions which require
 496        # JavaScript to run (like 'blame_incremental').  Not enabled by
 497        # default.  Project specific override is currently not supported.
 498        'javascript-actions' => {
 499                'override' => 0,
 500                'default' => [0]},
 501
 502        # Enable and configure ability to change common timezone for dates
 503        # in gitweb output via JavaScript.  Enabled by default.
 504        # Project specific override is not supported.
 505        'javascript-timezone' => {
 506                'override' => 0,
 507                'default' => [
 508                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 509                                     # or undef to turn off this feature
 510                        'gitweb_tz', # name of cookie where to store selected timezone
 511                        'datetime',  # CSS class used to mark up dates for manipulation
 512                ]},
 513
 514        # Syntax highlighting support. This is based on Daniel Svensson's
 515        # and Sham Chukoury's work in gitweb-xmms2.git.
 516        # It requires the 'highlight' program present in $PATH,
 517        # and therefore is disabled by default.
 518
 519        # To enable system wide have in $GITWEB_CONFIG
 520        # $feature{'highlight'}{'default'} = [1];
 521
 522        'highlight' => {
 523                'sub' => sub { feature_bool('highlight', @_) },
 524                'override' => 0,
 525                'default' => [0]},
 526
 527        # Enable displaying of remote heads in the heads list
 528
 529        # To enable system wide have in $GITWEB_CONFIG
 530        # $feature{'remote_heads'}{'default'} = [1];
 531        # To have project specific config enable override in $GITWEB_CONFIG
 532        # $feature{'remote_heads'}{'override'} = 1;
 533        # and in project config gitweb.remote_heads = 0|1;
 534        'remote_heads' => {
 535                'sub' => sub { feature_bool('remote_heads', @_) },
 536                'override' => 0,
 537                'default' => [0]},
 538);
 539
 540sub gitweb_get_feature {
 541        my ($name) = @_;
 542        return unless exists $feature{$name};
 543        my ($sub, $override, @defaults) = (
 544                $feature{$name}{'sub'},
 545                $feature{$name}{'override'},
 546                @{$feature{$name}{'default'}});
 547        # project specific override is possible only if we have project
 548        our $git_dir; # global variable, declared later
 549        if (!$override || !defined $git_dir) {
 550                return @defaults;
 551        }
 552        if (!defined $sub) {
 553                warn "feature $name is not overridable";
 554                return @defaults;
 555        }
 556        return $sub->(@defaults);
 557}
 558
 559# A wrapper to check if a given feature is enabled.
 560# With this, you can say
 561#
 562#   my $bool_feat = gitweb_check_feature('bool_feat');
 563#   gitweb_check_feature('bool_feat') or somecode;
 564#
 565# instead of
 566#
 567#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 568#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 569#
 570sub gitweb_check_feature {
 571        return (gitweb_get_feature(@_))[0];
 572}
 573
 574
 575sub feature_bool {
 576        my $key = shift;
 577        my ($val) = git_get_project_config($key, '--bool');
 578
 579        if (!defined $val) {
 580                return ($_[0]);
 581        } elsif ($val eq 'true') {
 582                return (1);
 583        } elsif ($val eq 'false') {
 584                return (0);
 585        }
 586}
 587
 588sub feature_snapshot {
 589        my (@fmts) = @_;
 590
 591        my ($val) = git_get_project_config('snapshot');
 592
 593        if ($val) {
 594                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 595        }
 596
 597        return @fmts;
 598}
 599
 600sub feature_patches {
 601        my @val = (git_get_project_config('patches', '--int'));
 602
 603        if (@val) {
 604                return @val;
 605        }
 606
 607        return ($_[0]);
 608}
 609
 610sub feature_avatar {
 611        my @val = (git_get_project_config('avatar'));
 612
 613        return @val ? @val : @_;
 614}
 615
 616# checking HEAD file with -e is fragile if the repository was
 617# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 618# and then pruned.
 619sub check_head_link {
 620        my ($dir) = @_;
 621        my $headfile = "$dir/HEAD";
 622        return ((-e $headfile) ||
 623                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 624}
 625
 626sub check_export_ok {
 627        my ($dir) = @_;
 628        return (check_head_link($dir) &&
 629                (!$export_ok || -e "$dir/$export_ok") &&
 630                (!$export_auth_hook || $export_auth_hook->($dir)));
 631}
 632
 633# process alternate names for backward compatibility
 634# filter out unsupported (unknown) snapshot formats
 635sub filter_snapshot_fmts {
 636        my @fmts = @_;
 637
 638        @fmts = map {
 639                exists $known_snapshot_format_aliases{$_} ?
 640                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 641        @fmts = grep {
 642                exists $known_snapshot_formats{$_} &&
 643                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 644}
 645
 646# If it is set to a code reference, that code is run once per
 647# request, allowing updates to configuration that changes with each request,
 648# while the other code in the config file is run only once.
 649#
 650# Otherwise, if it is false then gitweb would process config file only once;
 651# if it is true then gitweb config would be run for each request.
 652our $per_request_config = 1;
 653
 654# read and parse gitweb config file given by its parameter.
 655# returns true on success, false on recoverable error, allowing
 656# to chain this subroutine, using first file that exists.
 657# dies on errors during parsing config file, as it is unrecoverable.
 658sub read_config_file {
 659        my $filename = shift;
 660        return unless defined $filename;
 661        # die if there are errors parsing config file
 662        if (-e $filename) {
 663                do $filename;
 664                die $@ if $@;
 665                return 1;
 666        }
 667        return;
 668}
 669
 670our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
 671sub evaluate_gitweb_config {
 672        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 673        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 674        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
 675
 676        # Protect agains duplications of file names, to not read config twice.
 677        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
 678        # there possibility of duplication of filename there doesn't matter.
 679        $GITWEB_CONFIG = ""        if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
 680        $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
 681
 682        # Common system-wide settings for convenience.
 683        # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
 684        read_config_file($GITWEB_CONFIG_COMMON);
 685
 686        # Use first config file that exists.  This means use the per-instance
 687        # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
 688        read_config_file($GITWEB_CONFIG) and return;
 689        read_config_file($GITWEB_CONFIG_SYSTEM);
 690}
 691
 692# Get loadavg of system, to compare against $maxload.
 693# Currently it requires '/proc/loadavg' present to get loadavg;
 694# if it is not present it returns 0, which means no load checking.
 695sub get_loadavg {
 696        if( -e '/proc/loadavg' ){
 697                open my $fd, '<', '/proc/loadavg'
 698                        or return 0;
 699                my @load = split(/\s+/, scalar <$fd>);
 700                close $fd;
 701
 702                # The first three columns measure CPU and IO utilization of the last one,
 703                # five, and 10 minute periods.  The fourth column shows the number of
 704                # currently running processes and the total number of processes in the m/n
 705                # format.  The last column displays the last process ID used.
 706                return $load[0] || 0;
 707        }
 708        # additional checks for load average should go here for things that don't export
 709        # /proc/loadavg
 710
 711        return 0;
 712}
 713
 714# version of the core git binary
 715our $git_version;
 716sub evaluate_git_version {
 717        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 718        $number_of_git_cmds++;
 719}
 720
 721sub check_loadavg {
 722        if (defined $maxload && get_loadavg() > $maxload) {
 723                die_error(503, "The load average on the server is too high");
 724        }
 725}
 726
 727# ======================================================================
 728# input validation and dispatch
 729
# input parameters can be collected from a variety of sources (presently, CGI
# and PATH_INFO), so we define an %input_params hash that collects them all
# together during validation: this allows subsequent uses (e.g. href()) to be
# agnostic of the parameter origin

our %input_params = ();

# input parameters are stored with the long parameter name as key. This will
# also be used in the href subroutine to convert parameters to their CGI
# equivalent, and since the href() usage is the most frequent one, we store
# the name -> CGI key mapping here, instead of the reverse.
#
# The mapping is kept twice: @cgi_param_mapping is the ordered list of
# (name, CGI key) pairs, which href() walks two elements at a time when it
# builds a query string, and %cgi_param_mapping is the same data as a hash
# for lookups by long name.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
        project => "p",
        action => "a",
        file_name => "f",
        file_parent => "fp",
        hash => "h",
        hash_parent => "hp",
        hash_base => "hb",
        hash_parent_base => "hpb",
        page => "pg",
        order => "o",
        searchtext => "s",
        searchtype => "st",
        snapshot_format => "sf",
        extra_options => "opt",
        search_use_regexp => "sr",
        ctag => "by_tag",
        diff_style => "ds",
        project_filter => "pf",
        # this must be last entry (for manipulation from JavaScript)
        javascript => "js"
);
our %cgi_param_mapping = @cgi_param_mapping;
 768
# we will also need to know the possible actions, for validation
#
# Maps each action name to the subroutine implementing it. The keys are what
# validate_action() and evaluate_path_info() accept as an action; dispatch()
# looks the selected action up here and calls the handler without arguments.
our %actions = (
        "blame" => \&git_blame,
        "blame_incremental" => \&git_blame_incremental,
        "blame_data" => \&git_blame_data,
        "blobdiff" => \&git_blobdiff,
        "blobdiff_plain" => \&git_blobdiff_plain,
        "blob" => \&git_blob,
        "blob_plain" => \&git_blob_plain,
        "commitdiff" => \&git_commitdiff,
        "commitdiff_plain" => \&git_commitdiff_plain,
        "commit" => \&git_commit,
        "forks" => \&git_forks,
        "heads" => \&git_heads,
        "history" => \&git_history,
        "log" => \&git_log,
        "patch" => \&git_patch,
        "patches" => \&git_patches,
        "remotes" => \&git_remotes,
        "rss" => \&git_rss,
        "atom" => \&git_atom,
        "search" => \&git_search,
        "search_help" => \&git_search_help,
        "shortlog" => \&git_shortlog,
        "summary" => \&git_summary,
        "tag" => \&git_tag,
        "tags" => \&git_tags,
        "tree" => \&git_tree,
        "snapshot" => \&git_snapshot,
        "object" => \&git_object,
        # those below don't need $project; dispatch() exempts exactly these
        # three names from its "Project needed" check
        "opml" => \&git_opml,
        "project_list" => \&git_project_list,
        "project_index" => \&git_project_index,
);
 804
# finally, we have the hash of allowed extra_options for the commands that
# allow them
#
# Key: the option string as passed in the 'opt' parameter; value: reference
# to the list of action names that accept it. evaluate_and_validate_params()
# rejects any option that is not a key here or whose list does not contain
# the current action.
our %allowed_options = (
        "--no-merges" => [ qw(rss atom log shortlog history) ],
);
 810
 811# fill %input_params with the CGI parameters. All values except for 'opt'
 812# should be single values, but opt can be an array. We should probably
 813# build an array of parameters that can be multi-valued, but since for the time
 814# being it's only this one, we just single it out
 815sub evaluate_query_params {
 816        our $cgi;
 817
 818        while (my ($name, $symbol) = each %cgi_param_mapping) {
 819                if ($symbol eq 'opt') {
 820                        $input_params{$name} = [ $cgi->param($symbol) ];
 821                } else {
 822                        $input_params{$name} = $cgi->param($symbol);
 823                }
 824        }
 825}
 826
 827# now read PATH_INFO and update the parameter list for missing parameters
 828sub evaluate_path_info {
 829        return if defined $input_params{'project'};
 830        return if !$path_info;
 831        $path_info =~ s,^/+,,;
 832        return if !$path_info;
 833
 834        # find which part of PATH_INFO is project
 835        my $project = $path_info;
 836        $project =~ s,/+$,,;
 837        while ($project && !check_head_link("$projectroot/$project")) {
 838                $project =~ s,/*[^/]*$,,;
 839        }
 840        return unless $project;
 841        $input_params{'project'} = $project;
 842
 843        # do not change any parameters if an action is given using the query string
 844        return if $input_params{'action'};
 845        $path_info =~ s,^\Q$project\E/*,,;
 846
 847        # next, check if we have an action
 848        my $action = $path_info;
 849        $action =~ s,/.*$,,;
 850        if (exists $actions{$action}) {
 851                $path_info =~ s,^$action/*,,;
 852                $input_params{'action'} = $action;
 853        }
 854
 855        # list of actions that want hash_base instead of hash, but can have no
 856        # pathname (f) parameter
 857        my @wants_base = (
 858                'tree',
 859                'history',
 860        );
 861
 862        # we want to catch, among others
 863        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 864        my ($parentrefname, $parentpathname, $refname, $pathname) =
 865                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 866
 867        # first, analyze the 'current' part
 868        if (defined $pathname) {
 869                # we got "branch:filename" or "branch:dir/"
 870                # we could use git_get_type(branch:pathname), but:
 871                # - it needs $git_dir
 872                # - it does a git() call
 873                # - the convention of terminating directories with a slash
 874                #   makes it superfluous
 875                # - embedding the action in the PATH_INFO would make it even
 876                #   more superfluous
 877                $pathname =~ s,^/+,,;
 878                if (!$pathname || substr($pathname, -1) eq "/") {
 879                        $input_params{'action'} ||= "tree";
 880                        $pathname =~ s,/$,,;
 881                } else {
 882                        # the default action depends on whether we had parent info
 883                        # or not
 884                        if ($parentrefname) {
 885                                $input_params{'action'} ||= "blobdiff_plain";
 886                        } else {
 887                                $input_params{'action'} ||= "blob_plain";
 888                        }
 889                }
 890                $input_params{'hash_base'} ||= $refname;
 891                $input_params{'file_name'} ||= $pathname;
 892        } elsif (defined $refname) {
 893                # we got "branch". In this case we have to choose if we have to
 894                # set hash or hash_base.
 895                #
 896                # Most of the actions without a pathname only want hash to be
 897                # set, except for the ones specified in @wants_base that want
 898                # hash_base instead. It should also be noted that hand-crafted
 899                # links having 'history' as an action and no pathname or hash
 900                # set will fail, but that happens regardless of PATH_INFO.
 901                if (defined $parentrefname) {
 902                        # if there is parent let the default be 'shortlog' action
 903                        # (for http://git.example.com/repo.git/A..B links); if there
 904                        # is no parent, dispatch will detect type of object and set
 905                        # action appropriately if required (if action is not set)
 906                        $input_params{'action'} ||= "shortlog";
 907                }
 908                if ($input_params{'action'} &&
 909                    grep { $_ eq $input_params{'action'} } @wants_base) {
 910                        $input_params{'hash_base'} ||= $refname;
 911                } else {
 912                        $input_params{'hash'} ||= $refname;
 913                }
 914        }
 915
 916        # next, handle the 'parent' part, if present
 917        if (defined $parentrefname) {
 918                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 919                # someproject/blobdiff/oldrev..newrev:/filename
 920                if ($parentpathname) {
 921                        $parentpathname =~ s,^/+,,;
 922                        $parentpathname =~ s,/$,,;
 923                        $input_params{'file_parent'} ||= $parentpathname;
 924                } else {
 925                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 926                }
 927                # we assume that hash_parent_base is wanted if a path was specified,
 928                # or if the action wants hash_base instead of hash
 929                if (defined $input_params{'file_parent'} ||
 930                        grep { $_ eq $input_params{'action'} } @wants_base) {
 931                        $input_params{'hash_parent_base'} ||= $parentrefname;
 932                } else {
 933                        $input_params{'hash_parent'} ||= $parentrefname;
 934                }
 935        }
 936
 937        # for the snapshot action, we allow URLs in the form
 938        # $project/snapshot/$hash.ext
 939        # where .ext determines the snapshot and gets removed from the
 940        # passed $refname to provide the $hash.
 941        #
 942        # To be able to tell that $refname includes the format extension, we
 943        # require the following two conditions to be satisfied:
 944        # - the hash input parameter MUST have been set from the $refname part
 945        #   of the URL (i.e. they must be equal)
 946        # - the snapshot format MUST NOT have been defined already (e.g. from
 947        #   CGI parameter sf)
 948        # It's also useless to try any matching unless $refname has a dot,
 949        # so we check for that too
 950        if (defined $input_params{'action'} &&
 951                $input_params{'action'} eq 'snapshot' &&
 952                defined $refname && index($refname, '.') != -1 &&
 953                $refname eq $input_params{'hash'} &&
 954                !defined $input_params{'snapshot_format'}) {
 955                # We loop over the known snapshot formats, checking for
 956                # extensions. Allowed extensions are both the defined suffix
 957                # (which includes the initial dot already) and the snapshot
 958                # format key itself, with a prepended dot
 959                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 960                        my $hash = $refname;
 961                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 962                                next;
 963                        }
 964                        my $sfx = $1;
 965                        # a valid suffix was found, so set the snapshot format
 966                        # and reset the hash parameter
 967                        $input_params{'snapshot_format'} = $fmt;
 968                        $input_params{'hash'} = $hash;
 969                        # we also set the format suffix to the one requested
 970                        # in the URL: this way a request for e.g. .tgz returns
 971                        # a .tgz instead of a .tar.gz
 972                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 973                        last;
 974                }
 975        }
 976}
 977
 978our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 979     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 980     $searchtext, $search_regexp, $project_filter);
 981sub evaluate_and_validate_params {
 982        our $action = $input_params{'action'};
 983        if (defined $action) {
 984                if (!validate_action($action)) {
 985                        die_error(400, "Invalid action parameter");
 986                }
 987        }
 988
 989        # parameters which are pathnames
 990        our $project = $input_params{'project'};
 991        if (defined $project) {
 992                if (!validate_project($project)) {
 993                        undef $project;
 994                        die_error(404, "No such project");
 995                }
 996        }
 997
 998        our $project_filter = $input_params{'project_filter'};
 999        if (defined $project_filter) {
1000                if (!validate_pathname($project_filter)) {
1001                        die_error(404, "Invalid project_filter parameter");
1002                }
1003        }
1004
1005        our $file_name = $input_params{'file_name'};
1006        if (defined $file_name) {
1007                if (!validate_pathname($file_name)) {
1008                        die_error(400, "Invalid file parameter");
1009                }
1010        }
1011
1012        our $file_parent = $input_params{'file_parent'};
1013        if (defined $file_parent) {
1014                if (!validate_pathname($file_parent)) {
1015                        die_error(400, "Invalid file parent parameter");
1016                }
1017        }
1018
1019        # parameters which are refnames
1020        our $hash = $input_params{'hash'};
1021        if (defined $hash) {
1022                if (!validate_refname($hash)) {
1023                        die_error(400, "Invalid hash parameter");
1024                }
1025        }
1026
1027        our $hash_parent = $input_params{'hash_parent'};
1028        if (defined $hash_parent) {
1029                if (!validate_refname($hash_parent)) {
1030                        die_error(400, "Invalid hash parent parameter");
1031                }
1032        }
1033
1034        our $hash_base = $input_params{'hash_base'};
1035        if (defined $hash_base) {
1036                if (!validate_refname($hash_base)) {
1037                        die_error(400, "Invalid hash base parameter");
1038                }
1039        }
1040
1041        our @extra_options = @{$input_params{'extra_options'}};
1042        # @extra_options is always defined, since it can only be (currently) set from
1043        # CGI, and $cgi->param() returns the empty array in array context if the param
1044        # is not set
1045        foreach my $opt (@extra_options) {
1046                if (not exists $allowed_options{$opt}) {
1047                        die_error(400, "Invalid option parameter");
1048                }
1049                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1050                        die_error(400, "Invalid option parameter for this action");
1051                }
1052        }
1053
1054        our $hash_parent_base = $input_params{'hash_parent_base'};
1055        if (defined $hash_parent_base) {
1056                if (!validate_refname($hash_parent_base)) {
1057                        die_error(400, "Invalid hash parent base parameter");
1058                }
1059        }
1060
1061        # other parameters
1062        our $page = $input_params{'page'};
1063        if (defined $page) {
1064                if ($page =~ m/[^0-9]/) {
1065                        die_error(400, "Invalid page parameter");
1066                }
1067        }
1068
1069        our $searchtype = $input_params{'searchtype'};
1070        if (defined $searchtype) {
1071                if ($searchtype =~ m/[^a-z]/) {
1072                        die_error(400, "Invalid searchtype parameter");
1073                }
1074        }
1075
1076        our $search_use_regexp = $input_params{'search_use_regexp'};
1077
1078        our $searchtext = $input_params{'searchtext'};
1079        our $search_regexp;
1080        if (defined $searchtext) {
1081                if (length($searchtext) < 2) {
1082                        die_error(403, "At least two characters are required for search parameter");
1083                }
1084                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
1085        }
1086}
1087
# path to the current git repository; only assigned when a project was
# selected, otherwise the variable is left as it is
our $git_dir;
sub evaluate_git_dir {
        our $git_dir;
        if ($project) {
                $git_dir = "$projectroot/$project";
        }
}
1093
our (@snapshot_fmts, $git_avatar);
# Read the 'snapshot' and 'avatar' features into @snapshot_fmts and
# $git_avatar.
sub configure_gitweb_features {
        our (@snapshot_fmts, $git_avatar);

        # list of supported snapshot formats
        @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # the avatar feature must name a known provider whose dependencies
        # are available; in every other case $git_avatar becomes the empty
        # string
        ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'gravatar') {
                # gravatar needs Digest::MD5
                my $have_md5 = eval { require Digest::MD5; 1; };
                $git_avatar = '' unless ($have_md5);
        } elsif ($git_avatar ne 'picon') {
                # picon has no dependencies; anything else is unknown
                $git_avatar = '';
        }
}
1113
# custom error handler: 'die <message>' is Internal Server Error
#
# Installed through CGI::Carp::set_message (see below the sub), which hands
# over the message, already HTML escaped, as the only argument.
sub handle_errors_html {
        my ($msg) = @_;

        # switch back to a plain text message first: should die_error itself
        # fail, this handler must not be entered again (infinite loop)
        set_message("Error occured when inside die_error:\n$msg");

        # a handler set via CGI::Carp::set_message runs _after_ the HTTP
        # headers were written, so die_error must neither write them nor try
        # to jump out of the handler
        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1128
# dispatch
#
# Pick a default action when none was requested, check that the action is
# known and has the project it needs, then run its handler from %actions.
sub dispatch {
        unless (defined $action) {
                # no action given: derive it from the object type if we have an
                # object, else show the project summary or the project list
                $action =
                        defined $hash
                                ? git_get_type($hash) :
                        (defined $hash_base && defined $file_name)
                                ? git_get_type("$hash_base:$file_name") :
                        defined $project
                                ? 'summary'
                                : 'project_list';
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        my $needs_project = $action !~ m/^(?:opml|project_list|project_index)$/;
        die_error(400, "Project needed")
                if $needs_project && !$project;

        $actions{$action}->();
}
1151
# Restart the per-request bookkeeping: the start time is taken anew (only
# if $t0 is defined at all) and the git command counter goes back to zero.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1157
our $first_request = 1;
# Serve one request: set up the per-request state, then dispatch.
sub run_request {
        reset_timer();

        evaluate_uri();

        # configuration file and git version are read once, on the first
        # request handled by this process
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }

        # $per_request_config is either a subroutine to run for every request,
        # or a true value asking to re-read the configuration for every request
        # after the first one
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }

        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        # collect, complete and validate the input parameters
        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1188
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;
# Switch to FastCGI operation: requests are created through CGI::Fast, and
# the request loop is told to stop once more than 100 requests were counted.
sub configure_as_fcgi {
        our ($CGI, $is_last_request);

        require CGI::Fast;
        $CGI = 'CGI::Fast';

        # let each child service 100 requests
        my $served = 0;
        $is_last_request = sub { ++$served > 100 };
}
# Decide how to run, based on the script name and the command line:
# a name ending in ".fcgi" or the --fastcgi option (alias --fcgi, -f) selects
# FastCGI mode, and --nproc=N (alias -n) sets up FCGI::ProcManager with N
# processes, provided that module can be loaded.
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # handler for the nproc option: install the process manager hooks
        my $use_proc_manager = sub {
                my ($arg, $val) = @_;
                # the option is ignored when FCGI::ProcManager is not available
                return unless eval { require FCGI::ProcManager; 1; };

                our ($pre_listen_hook, $pre_dispatch_hook, $post_dispatch_hook);
                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $val,
                });
                $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1223
# Main loop: evaluate the command line once, then create and serve request
# objects until $CGI->new() returns false or $is_last_request->() says that
# this was the last one. The optional hooks are the ones installed by the
# nproc option in evaluate_argv().
sub run {
        evaluate_argv();

        $first_request = 1;
        # called once, before the first request is accepted
        $pre_listen_hook->()
                if $pre_listen_hook;

 REQUEST:
        while ($cgi = $CGI->new()) {
                $pre_dispatch_hook->()
                        if $pre_dispatch_hook;

                run_request();

                $post_dispatch_hook->()
                        if $post_dispatch_hook;
                # run_request() does its one-time setup only while this is true
                $first_request = 0;

                last REQUEST if ($is_last_request->());
        }

        # NOTE(review): nothing inside this sub refers to the label below;
        # presumably it is a jump target for code elsewhere in the file --
        # confirm before renaming or removing it.
 DONE_GITWEB:
        1;
}
1248
# serve the request(s)
run();

# run() has returned: leave in the way that fits how this file was loaded
if (defined caller) {
        # wrapped in a subroutine processing requests,
        # e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
        return;
} else {
        # pure CGI script, serving single request
        exit;
}
1259
1260## ======================================================================
1261## action links
1262
# Build a gitweb URL from named parameters (the long names listed in
# @cgi_param_mapping, e.g. project, action, hash, file_name).
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# 'project' defaults to the current $project. When path_info URLs are in use,
# as many parameters as possible are placed in the path; whatever is left is
# appended as a query string, in the order of @cgi_param_mapping.
# Returns the URL as a string.
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over every parameter of the current request that the
                # caller did not mention explicitly
                foreach my $name (keys %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot
                # (the action may be missing, so test for that first)
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        # only look up formats that really exist: a lookup with
                        # an unknown (or missing) name would create an empty
                        # entry in %known_snapshot_formats as a side effect
                        if (defined $fmt && exists $known_snapshot_formats{$fmt}
                            && defined $known_snapshot_formats{$fmt}{'suffix'}) {
                                $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        }
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1392
1393
1394## ======================================================================
1395## validation, quoting/unquoting and escaping
1396
# Return the action name if it is a key of %actions, undef otherwise
# (also for an empty or otherwise false argument).
sub validate_action {
        my ($input) = @_;
        return undef unless $input;
        if (exists $actions{$input}) {
                return $input;
        }
        return undef;
}
1402
# Return the project name if it may be served, undef otherwise. The name has
# to be a valid pathname, denote a directory below $projectroot, pass
# check_export_ok() and, with $strict_export, be part of the project list.
sub validate_project {
        my ($input) = @_;
        return undef unless $input;

        # the checks are made in this order, stopping at the first failure
        return undef unless validate_pathname($input);
        return undef unless -d "$projectroot/$input";
        return undef unless check_export_ok("$projectroot/$input");
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1414
# Return the pathname if it is acceptable, undef otherwise. A false argument
# (undef, the empty string, "0") is never accepted.
sub validate_pathname {
        my ($input) = @_;
        return undef unless $input;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # also this catches doubled slashes
        my $has_bad_element = ($input =~ m!(^|/)(|\.|\.\.)(/|$)!);
        # no null characters
        my $has_nul = ($input =~ m!\0!);

        return undef if $has_bad_element || $has_nul;
        return $input;
}
1430
# Return the ref name if it is acceptable, undef otherwise. A false argument
# (undef, the empty string, "0") is never accepted.
sub validate_refname {
        my ($input) = @_;
        return undef unless $input;

        # textual hashes are O.K.
        return $input
                if $input =~ m/^[0-9a-fA-F]{40}$/;

        # it must be correct pathname
        $input = validate_pathname($input)
                or return undef;

        # restrictions on ref name according to git-check-ref-format
        return undef
                if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

        return $input;
}
1447
# Turn a sequence of octets into Perl's internal string form (utf-8 with the
# utf8 flag set if needed). Input that is not valid utf-8 is decoded using
# $fallback_encoding instead. gitweb writes its output as utf-8 thanks to
# "binmode STDOUT, ':utf8'" at the beginning of the file.
# Returns undef for undef.
sub to_utf8 {
        my ($str) = @_;
        return undef unless defined $str;

        # already decoded, or decodable in place as utf-8
        return $str
                if utf8::is_utf8($str) || utf8::decode($str);

        return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1461
# Escape a value for use in a query string: unsafe characters are
# URI-escaped and spaces become '+'. The slash is kept, even though that is
# not correct, because quoted slashes look too horrible in bookmarks.
# Returns undef for undef.
sub esc_param {
        my ($value) = @_;
        return undef unless defined $value;

        $value =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $value =~ s/ /\+/g;

        return $value;
}
1471
# Escape a value for use in the path_info part of a URL; the quoting rules
# differ slightly from those for query parameters.
# Returns undef for undef.
sub esc_path_info {
        my ($value) = @_;
        return undef unless defined $value;

        # path_info doesn't treat '+' as space (specially), but '?' must be escaped
        $value =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

        return $value;
}
1482
# Quote unsafe characters in a complete URL.  Characters that carry
# meaning in a URL (such as '?', '&', '=' and ';') cannot be quoted here;
# spaces become '+'.  undef is passed through.
sub esc_url {
	my ($url) = @_;
	defined $url or return undef;

	$url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$url =~ tr/ /+/;
	return $url;
}
1491
# Quote unsafe characters for use inside an HTML attribute value.
# For XHTML conformance escaping '"' to '&quot;' is not enough, so the
# arguments are simply handed to esc_html().
sub esc_attr {
	my @args = @_;

	return esc_html(@args);
}
1498
# Escape a string for inclusion in HTML.
# The string is decoded with to_utf8() and HTML-escaped; every control
# character except TAB is then replaced by its quot_cec() representation.
# Options: -nbsp => true turns each space into '&nbsp;'.
# undef is passed through.
sub esc_html {
	my ($text, %opts) = @_;

	return undef unless defined $text;

	$text = $cgi->escapeHTML(to_utf8($text));
	$text =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	# tabs stay as they are, the other control characters are made visible
	$text =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
	return $text;
}
1514
# Escape a filename for inclusion in HTML.
# Works like esc_html(), except that every control character -- TAB
# included -- is replaced by its quot_cec() representation.
# Options: -nbsp => true turns each space into '&nbsp;'.
# undef is passed through.
sub esc_path {
	my ($path, %opts) = @_;

	return undef unless defined $path;

	$path = $cgi->escapeHTML(to_utf8($path));
	$path =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$path =~ s|([[:cntrl:]])|quot_cec($1)|eg;
	return $path;
}
1530
# Sanitize a string for use in XHTML served as application/xhtml+xml
# (i.e. valid XML 1.0): the string is decoded with to_utf8() and every
# control character other than TAB, LF and CR is replaced by its
# quot_cec() representation.  No HTML escaping is done here.
# undef is passed through.
sub sanitize {
	my ($text) = @_;

	defined $text or return undef;

	$text = to_utf8($text);
	$text =~ s|([[:cntrl:]])|($1 =~ /[\t\n\r]/ ? $1 : quot_cec($1))|eg;
	return $text;
}
1541
# Make a control character "printable", using character escape codes (CEC).
# Characters with a well-known escape sequence are shown as that sequence
# ('\t', '\n', ...); all others are shown as a backslash followed by the
# character code as (at least) two hex digits, zero-padded.
# Options: -nohtml => true returns the bare text, otherwise the text is
# wrapped in <span class="cntrl">...</span>.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# '%02x', not '%2x': the latter pads with a space and would show
	# e.g. chr(1) as '\ 1'
	my $chr = ( (exists $es{$cntrl})
		    ? $es{$cntrl}
		    : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1566
# Alternative to quot_cec(): make a control character "printable" using
# the Unicode Control Pictures, i.e. Unicode "printable representation" (PR).
# The result is a decimal character reference:
#  - C0 controls (0x00..0x1f) map to U+2400..U+241F,
#  - DEL (0x7f) maps to U+2421 (SYMBOL FOR DELETE),
#  - anything else has no control picture and is shown as U+FFFD
#    (REPLACEMENT CHARACTER) rather than as an unrelated glyph.
# Options: -nohtml => true returns the bare reference, otherwise it is
# wrapped in <span class="cntrl">...</span>.
sub quot_upr {
	my $cntrl = shift;
	my %opts = @_;

	my $ord = ord($cntrl);
	my $picture = $ord <= 0x1f ? 0x2400 + $ord
	            : $ord == 0x7f ? 0x2421
	            :                0xfffd;

	my $chr = sprintf('&#%04d;', $picture);
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1580
# git may return quoted and escaped filenames: a name wrapped in double
# quotes has its backslash escapes (C escape letters, one to three octal
# digits, or a quoted ordinary character) decoded and the quotes removed;
# any other name is returned unchanged.
sub unquote {
	my $name = shift;

	# decode what follows a single backslash
	sub unq {
		my $seq = shift;
		my %es = ( # character escape codes, aka escape sequences
			't' => "\t",   # tab            (HT, TAB)
			'n' => "\n",   # newline        (NL)
			'r' => "\r",   # return         (CR)
			'f' => "\f",   # form feed      (FF)
			'b' => "\b",   # backspace      (BS)
			'a' => "\a",   # alarm (bell)   (BEL)
			'e' => "\e",   # escape         (ESC)
			'v' => "\013", # vertical tab   (VT)
		);

		# octal char sequence
		return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

		# C escape sequence if known, otherwise a quoted ordinary
		# character which simply stands for itself
		return exists $es{$seq} ? $es{$seq} : $seq;
	}

	# names without surrounding quotes need no unquoting
	return $name unless $name =~ m/^"(.*)"$/;

	my $inner = $1;
	$inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $inner;
}
1616
# escape tabs: replace each tab by the number of spaces needed to reach
# the next tab stop (tab stops are 8 columns apart, counted from the
# beginning of the string)
sub untabify {
	my $line = shift;

	# expand the leftmost tab until none is left; the text in front of
	# it is tab-free by then, so its length is the tab's column
	1 while $line =~ s/^([^\t]*)\t/$1 . (' ' x (8 - length($1) % 8))/e;

	return $line;
}
1630
# Tell whether $project is among the projects returned by
# git_get_projects_list(): returns the number of list entries whose
# 'path' equals $project (0 when there is none or the list is empty).
sub project_in_list {
	my ($project) = @_;

	my @projects = git_get_projects_list();
	my $matches = grep { $_->{'path'} eq $project } @projects;
	return $matches;
}
1636
1637## ----------------------------------------------------------------------
1638## HTML aware string manipulation
1639
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Parameters:
#   $str     - string to shorten (decoded with to_utf8() first)
#   $len     - number of characters to keep
#   $add_len - extra room for finishing a word (default 10; a false
#              value also selects the default)
#   $where   - which part to drop: 'left', 'center' or 'right' (default)
# Returns the (possibly) shortened string, with the dropped part replaced
# by an ellipsis.  The string is returned unchanged whenever it cannot be
# split in the requested way.
sub chop_str {
	my $str = shift;
	my $len = shift;
	my $add_len = shift || 10;
	my $where = shift || 'right'; # 'left' | 'center' | 'right'

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# when chopping in the middle, distribute $len into left and right part
	# return early if chopping wouldn't make string shorter
	if ($where eq 'center') {
		return $str if ($len + 5 >= length($str)); # filler is length 5
		$len = int($len/2);
	} else {
		return $str if ($len + 4 >= length($str)); # filler is length 4
	}

	# regexps: ending and beginning with word part up to $add_len;
	# /s lets '.' match a newline too, so an embedded newline cannot make
	# the matches below fail
	my $endre = qr/.{$len}\w{0,$add_len}/s;
	my $begre = qr/\w{0,$add_len}.{$len}/s;

	# The captures are taken from the match in list context and checked:
	# after a failed match $1 and $2 would still hold the values of some
	# earlier successful match.
	if ($where eq 'left') {
		my ($lead, $body) = ($str =~ m/\A(.*?)($begre)\z/s)
			or return $str;
		if (length($lead) > 4) {
			$lead = " ...";
		}
		return "$lead$body";

	} elsif ($where eq 'center') {
		my ($left, $rest) = ($str =~ m/\A($endre)(.*)\z/s)
			or return $str;
		# the left part may have swallowed so much of a long word that
		# less than $len characters remain; chopping gains nothing then
		my ($mid, $right) = ($rest =~ m/\A(.*?)($begre)\z/s)
			or return $str;
		if (length($mid) > 5) {
			$mid = " ... ";
		}
		return "$left$mid$right";

	} else {
		my ($body, $tail) = ($str =~ m/\A($endre)(.*)\z/s)
			or return $str;
		if (length($tail) > 4) {
			$tail = "... ";
		}
		return "$body$tail";
	}
}
1699
# Takes the same arguments as chop_str and returns the chopped string,
# HTML-escaped.  If the string did get chopped, the result is wrapped in
# a <span> whose title attribute holds the complete string (with control
# characters replaced by '?').
sub chop_and_escape_str {
	my ($full) = @_;

	my $short = chop_str(@_);
	$full = to_utf8($full);

	# nothing was cut off, so there is nothing to put into a title
	return esc_html($short) if $short eq $full;

	$full =~ s/[[:cntrl:]]/?/g;
	return $cgi->span({-title=>$full}, esc_html($short));
}
1715
1716## ----------------------------------------------------------------------
1717## functions returning short strings
1718
# CSS class for given age value (in seconds):
# "noage" when the age is undefined, "age0" below two hours,
# "age1" below two days and "age2" for everything older
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if $age < 60*60*2;
	return "age1"  if $age < 60*60*24*2;
	return "age2";
}
1733
# convert age in seconds to "nn units ago" string; the largest unit of
# which the age holds more than two is used, and ages of up to two
# seconds are reported as " right now" (with its leading space)
sub age_string {
	my ($age) = @_;

	return int($age/60/60/24/365) . " years ago"
		if $age > 60*60*24*365*2;
	return int($age/60/60/24/(365/12)) . " months ago"
		if $age > 60*60*24*(365/12)*2;
	return int($age/60/60/24/7) . " weeks ago"
		if $age > 60*60*24*7*2;
	return int($age/60/60/24) . " days ago"
		if $age > 60*60*24*2;
	return int($age/60/60) . " hours ago"
		if $age > 60*60*2;
	return int($age/60) . " min ago"
		if $age > 60*2;
	return int($age) . " sec ago"
		if $age > 2;

	return " right now";
}
1765
# file type bits which Fcntl's ':mode' constants do not cover
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference:
# true when the file type bits of $mode are exactly S_IFGITLINK
sub S_ISGITLINK {
	my ($mode) = @_;

	my $type_bits = $mode & S_IFMT();
	return ($type_bits == S_IFGITLINK);
}
1777
# convert file mode in octal to symbolic file mode string ("ls -l" style);
# a mode of unknown type gives '----------'
sub mode_str {
	my $mode = oct(shift);

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# regular file: git cares only about the executable bit
	return ($mode & S_IXUSR()) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1799
# convert file mode in octal to file type string: one of "submodule",
# "directory", "symlink", "file" or "unknown"; an argument which is not
# an octal number is returned as it is
sub file_type {
	my ($mode) = @_;

	return $mode if $mode !~ m/^[0-7]+$/;
	my $bits = oct $mode;

	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT());
	return "symlink"   if S_ISLNK($bits);
	return "file"      if S_ISREG($bits);
	return "unknown";
}
1822
# convert file mode in octal to file type description string: like
# file_type, but a regular file with the executable bit set is described
# as "executable"; an argument which is not an octal number is returned
# as it is
sub file_type_long {
	my ($mode) = @_;

	return $mode if $mode !~ m/^[0-7]+$/;
	my $bits = oct $mode;

	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT());
	return "symlink"   if S_ISLNK($bits);
	return "unknown"   unless S_ISREG($bits);

	return ($bits & S_IXUSR()) ? "executable" : "file";
}
1849
1850
1851## ----------------------------------------------------------------------
1852## functions returning short HTML fragments, or transforming HTML fragments
1853## which don't belong to other sections
1854
# format line of commit message: the line is HTML-escaped (spaces become
# '&nbsp;') and every stand-alone run of 8 to 40 hex digits is turned
# into a link to the "object" view of that id
sub format_log_line_html {
	my ($text) = @_;

	my $html = esc_html($text, -nbsp=>1);
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{
		$cgi->a({-href => href(action=>"object", hash=>$1),
					-class => "text"}, $1);
	}eg;

	return $html;
}
1867
# format marker of refs pointing to given object
#
# $refs maps object ids to array references of ref names (such as
# "tags/v2.6.11" or "heads/next", with a trailing "^{}" for annotated
# tags); $id is the object to produce the markers for.  Returns the HTML
# for all markers wrapped in <span class="refs">, or an empty string when
# no ref points to $id.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	if (defined $refs->{$id}) {
		foreach my $ref (@{$refs->{$id}}) {
			# this code exploits the fact that non-lightweight tags are the
			# only indirect objects, and that they are the only objects for which
			# we want to use tag instead of shortlog as action
			my ($type, $name);
			# NOTE: $ref aliases the element of the caller's array, so
			# the "^{}" suffix is stripped from $refs itself
			my $indirect = ($ref =~ s/\^\{\}$//);
			# e.g. tags/v2.6.11 or heads/next
			if ($ref =~ m!^(.*?)s?/(.*)$!) {
				$type = $1;
				$name = $2;
			} else {
				$type = "ref";
				$name = $ref;
			}

			my $class = $type;
			$class .= " indirect" if $indirect;

			my $dest_action = "shortlog";

			if ($indirect) {
				$dest_action = "tag" unless $action eq "tag";
			} elsif ($action =~ /^(history|(short)?log)$/) {
				$dest_action = $action;
			}

			my $dest = "";
			$dest .= "refs/" unless $ref =~ m!^refs/!;
			$dest .= $ref;

			# the link text is not escaped by CGI, and ref names may
			# contain '<', '>' and '&', so it has to be escaped here
			my $link = $cgi->a({
				-href => href(
					action=>$dest_action,
					hash=>$dest
				)}, esc_html($name));

			$markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
				$link . "</span>";
		}
	}

	if ($markers) {
		return ' <span class="refs">'. $markers . '</span>';
	} else {
		return "";
	}
}
1927
# format, perhaps shortened and with markers, title line
#
# Returns a link to $href with class "list subject", followed by $extra
# (if given).  When $short is shorter than $long, the link shows $short
# and carries $long (control characters replaced by '?') as its title;
# otherwise the link shows $long.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr = (-href => $href, -class => "list subject");
	my $label = $long;

	if (length($short) < length($long)) {
		$long =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($long);
		$label = $short;
	}

	return $cgi->a(\%attr, esc_html($label)) . $extra;
}
1943
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines (gravatar and picon), which
# are free to use it as preferred. Since only one avatar engine is used for any
# given page, there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first; the complete url is kept in %avatar_cache.
sub picon_url {
	my $email = lc shift;

	return $avatar_cache{$email} if $avatar_cache{$email};

	my ($user, $domain) = split('@', $email);
	$avatar_cache{$email} =
		"http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
		"$domain/$user/" .
		"users+domains+unknown/up/single";

	return $avatar_cache{$email};
}
1965
# Compute the gravatar url for a given email and size, if it's not in the
# cache already.  The email is lowercased first.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
sub gravatar_url {
	my ($email, $size) = @_;
	$email = lc $email;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
				Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
1978
# Return the <img> element showing the avatar for the given $email, or
# an empty string when avatars are disabled/unavailable.
# Options:
#   -size       => key into %avatar_size (defaults to 'default')
#   -pad_before => true puts '&nbsp;' in front of the image
#   -pad_after  => true puts '&nbsp;' behind the image
sub git_get_avatar {
	my ($email, %opts) = @_;

	$opts{-size} ||= 'default';
	my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

	# Other providers can be added by extending the chain. If no variant
	# yields an url, we assume avatars are completely disabled/unavailable.
	my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
	        : $git_avatar eq 'picon'    ? picon_url($email)
	        :                             "";
	return "" unless $url;

	my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
	my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");

	return $pre_white .
	       qq{<img width="$size" class="avatar" src="} . esc_url($url) . qq{" alt="" />} .
	       $post_white;
}
2007
# Wrap $displaytext in a link which searches for commits by $author.
# $searchtype is the kind of search to run ('author' or 'committer').
# When the 'search' feature is off, $displaytext is returned as it is.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	return $displaytext unless gitweb_check_feature('search');

	# verb used in the link title; empty for other search types
	my %verb_for = (
		'author'    => "authored",
		'committer' => "committed",
	);
	my $performed = $verb_for{$searchtype} || "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype), class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
2030
# format the author name of the given commit with the given tag:
# returns <$tag class="author"> holding the author's avatar and name,
# wrapped by format_search_author.  The author name is chopped and
# escaped according to the other optional parameters (see chop_str).
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name   = $co->{'author_name'};
	my $label  = chop_and_escape_str($name, @chop_args);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);

	return "<$tag class=\"author\">" .
	       format_search_author($name, "author", $avatar . $label) .
	       "</$tag>";
}
2044
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# The pathnames of $line are replaced by the escaped names from $from and
# $to, each one linked when the respective 'href' is set.  Returns the
# line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# one pathname: escaped, prefixed, and linked if there is a target
	# (there is none for the missing side of an added or deleted file)
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = $prefix . esc_path($side->{'file'});
		return $text unless $side->{'href'};
		return $cgi->a({-href => $side->{'href'}, -class => "path"},
		               $text);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff: only the resulting file is named
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2080
# format extended diff header line, before patch itself
#
# Pathnames of "copy"/"rename" lines and object ids of "index" lines are
# turned into links (where $from / $to provide an 'href'), and a line
# ending in a file mode gets the file type appended.  Returns the line
# followed by "<br/>\n".
sub format_extended_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# shown in place of an id when there is nothing to link to
	my $no_link = '0' x 7;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
		                 esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                 esc_path($to->{'file'}));
	}

	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}

	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff: the line is rebuilt from
		# the abbreviated ids of all parents and of the result
		my $last = $diffinfo->{'nparents'} - 1;
		$line = 'index ';
		foreach my $i (0 .. $last) {
			$line .= $from->{'href'}[$i]
				? $cgi->a({-href=>$from->{'href'}[$i],
				           -class=>"hash"},
				          substr($diffinfo->{'from_id'}[$i],0,7))
				: $no_link;
			# separator
			$line .= ',' if ($i < $last);
		}
		$line .= '..';
		$line .= $to->{'href'}
			? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			          substr($diffinfo->{'to_id'},0,7))
			: $no_link;

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff: both ids are replaced in place
		my $from_link = $from->{'href'}
			? $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			          substr($diffinfo->{'from_id'},0,7))
			: $no_link;
		my $to_link = $to->{'href'}
			? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			          substr($diffinfo->{'to_id'},0,7))
			: $no_link;

		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2146
# format from-file/to-file diff header
#
# $from_line and $to_line are the "--- ..." and "+++ ..." lines of a
# patch.  Returns one <div class="diff from_file"> per from-file (a
# combined diff has one for each parent) followed by one
# <div class="diff to_file">.  "/dev/null" lines get no extra formatting.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my @divs;

	#assert($from_line =~ m/^---/) if DEBUG;
	if (! $diffinfo->{'nparents'}) {
		# ordinary (single parent) diff
		my $line = $from_line;
		if ($line =~ m!^--- "?a/!) {
			my $path = esc_path($from->{'file'});
			$path = $cgi->a({-href=>$from->{'href'}, -class=>"path"},
			                $path)
				if $from->{'href'};
			$line = '--- a/' . $path;
		}
		push @divs, qq!<div class="diff from_file">$line</div>\n!;

	} else {
		# combined diff (merge commit): one line per parent, made of
		# a link to the diff against that parent and a link to the file
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $line = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				my $diff_link =
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$i],
					                     hash_parent_base=>$parents[$i],
					                     file_parent=>$from->{'file'}[$i],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . ($i+1)},
					        $i+1);
				my $file_link =
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
					        esc_path($from->{'file'}[$i]));
				$line = '--- ' . $diff_link . '/' . $file_link;
			}
			push @divs, qq!<div class="diff from_file">$line</div>\n!;
		}
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	my $line = $to_line;
	if ($line =~ m!^\+\+\+ "?b/!) {
		my $path = esc_path($to->{'file'});
		$path = $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                $path)
			if $to->{'href'};
		$line = '+++ b/' . $path;
	}
	push @divs, qq!<div class="diff to_file">$line</div>\n!;

	return join('', @divs);
}
2212
# create note for patch simplified by combined diff: a "diff --cc" header
# naming the resulting file (linked to its blob view unless the file was
# deleted), followed by a "Simple merge" notice
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $path = esc_path($diffinfo->{'to_file'});
	unless (is_deleted($diffinfo)) {
		$path = $cgi->a({-href => href(action=>"blob",
		                               hash_base=>$hash,
		                               hash=>$diffinfo->{'to_id'},
		                               file_name=>$diffinfo->{'to_file'}),
		                 -class => "path"},
		                $path);
	}

	return "<div class=\"diff header\">" .
	       "diff --cc " .
	       $path .
	       "</div>\n" . # class="diff header"
	       "<div class=\"diff nodifferences\">" .
	       "Simple merge" .
	       "</div>\n"; # class="diff nodifferences"
}
2237
# Classify a line of a patch body: returns "chunk_header", "incomplete",
# "ctx", "add" or "rem", or an empty string when nothing fits.
# For a combined diff ($from->{'href'} is an array reference then) the
# line starts with one marker column per parent instead of a single one.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	# number of marker columns: 1 for ordinary diff
	my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
		? scalar @{$from->{'href'}}
		: 1;

	return "chunk_header" if ($line =~ qr/^\@\@{$num_sign} /);
	return "incomplete"   if ($line =~ qr/^\\/);
	# context has to be checked before add/rem, because the patterns
	# for those accept spaces in the marker columns too
	return "ctx"          if ($line =~ qr/^ {$num_sign}/);
	return "add"          if ($line =~ qr/^[+ ]{$num_sign}/);
	return "rem"          if ($line =~ qr/^[- ]{$num_sign}/);

	# fallback
	return "";
}
2266
# Format the chunk header line ("@@ -a,b +c,d @@ section") of a unified
# diff: each range is linked to its starting line in the respective file
# (when $from / $to provide an 'href') and the section heading is
# HTML-escaped.
# assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for unified diff
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# the line counts are captured by the pattern, but not needed here
	my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	$from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
	                      -class=>"list"}, $from_text)
		if $from->{'href'};
	$to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
	                      -class=>"list"}, $to_text)
		if $to->{'href'};

	return "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
	       "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2290
# Format the chunk header line of a combined diff as HTML.
# Expects $from and $to to be defined and correctly filled ($from->{'href'}
# being indexed per parent), and $line to be a combined diff chunk header:
# a run of "@", the space separated ranges, and a closing run of "@".
# The last range belongs to the result ('to') side, all earlier ones to the
# 'from' sides.  Ranges are linked to "<href>#l<start>" where an href exists.
sub format_cc_diff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

        # range texts, and the starting line number of each range
        # (the sign is dropped; 0 is the fallback when there is no number)
        my @range_text  = split(' ', $ranges);
        my @range_start = map { (split(',', substr($_, 1)), 0)[0] } @range_text;

        my $to_text  = pop @range_text;
        my $to_start = pop @range_start;

        my @pieces;
        foreach my $i (0 .. $#range_text) {
                my $piece = $range_text[$i];
                if ($from->{'href'}[$i]) {
                        $piece = $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
                                          -class=>"list"}, $range_text[$i]);
                }
                push @pieces, $piece;
        }

        my $to_piece = $to_text;
        if ($to->{'href'}) {
                $to_piece = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                     -class=>"list"}, $to_text);
        }
        push @pieces, $to_piece;

        return "<span class=\"chunk_info\">$prefix " . join(' ', @pieces) . " $prefix</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2329
# Process one line of patch (diff) body; not meant for diff headers.
# Returns a two element list: the CSS class of the line and the line
# formatted as HTML (not wrapped in any element).
sub process_diff_line {
        my ($line, $from, $to) = @_;

        # classification is done on the line as it was passed in
        my $diff_class = diff_line_class($line, $from, $to);

        chomp $line;
        $line = untabify($line);

        # chunk headers get links into the blobs, when diff info is available
        if ($from && $to) {
                return ($diff_class, format_unidiff_chunk_header($line, $from, $to))
                        if ($line =~ m/^\@{2} /);
                return ($diff_class, format_cc_diff_chunk_header($line, $from, $to))
                        if ($line =~ m/^\@{3}/);
        }

        return ($diff_class, esc_html($line, -nbsp=>1));
}
2352
# Build the snapshot link(s) for the tree/commit given by $hash.
# Returns undef when no snapshot format is enabled, a single "snapshot" link
# (format named in the tooltip) when exactly one is enabled, and otherwise
# "snapshot (...)" with one link per enabled format, e.g.
# "snapshot (_tar.gz_ _zip_)".
sub format_snapshot_links {
        my ($hash) = @_;
        my $num_fmts = @snapshot_fmts;

        # no format enabled
        return undef unless $num_fmts;

        if ($num_fmts == 1) {
                # i.e. "_snapshot_"
                my $fmt = $snapshot_fmts[0];
                return $cgi->a({
                        -href => href(
                                action=>"snapshot",
                                hash=>$hash,
                                snapshot_format=>$fmt
                        ),
                        -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                }, "snapshot");
        }

        # several formats: links bearing the format names
        my @links = map {
                $cgi->a({
                        -href => href(
                                action=>"snapshot",
                                hash=>$hash,
                                snapshot_format=>$_
                        )
                }, $known_snapshot_formats{$_}{'display'})
        } @snapshot_fmts;

        return "snapshot (" . join(' ', @links) . ")";
}
2387
2388## ......................................................................
2389## functions returning values to be passed, perhaps after some
2390## transformation, to other functions; e.g. returning arguments to href()
2391
# Returns a hash of parameters to be passed to href() to generate the URL of
# a feed; the description of the link is returned under the '-title' key.
# $format (first argument, default 'Atom') is lowercased to form the action.
# Returns nothing when there is no current project, or for the tags, heads,
# forks, tag and search actions.
sub get_feed_info {
        my $format = shift || 'Atom';

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use the 'refs/heads/' prefix (full name), which tells
        # them apart from tag links; $hash_base is tried before $hash
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                next unless (defined $ref && $ref =~ m!^refs/heads/(.*)$!);
                $branch = $1;
                last;
        }

        # log type, used as feed description (title)
        my $type;
        if (defined $file_name) {
                $type  = "history of $file_name";
                $type .= "/" if ($action eq 'tree');
                $type .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $type = "log of $branch";
        } else {
                $type = 'log';
        }

        my %res = (
                action      => lc($format),
                -title      => $type,
                'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
                'file_name' => $file_name,
        );

        return %res;
}
2427
2428## ----------------------------------------------------------------------
2429## git utility subroutines, invoking git commands
2430
# Returns, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Each call is also counted
# in $number_of_git_cmds.
sub git_cmd {
        ++$number_of_git_cmds;
        return ($GIT, "--git-dir=$git_dir");
}
2436
# Quote the given arguments so that they can be passed to the shell, and
# join them with single spaces:
#   quote_command("command", "arg 1", "arg with ' and ! characters")
#   => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $arg (@_) {
                # work on a copy, so the caller's arguments stay untouched
                (my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }
        return join(' ', @quoted);
}
2445
# Get the full hash that HEAD of the given project resolves to.
sub git_get_head_hash {
        my $project = shift;
        return git_get_full_hash($project, 'HEAD');
}
2450
# Resolve a revision to its hash; all arguments are handed unchanged to
# git_get_hash().
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2454
# Resolve a revision to its abbreviated hash: the arguments are handed to
# git_get_hash() with '--short=7' appended.
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2458
# Run 'git rev-parse --verify -q' on $hash in repository $project (a path
# relative to $projectroot), with @options placed before the revision.
# Returns the first line of output with the newline removed, or undef when
# the command could not be started or printed nothing.
# $git_dir is pointed at the project for the duration of the call and put
# back afterwards, but only if it was defined on entry.
sub git_get_hash {
        my ($project, $hash, @options) = @_;

        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        my $result;
        my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @cmd) {
                $result = <$fd>;
                chomp $result if defined $result;
                close $fd;
        }

        $git_dir = $saved_git_dir if (defined $saved_git_dir);
        return $result;
}
2475
# Get the type of the given object, as printed by 'git cat-file -t'.
# Returns nothing when the command cannot be started or exits with failure.
sub git_get_type {
        my $hash = shift;

        my @cmd = (git_cmd(), "cat-file", '-t', $hash);
        open(my $fd, "-|", @cmd)
                or return;
        my $type = <$fd>;
        return unless close $fd;

        chomp $type;
        return $type;
}
2486
# Cached repository configuration: %config holds the values parsed by
# git_get_project_config(), and $config_file names the config file they were
# read from (empty string until something has been parsed).
our ($config_file, %config);
$config_file = '';
2490
# Add $value under $key to the hash referenced by the first argument.
# A single value is stored directly (not as [ <value> ]); once a key gets a
# second value, the values are kept in an anonymous array.
sub hash_set_multi {
        my ($store, $name, $value) = @_;

        if (!exists $store->{$name}) {
                # first value for this key
                $store->{$name} = $value;
        } elsif (ref $store->{$name}) {
                # already multi-valued
                push @{$store->{$name}}, $value;
        } else {
                # second value: switch to array storage
                $store->{$name} = [ $store->{$name}, $value ];
        }
}
2504
# Return hash of git project configuration, as listed by 'git config -z -l'
# for the current $git_dir.  Keys are the full variable names; variables set
# more than once hold an array reference (see hash_set_multi).
# The optional argument is a regexp (as string) limiting the result to the
# matching section(s), e.g. 'gitweb'.
# Returns nothing if the git command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  The /o modifier is
        # deliberately not used: it would freeze the pattern of the first
        # call for the lifetime of the process (e.g. under mod_perl).
        my $section_re = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # records in '-z' output are NUL terminated
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline;
                # a variable without value has no newline at all
                my ($key, $value) = split(/\n/, $keyval, 2);

                hash_set_multi(\%config, $key, $value)
                        if (!defined $section_re || $key =~ $section_re);
        }
        close $fh;

        return %config;
}
2527
# Convert config value to boolean.
# A missing value (undef), a number greater than zero, 'true' and 'yes'
# (in any case) are true; everything else is false, never an error.
# Whitespace around the value is ignored.
sub config_to_bool {
        my $value = shift;

        # variable given without value: section.key
        return 1 unless defined $value;

        # strip leading and trailing whitespace
        $value =~ s/^\s+|\s+$//g;

        return (($value =~ /^\d+$/ && $value) ||   # section.key = 1
                ($value =~ /^(?:true|yes)$/i));    # section.key = true
}
2543
# Convert config value to simple decimal number.
# An optional suffix of 'k', 'm' or 'g' (in any case) multiplies the number
# by 1024, 1048576 or 1073741824.  A value without such a suffix is returned
# as is, with surrounding whitespace removed.
sub config_to_int {
        my $value = shift;

        # strip leading and trailing whitespace
        $value =~ s/^\s+//;
        $value =~ s/\s+$//;

        my %factor_for = (
                'k' =>       1024,
                'm' =>    1048576,
                'g' => 1073741824,
        );
        if ($value =~ /^([0-9]*)([kmg])$/i) {
                return $1 * $factor_for{lc($2)};
        }
        return $value;
}
2563
# Convert config value to array reference, if needed: a reference is passed
# through, a defined single value is wrapped in a one element array, and
# undef gives an empty array.
sub config_to_multi {
        my $value = shift;

        return $value if ref($value);
        return defined($value) ? [ $value ] : [];
}
2570
# Get the value of variable $key from the 'gitweb' section of the config of
# the current repository ($git_dir); the 'gitweb.' prefix of $key is optional.
# $type may be 'bool' or 'int' (a leading '--' is accepted); any other type
# is ignored.  For 'bool' the string 'true' or 'false' is returned, for 'int'
# the result of config_to_int(), otherwise the stored value.
# Returns nothing when $git_dir is not set, the key is empty or contains
# characters other than word characters, or the variable is not set.
# The parsed config is cached per config file in %config / $config_file.
sub git_get_project_config {
        my ($key, $type) = @_;

        # needs a repository and a key
        return unless (defined $git_dir && $key);

        # only subsection, if exists, is case sensitive,
        # and not lowercased by 'git config -z -l'
        if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
                $key = join(".", lc($1), $2, lc($3));
        } else {
                $key = lc($key);
        }
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # (re)read config when the cache belongs to a different repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $name = "gitweb.$key";
        return unless exists $config{$name};
        my $value = $config{$name};

        # ensure given type
        if (defined $type && $type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return config_to_bool($value) ? 'true' : 'false';
        }
        if (defined $type && $type eq 'int') {
                return config_to_int($value);
        }
        return $value;
}
2616
# Get hash of the entry at path $path in tree-ish $base, using 'git ls-tree'.
# If $type is given ('blob', 'tree', ...), the entry must be of that type.
# Returns undef when $path is empty, when there is no such entry, when the
# output of git-ls-tree cannot be parsed, when the type does not match, or
# when the git command exits with failure.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        # trailing slashes are not part of the entry name
        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Take the captures from the match itself: relying on $2 and $3
        # after a failed match would pick up values of some earlier match.
        my ($entry_type, $entry_hash) =
                ($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/);
        if (!defined $entry_hash) {
                # unexpected output format
                return undef;
        }
        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2643
# Get path of the entry with given hash at given tree-ish (ref), by scanning
# the recursive listing of 'git ls-tree -r -t -z'; the first entry with that
# hash wins.
# Used to get 'from' filename for combined diff (merge commit) for renames.
# Returns nothing when $base or $hash is empty, and undef when the command
# cannot be started or no entry has that hash.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # entries in '-z' output are NUL terminated
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # $hash is matched literally (\Q...\E), never as a pattern
                if ($line =~ m/(?:[0-9]+) (?:.+) \Q$hash\E\t(.+)$/) {
                        close $fd;
                        return $1;
                }
        }
        close $fd;
        return undef;
}
2667
2668## ......................................................................
2669## git utility functions, directly accessing git repository
2670
# Get the value of config variable $name for the repository at $path
# (relative to $projectroot): the first line of the file $GIT_DIR/$name if
# that file can be opened, otherwise the gitweb.$name variable from the
# repository config file.  Sets $git_dir to the repository as a side effect.
sub git_get_file_or_project_config {
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/$name") {
                # no such file: fall back to repository config
                return git_get_project_config($name);
        }
        my $conf = <$fd>;
        close $fd;

        # the file may be empty
        chomp $conf if (defined $conf);
        return $conf;
}
2687
# Get description of the project at $path: from its 'description' file,
# or else from the gitweb.description config variable.
sub git_get_project_description {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'description');
}
2692
# Get category of the project at $path: from its 'category' file,
# or else from the gitweb.category config variable.
sub git_get_project_category {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'category');
}
2697
2698
# Get content tags ('ctags') of given project, as reference to a hash
# mapping tag name to its weight.  Sets $git_dir as a side effect.
# Supported formats, tried in this order:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                # plain files only; this also drops '.' and '..'
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        # only the first line matters; undef for an empty file
                        my $val = <$ct>;
                        chomp $val if defined $val;
                        close $ct;

                        # tag name is the file name without directory
                        (my $ctag = $tagfile) =~ s#.*/##;
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2745
# Return reference to a hash, where keys are content tags ('ctags'), and
# values are the sum of weights of given tag over all projects in the list
# referenced by the argument (each project holding its tags under 'ctags').
sub git_gather_all_ctags {
        my $projects = shift;
        my %weight_of;

        for my $pr (@$projects) {
                $weight_of{$_} += $pr->{'ctags'}{$_}
                        for keys %{$pr->{'ctags'}};
        }

        return \%weight_of;
}
2760
# Prepare a tag cloud out of $ctags, a reference to hash of tag => weight.
# Tags differing only in case are merged; the spelling with the greatest
# weight is the one displayed.  The tag named by the 'by_tag' CGI parameter,
# compared case-insensitively, is marked with <span class="match">.
# Returns an HTML::TagCloud object if that module can be loaded, otherwise
# a reference to hash: lowercased tag => { count => ..., ctag => <link> }.
sub git_populate_project_tagcloud {
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach (keys %$ctags) {
                $ctags_lc{lc $_}->{count} += $ctags->{$_};
                if (not $ctags_lc{lc $_}->{topcount}
                    or $ctags_lc{lc $_}->{topcount} < $ctags->{$_}) {
                        $ctags_lc{lc $_}->{topcount} = $ctags->{$_};
                        $ctags_lc{lc $_}->{topname} = $_;
                }
        }

        my $cloud;
        # Keys of %ctags_lc are lowercased, and filtering projects by tag
        # ignores case, so the requested tag is lowercased before comparing.
        my $matched = $cgi->param('by_tag');
        $matched = lc($matched) if defined $matched;
        if (eval { require HTML::TagCloud; 1; }) {
                $cloud = HTML::TagCloud->new;
                foreach my $ctag (sort keys %ctags_lc) {
                        # Pad the title with spaces so that the cloud looks
                        # less crammed.
                        my $title = esc_html($ctags_lc{$ctag}->{topname});
                        $title =~ s/ /&nbsp;/g;
                        $title =~ s/^/&nbsp;/g;
                        $title =~ s/$/&nbsp;/g;
                        if (defined $matched && $matched eq $ctag) {
                                $title = qq(<span class="match">$title</span>);
                        }
                        $cloud->add($title, href(project=>undef, ctag=>$ctag),
                                    $ctags_lc{$ctag}->{count});
                }
        } else {
                $cloud = {};
                foreach my $ctag (keys %ctags_lc) {
                        my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
                        if (defined $matched && $matched eq $ctag) {
                                $title = qq(<span class="match">$title</span>);
                        }
                        $cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
                        $cloud->{$ctag}{ctag} =
                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                }
        }
        return $cloud;
}
2806
# Return HTML of the tag cloud prepared by git_populate_project_tagcloud(),
# limited to $count tags.
# An HTML::TagCloud object renders itself; the fallback hash is rendered as
# a comma separated list of tag links inside <div id="htmltagcloud">.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                # Most used tags first, so that the limit keeps the popular
                # tags rather than the rare ones; ties are ordered by name
                # to make the output independent of hash ordering.
                my @tags = sort {
                        $cloud->{$b}->{'count'} <=> $cloud->{$a}->{'count'}
                                or $a cmp $b
                } keys %$cloud;
                return
                        '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
                        join (', ', map {
                                $cloud->{$_}->{'ctag'}
                        } splice(@tags, 0, $count)) .
                        '</div>';
        }
}
2821
# Get the list of URLs of the project at $path (relative to $projectroot):
# the lines of its 'cloneurl' file if that can be opened, otherwise the
# values of the gitweb.url config variable.
# Returns a list in list context, and an array reference otherwise.
# Sets $git_dir as a side effect.
sub git_get_project_url_list {
        my $path = shift;

        $git_dir = "$projectroot/$path";

        if (open my $fd, '<', "$git_dir/cloneurl") {
                my @urls;
                chomp(@urls = <$fd>);
                close $fd;
                return wantarray ? @urls : \@urls;
        }

        # no cloneurl file: fall back to repository config
        my $configured = config_to_multi(git_get_project_config('url'));
        return wantarray ? @$configured : $configured;
}
2835
# Return list of projects, each a reference to hash with 'path' key (path
# relative to $projectroot), and with 'owner' key as well when read from a
# file.  Only projects accepted by check_export_ok() are listed.
# $projects_list is either a directory to be searched for repositories,
# or a file with one url-encoded "<path> <owner>" entry per line.
# $filter, if given, limits the list to projects below "$filter/".  When
# scanning a directory, the search normally starts in that subdirectory;
# with true $paranoid the whole tree is scanned and paths are filtered.
sub git_get_projects_list {
        my $filter = shift || '';
        my $paranoid = shift;
        my @list;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter && !$paranoid) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # paranoidly only filter here
                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
                                        # this is a callback, not a loop body:
                                        # leave it with return, not with next
                                        return;
                                }
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
2917
# Return the projects from the list referenced by the argument that are not
# forks of another project in that list.  Forks of 'repo.git' are the
# projects found below the 'repo/' directory.
# As a side effect, every project that might have forks gets a 'forks' field
# holding the list of its forks (possibly empty).
# Written with help of Tree::Trie module (Perl Artistic License, GPL compatible).
sub filter_forks_from_projects_list {
        my $projects = shift;

        # prefix tree of directories (path components); the '' key marks
        # the end of a project path and holds the project itself
        my %trie;

        # build the trie out of those directories that might contain forks
        foreach my $pr (@$projects) {
                # forks of 'repo.git' are in 'repo/' directory
                (my $path = $pr->{'path'}) =~ s/\.git$//;
                next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
                next unless ($path);      # skip '.git' repository: tests, git-instaweb
                next unless (-d "$projectroot/$path"); # containing directory exists
                $pr->{'forks'} = [];      # there can be 0 or more forks of project

                my @dirs = split('/', $path);
                my $node = \%trie;
                # follow the part of the path that is already in the trie ...
                $node = $node->{shift @dirs}
                        while (scalar @dirs && exists($node->{$dirs[0]}));
                # ... and create nodes for the remaining components
                $node = $node->{$_} = {}
                        foreach @dirs;
                # end marker; the first project to claim a path keeps it
                $node->{''} = $pr unless (exists $node->{''});
        }

        # filter out forks, by finding shortest prefix match for paths
        my @kept;
 PROJECT:
        foreach my $pr (@$projects) {
                my $node = \%trie;
                foreach my $dir (split('/', $pr->{'path'})) {
                        if (exists $node->{''}) {
                                # a project ends at a proper prefix of this
                                # path: this one is its fork, leave it out
                                push @{$node->{''}{'forks'}}, $pr;
                                next PROJECT;
                        }
                        unless (exists $node->{$dir}) {
                                # path leaves the trie: no prefix, not a fork
                                push @kept, $pr;
                                next PROJECT;
                        }
                        # one step down the trie
                        $node = $node->{$dir};
                }
                # all components consumed without finding a prefix
                push @kept, $pr;
        }

        return @kept;
}
2977
# Return the projects from the list referenced by the first argument that
# satisfy the given options:
#   tagfilter  => project has this content tag (compared ignoring case)
#   searchtext => regexp matching project path or long description
# With neither option set, the whole list is returned.
# Note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled.
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my ($tagfilter, $searchtext) = @opts{'tagfilter', 'searchtext'};

        # nothing to filter by
        return @$projlist
                if (!$tagfilter && !$searchtext);

        my @found;
        foreach my $pr (@$projlist) {

                if ($tagfilter) {
                        my $tags = $pr->{'ctags'};
                        next unless ref($tags) eq 'HASH';
                        my $wanted_tag = lc($tagfilter);
                        next unless
                                grep { lc($_) eq $wanted_tag } keys %$tags;
                }

                if ($searchtext) {
                        next if
                                $pr->{'path'} !~ /$searchtext/ &&
                                $pr->{'descr_long'} !~ /$searchtext/;
                }

                push @found, $pr;
        }

        return @found;
}
3009
# Map of project path => owner, as read from the $projects_list file;
# undef until git_get_project_list_from_file() has been run.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from $projects_list, if that is a plain file.
# Does nothing when the map has already been filled.  If the file cannot be
# opened, the map is left empty.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # do not try to read from a handle that failed to open
                open(my $fd, '<', $projects_list)
                        or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # blank line: there is no project to record
                        next unless defined $pr;
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
}
3032
# Get owner of given project.  The sources are tried in this order: the
# $projects_list file, the gitweb.owner config variable, and finally
# get_file_owner() on the repository directory.
# Returns undef when no project is given.  Sets $git_dir as a side effect.
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # read the projects list file on first use
        git_get_project_list_from_file()
                unless (defined $gitweb_project_owner);

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if (exists $gitweb_project_owner->{$project});
        $owner = git_get_project_config('owner')
                unless (defined $owner);
        $owner = get_file_owner("$git_dir")
                unless (defined $owner);

        return $owner;
}
3056
# Get the time of last activity in the project at $path (relative to
# $projectroot), taken from the committer line of the most recently
# committed branch head ('git for-each-ref' on refs/heads).
# Returns (age in seconds, age as string); (undef, undef) if no committer
# timestamp could be found; nothing if the git command cannot be started
# or exits with failure.  Sets $git_dir as a side effect.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the line ends with "<timestamp> <timezone>"
        return (undef, undef)
                unless (defined $most_recent &&
                        $most_recent =~ / (\d+) [-+][01]\d\d\d$/);

        my $age = time - $1;
        return ($age, age_string($age));
}
3077
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and keep
# only the entries for the remote we want.
#
# Returns a hash (or hash ref in scalar context) mapping each remote name to
# a hash holding one URL per kind reported by git (the word in parentheses
# at the end of each 'git remote -v' line) plus a 'heads' slot that is left
# undefined here. Returns an empty list if the command cannot be run or fails.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # check open() itself: the lexical handle is defined even on failure
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # strip "\t<url> (<kind>)" leaving only the remote name; lines of
                # any other shape are skipped so stale $1/$2 are never used
                $remote =~ s!\t(.*?)\s+\((\w+)\)$!! or next;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # explicit undef: "'heads' => ()" built an odd-sized hash
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3102
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
# Each remote's 'heads' slot becomes an array ref of the head entries whose
# name starts with "<remote>/"; that prefix is stripped from the entry's
# 'name' in place while selecting.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q...\E: remote names may contain regex metacharacters
                # (e.g. '.' or '+') and must be matched literally
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3115
# Return a hash ref mapping object ids to array refs of the ref names
# (without the leading "refs/") that point at them, as listed by
# 'git show-ref --dereference'. An optional $type (e.g. "heads", "tags")
# restricts the listing to refs/$type. Returns an empty list if the
# command cannot be run or fails.
sub git_get_references {
        my $type = shift || "";
        my %refs;

        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                my ($id, $ref) = ($1, $2);
                # autovivifies the list on the first ref seen for this id
                push @{ $refs{$id} }, $ref;
        }
        close $fd or return;
        return \%refs;
}
3138
# Return the tag-relative name that 'git name-rev --tags' gives for $hash
# (the part after "tags/"), or undef when no hash is given or the revision
# cannot be named by a tag. Returns an empty list if the command cannot be
# started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # name-rev may print nothing at all; don't match against undef
        return undef unless defined $name_rev;

        # \Q...\E: the revision is matched literally, not as a pattern
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
3154
3155## ----------------------------------------------------------------------
3156## parse to hash functions
3157
# Break an epoch timestamp into display fields.
#   $epoch - seconds since the Unix epoch
#   $tz    - timezone as "+hhmm"/"-hhmm" (defaults to "-0000")
# Returns a hash with UTC fields (hour, minute, mday, day, month, rfc2822,
# mday-time, iso-8601) and fields shifted by the timezone offset
# (hour_local, minute_local, tz_local, iso-tz). A timezone that is not of
# the form [+-]hhmm is treated as a zero offset; tz_local and iso-tz still
# echo the string that was passed in.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        my ($tz_sign, $tz_hour, $tz_min) =
                ($tz =~ m/^([-+])(\d\d)(\d\d)$/);
        # only compute an offset when the timezone actually parsed; otherwise
        # all three captures are undef and arithmetic on them would warn
        my $offset = 0;
        if (defined $tz_sign) {
                $offset = ($tz_sign eq '-' ? -1 : +1) *
                          ((($tz_hour*60) + $tz_min)*60);
        }
        my $local = $epoch + $offset;
        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3191
# Parse the tag object $tag_id via 'git cat-file tag'.
# Returns a hash with id, object, type, name, author, author_epoch,
# author_tz, author_name, author_email (when the tagger has a <...> part)
# and comment (array ref of the remaining lines). Returns an empty list if
# the command cannot be run, fails, or the object has no 'tag' header.
sub parse_tag {
        my ($tag_id) = @_;
        my %tag;
        my @comment;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
        $tag{'id'} = $tag_id;

        while (my $line = <$fd>) {
                chomp $line;
                # an empty line ends the header block
                last if $line eq "";

                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next;
                }
                if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{qw(author author_epoch author_tz)} = ($1, $2, $3);
                        my ($name, $email) = ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/);
                        if (defined $name) {
                                $tag{'author_name'}  = $name;
                                $tag{'author_email'} = $email;
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                        next;
                }
                if ($line =~ m/--BEGIN/) {
                        # a line containing --BEGIN is kept as the first comment line
                        push @comment, $line;
                        last;
                }
        }

        # everything that is left belongs to the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
3232
# Parse one record of 'git rev-list --header' output.
#   $commit_text - the record; its last line is discarded as the record
#                  terminator
#   $withparents - if defined, the parents are taken from the first line
#                  (as printed with --parents) and 'parent' header lines
#                  are ignored; otherwise 'parent' header lines are collected
# Returns a hash with id, tree, parents, parent, author*/committer* fields,
# title, title_short, comment (array ref of message lines with the 4-space
# indent removed) and the age* fields. Returns an empty list if the text has
# no header line starting with an object id or no 'tree' line.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # the header block ends at the first empty line: an empty string is
        # false, so it is consumed by shift and terminates the loop
        while (my $line = shift @commit_lines) {
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        foreach my $line (@commit_lines) {
                # work on a copy: the loop variable aliases the message line,
                # and the shortening below must not alter the stored comment
                (my $title = $line) =~ s/^    //;
                if ($title ne "") {
                        $co{'title'} = chop_str($title, 80, 5);
                        # remove leading stuff of merges to make the interesting part visible
                        if (length($title) > 50) {
                                $title =~ s/^Automatic //;
                                $title =~ s/^merge (of|with) /Merge ... /i;
                                if (length($title) > 50) {
                                        $title =~ s/(http|rsync):\/\///;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/(master|www|rsync)\.//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/kernel.org:?//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/\/pub\/scm//;
                                }
                        }
                        $co{'title_short'} = chop_str($title, 50, 5);
                        last;
                }
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # older than two weeks: show the date first, the relative age second
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3330
# Parse the single commit $commit_id via 'git rev-list --parents --header'.
# Returns the hash produced by parse_commit_text(), or an empty hash when
# git produced no output. Calls die_error(500, ...) if the command cannot
# be started.
sub parse_commit {
        my ($commit_id) = @_;
        my %co;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--"
                or die_error(500, "Open git-rev-list failed");
        # read one record in scalar context: inside an argument list <$fd> is
        # evaluated in list context, and an empty result would shift the
        # following argument into the $commit_text position
        my $commit_text = <$fd>;
        close $fd;

        %co = parse_commit_text($commit_text, 1)
                if defined $commit_text;

        return %co;
}
3349
# Parse a run of commits starting at $commit_id via 'git rev-list --header'.
#   $maxcount - number of commits to read (a false value means 1)
#   $skip     - number of commits to skip first (a false value means 0)
#   $filename - optional path limiter
#   @args     - extra options passed to rev-list before the counts
# Returns a list (or array ref in scalar context) of hash refs, one per
# record, as produced by parse_commit_text(). Calls die_error(500, ...) if
# the command cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount ||= 1;
        $skip ||= 0;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--header",
                   @args,
                   "--max-count=$maxcount",
                   "--skip=$skip",
                   @extra_options,
                   $commit_id,
                   "--");
        push @cmd, $filename if $filename;

        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");

        my @cos;
        while (my $record = <$fd>) {
                my %parsed = parse_commit_text($record);
                push @cos, \%parsed;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3377
# parse line of git-diff-tree "raw" output
# Returns a hash (or hash ref in scalar context). Three line shapes are
# recognised: an ordinary diff line, a combined (merge) diff line, and a
# bare commit id; any other line gives an empty hash.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if (my @plain = ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/)) {
                my $names = pop @plain;
                @res{qw(from_mode to_mode from_id to_id status similarity)} = @plain;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $names);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif (my @combined = ($line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/)) {
                my ($colons, $modes, $ids, $status, $name) = @combined;
                # the last mode and the last id belong to the result,
                # the preceding ones to the parents
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $status) ];
                $res{'to_file'}   = unquote($name);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3416
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
# A hash ref is handed back untouched; anything else is passed to
# parse_difftree_raw_line().
sub parsed_difftree_line {
        my ($line_or_ref) = @_;

        # pre-parsed (or generated by hand)
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3429
# parse line of git-ls-tree output
#   $line - one output line
#   %opts - '-l' => true if the line has a size column (ls-tree -l),
#           '-z' => true if names are not quoted (ls-tree -z)
# Returns a hash (or hash ref in scalar context) with mode, type, hash, name
# and, with -l, size. A line that does not match the expected format gives
# an empty hash instead of values left over from an earlier regex match.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        # capture into a list so that a failed match yields nothing at all
        my @fields;
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                @fields = ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s);
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                @fields = ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);
        }

        if (@fields) {
                # the name is always the last capture
                my $name = pop @fields;
                @res{qw(mode type hash)} = @fields[0 .. 2];
                $res{'size'} = $fields[3] if $opts{'-l'};
                if ($opts{'-z'}) {
                        $res{'name'} = $name;
                } else {
                        $res{'name'} = unquote($name);
                }
        }

        return wantarray ? %res : \%res;
}
3465
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#   $diffinfo - parsed difftree line (hash ref)
#   $from     - hash ref filled with 'file' and 'href' of the pre-image
#               (arrays with one entry per parent for a combined diff)
#   $to       - hash ref filled with 'file' and 'href' of the result
#   @parents  - parent commit ids, used for combined diffs
# 'href' is left undefined/removed for files that did not exist on that side.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the result name when this parent has none
                        my $file = defined $diffinfo->{'from_file'}[$i]
                                ? $diffinfo->{'from_file'}[$i]
                                : $diffinfo->{'to_file'};
                        $from->{'file'}[$i] = $file;
                        $from->{'href'}[$i] = $diffinfo->{'status'}[$i] ne "A" # not new (added) file
                                ? href(action=>"blob",
                                       hash_base=>$parents[$i],
                                       hash=>$diffinfo->{'from_id'}[$i],
                                       file_name=>$file)
                                : undef;
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) { # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3511
3512## ......................................................................
3513## parse to array of hashes functions
3514
# List refs of the given classes (default 'heads') via 'git for-each-ref',
# sorted by descending committer date.
#   $limit   - if true, at most $limit+1 entries are requested
#   @classes - ref namespaces under refs/ to list
# Returns a list (or array ref in scalar context) of hash refs with the keys
# fullname, name, id, title, epoch and age. Returns an empty list if the
# command cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @count = $limit ? ('--count='.($limit+1)) : ();
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # "<id> <refname> <subject>" NUL "<committer> <epoch> <tz>"
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $name, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $shortname = $name) =~ s!^refs/(?:head|remote)s/!!;

                my %ref_item = (
                        'fullname' => $name,
                        'name'     => $shortname,
                        'id'       => $hash,
                        'title'    => $title || '(no commit message)',
                        'epoch'    => $epoch,
                );
                $ref_item{'age'} = $epoch
                        ? age_string(time - $epoch)
                        : "unknown";

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3553
# List refs/tags via 'git for-each-ref', sorted by descending creator date.
#   $limit - if true, at most $limit+1 entries are requested
# Returns a list (or array ref in scalar context) of hash refs with the keys
# fullname, type, id, name, reftype, refid, plus subject for tag objects and
# epoch/age for tags and commits. Returns an empty list if the command
# cannot be started.
sub git_get_tags_list {
        my ($limit) = @_;
        my @count = $limit ? ('--count='.($limit+1)) : ();
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count, '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my ($creator, $epoch, $tz) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $shortname = $name) =~ s!^refs/tags/!!;

                my %ref_item = (
                        'fullname' => $name,
                        'type'     => $type,
                        'id'       => $id,
                        'name'     => $shortname,
                );
                if ($type eq "tag") {
                        # tag object: record its subject and what it points at
                        @ref_item{qw(subject reftype refid)} = ($title, $reftype, $refid);
                } else {
                        # ref points directly at the object
                        @ref_item{qw(reftype refid)} = ($type, $id);
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = $epoch
                                ? age_string(time - $epoch)
                                : "unknown";
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3602
3603## ----------------------------------------------------------------------
3604## filesystem-related functions
3605
# Return the owner of $path as a display name: the GECOS field of the
# owning user's passwd entry, cut at the first ',' or ';'.
# Returns undef if $path cannot be stat'ed or the user has no GECOS entry.
sub get_file_owner {
        my $path = shift;

        my $st_uid = (stat($path))[4];
        # stat failed: without this check getpwuid(undef) would look up uid 0
        return undef unless defined $st_uid;

        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3618
# Print the contents of $filename to the currently selected output handle,
# passing each line through to_utf8().
# The file is expected to exist; if it cannot be opened nothing is printed.
sub insert_file {
        my $filename = shift;

        # don't read from a handle that failed to open
        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3627
3628## ......................................................................
3629## mimetype related functions
3630
# Look up the MIME type for $filename in the mime.types-style file $mimemap
# (lines of "<type> <ext> <ext> ...", '#' starts a comment line).
# Returns the type registered for the file's extension (the text after the
# last '.'), or undef if the map is unreadable, the name has no extension,
# or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # named loop variable: don't clobber the caller's $_
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/, $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        # capture into a variable so that a name without a '.' cannot pick
        # up $1 from an earlier, unrelated match
        my ($ext) = ($filename =~ /\.([^.]*)$/);
        return undef unless defined $ext;
        return $mimemap{$ext};
}
3650
# Guess the MIME type of $filename from its extension.
# The configured $mimetypes_file is consulted first (a relative path is
# taken relative to the current project), then /etc/mime.types.
# Returns undef if the name contains no '.' or no map knows the extension.
sub mimetype_guess {
        my ($filename) = @_;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # if it is relative path, it is relative to project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime = mimetype_guess_file($filename, '/etc/mime.types')
                unless $mime;
        return $mime;
}
3667
# Determine the MIME type of a blob.
#   $fd       - filehandle of the blob contents (may be false)
#   $filename - blob's file name (may be false)
# The file name is tried against the MIME maps first. Without a handle the
# configured $default_blob_plain_mimetype is returned. Otherwise the content
# is tested with -T (text), then a few image extensions are recognised, and
# everything else is 'application/octet-stream'.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $mime = mimetype_guess($filename);
                return $mime if $mime;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;

        my @image_types = (
                [ qr/\.png$/i   => 'image/png'  ],
                [ qr/\.gif$/i   => 'image/gif'  ],
                [ qr/\.jpe?g$/i => 'image/jpeg' ],
        );
        foreach my $entry (@image_types) {
                my ($pattern, $mimetype) = @$entry;
                return $mimetype if $filename =~ $pattern;
        }
        return 'application/octet-stream';
}
3694
# Return the Content-Type value for a blob.
# $type, when given, is used as is; otherwise it is determined with
# blob_mimetype($fd, $file_name). For 'text/plain' the configured
# $default_text_plain_charset (if defined) is appended as charset.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless $type eq 'text/plain' && defined $default_text_plain_charset;
        return "$type; charset=$default_text_plain_charset";
}
3705
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#   $highlight - true if highlighting is enabled
#   $mimetype  - currently unused
#   $file_name - name of the file to highlight
# The base name (with a trailing '.in' removed) is looked up in
# %highlight_basename first, then its extension in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # capture into a variable so that a name without a '.' cannot pick
        # up $1 from an earlier, unrelated match
        my ($ext) = ($basename =~ /\.([^.]*)$/);
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3722
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#   $fd        - filehandle of the blob; closed and reopened when highlighting
#   $highlight - true if highlighting is enabled
#   $syntax    - syntax name passed to the highlighter's --syntax option
# The blob named by the global $hash is piped through $highlight_bin.
# Calls die_error(500, ...) if the pipeline cannot be opened.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight && defined $syntax);

        close $fd;
        my $blob_cmd = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $highlight_cmd = quote_command($highlight_bin).
                            " --replace-tabs=8 --fragment --syntax $syntax";
        open $fd, "$blob_cmd | $highlight_cmd |"
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3736
3737## ======================================================================
3738## functions printing HTML: header, footer, error page
3739
# Build the page title from the site name and, as far as they are defined,
# the current project (or project filter), action and file name.
# For the "tree" action a trailing '/' is added to the file name.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);
                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)
                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        } elsif (defined $project_filter) {
                $title .= " - " . to_utf8($project_filter);
        }

        return $title;
}
3762
# Choose the content type for HTML pages: 'application/xhtml+xml' only if
# the user agent lists it explicitly in its Accept header, else 'text/html'.
sub get_content_type_html {
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');
        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;

        return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3776
# Print the <link rel="alternate"> elements for the page header.
# With a project selected: for each of RSS and Atom, one link to the feed
# and one to its "no merges" variant, based on get_feed_info().
# Without a project: links to the plain-text project index and the OPML list.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my $title = esc_attr("$project - $href_params{'-title'} - $format feed");

                        # every link gets its own copy of the parameters, so the
                        # '--no-merges' option of one link cannot leak into the
                        # plain feed link of the next format
                        my @links = (
                                [ $title,
                                  { %href_params, 'action' => $type } ],
                                [ "$title (no merges)",
                                  { %href_params, 'action' => $type,
                                    'extra_options' => '--no-merges' } ],
                        );
                        foreach my $link (@links) {
                                my ($link_title, $params) = @$link;
                                my $link_href = href(%$params);
                                print "<link ".
                                      "rel=\"alternate\" ".
                                      "title=\"$link_title\" ".
                                      "href=\"$link_href\" ".
                                      "type=\"application/$type+xml\" ".
                                      "/>\n";
                        }
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3821
# Print the <link> elements of the page header: stylesheets, feed links
# (only when $status is '200 OK') and the favicon if one is configured.
sub print_header_links {
        my ($status) = @_;

        # print out each stylesheet that exist, providing backwards capability
        # for those people who defined $stylesheet in a config file
        my @sheets = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
                if defined $favicon;
}
3841
# Print one breadcrumb link per path component passed in @_.  Each link
# points at the project list filtered (project_filter) by the path
# accumulated so far, and is followed by " / ".
sub print_nav_breadcrumbs_path {
        my $dirprefix = undef;
        # Iterate over every argument instead of shifting until the first
        # false value: a directory literally named "0" is a valid component
        # and must not cut the breadcrumb trail short.
        foreach my $part (@_) {
                # empty components (leading or doubled '/') carry no
                # information and would only produce an empty link
                next unless defined $part && length $part;

                $dirprefix .= "/" if defined $dirprefix;
                $dirprefix .= $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => $dirprefix,
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
3853
# Print the breadcrumb trail: the home link, then either the path to the
# current project (parent directories, project name, action and optional
# extra item) or, when no project is selected, the components of
# $project_filter.
#   %opts - recognised key: -action_extra, printed verbatim as the last
#           item; when it is defined the action name becomes a link
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";

        if (!defined $project) {
                # project list views: only the filter path, if any
                print_nav_breadcrumbs_path(split '/', $project_filter)
                        if defined $project_filter;
                return;
        }

        my @parent_dirs = split '/', $project;
        my $project_leaf = pop @parent_dirs;
        print_nav_breadcrumbs_path(@parent_dirs);
        print $cgi->a({-href => href(action=>"summary")}, esc_html($project_leaf));

        if (defined $action) {
                # the action is plain text unless something follows it
                my $action_print = defined $extra
                        ? $cgi->a({-href => href(action=>$action)}, $action)
                        : $action;
                print " / $action_print";
        }
        print " / $extra" if defined $extra;
        print "\n";
}
3879
# Print the search form for the current project.
# The form submits with GET to $my_uri (with the project appended when the
# 'pathinfo' feature is on, otherwise the project travels in a hidden "p"
# field) and searches from $hash_base, else $hash, else "HEAD".
# Side effect: an undefined global $searchtext is set to "".
sub print_search_form {
        $searchtext = "" unless defined $searchtext;

        my $search_hash = "HEAD";
        if (defined $hash_base) {
                $search_hash = $hash_base;
        } elsif (defined $hash) {
                $search_hash = $hash;
        }

        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if ($use_pathinfo) {
                $action .= "/".esc_url($project);
        }

        # start_form() is the supported spelling; the old startform() alias
        # is gone from current CGI.pm releases, and the closing tag below
        # already uses end_form().
        print $cgi->start_form(-method => "get", -action => $action) .
              "<div class=\"search\">\n" .
              ($use_pathinfo
               ? ''
               : $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
              " search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
3915
# Print the HTTP header (unless suppressed) and the opening part of every
# HTML page: XML prolog, <head>, optional site header file, the page_header
# div with logo and breadcrumbs, and the search form for project pages.
#   $status  - HTTP status line; a false value means "200 OK"
#   $expires - passed to the CGI header as -expires
#   %opts    - -no_http_header suppresses the HTTP header; the whole hash
#              is also handed on to print_nav_breadcrumbs()
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        unless ($opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # relative stylesheet, favicon etc. URLs only resolve correctly
        # under path_info when an explicit base URL is given
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my $logo_img = $cgi->img({-src => esc_url($logo),
                                          -width => 72, -height => 27,
                                          -alt => "git",
                                          -class => "logo"});
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $logo_img);
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        # the search form only makes sense inside a project
        my $have_search = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $have_search);
}
3974
# Print the closing part of every HTML page: the page_footer div (project
# description and RSS/Atom links, or OPML/TXT links when no project is
# selected), the optional timing block, the optional site footer file, the
# JavaScript hooks and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                # project list: offer the list itself as OPML and plain text
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # no feed information for this view: mark the links generic
                $feed_class .= ' generic' unless %href_params;
                $href_params{'-title'} ||= 'log';

                for my $format ('RSS', 'Atom') {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                my $elapsed = tv_interval($t0, [ gettimeofday() ]);
                print join('',
                           'This page took ',
                           '<span id="generating_time" class="time_span">',
                           $elapsed,
                           ' seconds </span>',
                           ' and ',
                           '<span id="generating_cmd">',
                           $number_of_git_cmds,
                           '</span> git commands ',
                           " to generate.\n");
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;

        my $incremental_blame = (defined $action &&
                                 $action eq 'blame_incremental');
        if ($incremental_blame) {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');
                my $want_tz_setup = ($jstimezone && $tz_cookie && $datetime_class);

                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!;
                print qq!       fixLinks();\n!
                        if gitweb_check_feature('javascript-actions');
                if ($want_tz_setup) {
                        # the cookie's 'expires' value is in days
                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!.
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                print qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4053
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>[, <options>]])
# Example: die_error(404, 'Hash not found')
#
# Prints a complete error page (header, "<status> - <message>", optional
# extra HTML, footer) and then jumps to the DONE_GITWEB label, unless the
# -error_handler option is true, in which case it simply returns.
#
#   <http_status_code>  - defaults to 500 when false
#   <error_message>     - HTML-escaped here; defaults to "Internal Server Error"
#   <detailed_html_description> - printed as-is after a horizontal rule
#   <options>           - passed on to git_header_html(); -error_handler
#                         is also consulted here
#
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # A code outside the table must not reach git_header_html() as an
        # undefined status: that function replaces a false status with
        # "200 OK", which would serve the error page as a success.  Fall
        # back to a generic server error for the HTTP status line; the page
        # body still shows the code the caller asked for.
        my $http_status = exists $http_responses{$status}
                ? $http_responses{$status}
                : $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4097
4098## ----------------------------------------------------------------------
4099## functions printing or outputting HTML: navigation
4100
# Print the page_nav div: the standard views (summary, shortlog, log,
# commit, commitdiff, tree) plus any configured custom actions, joined
# with " | ", followed by $extra on its own line.
#   $current  - name of the current view; shown as plain text, not a link
#   $suppress - name of a standard view to leave out (if true)
#   $head     - hash for the commit/commitdiff links, and for shortlog/log
#               when $current is one of the commit-related views
#   $treehead, $treebase - hash / hash_base for the tree link
#   $extra    - extra HTML (pager or formats); defaults to ''
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters for each navigation item
        my %arg;
        $arg{$_} = {action=>$_} for @navs;
        if (defined $head) {
                my @wants_head = qw(commit commitdiff);
                push @wants_head, qw(shortlog log)
                        if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x);
                $arg{$_}{'hash'} = $head for @wants_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # custom actions come as (label, link, position) triples
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # place the new label right after the item named by $pos
                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
                # expand the %-placeholders in the link template
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @items = map {
                $_ eq $current ?
                $_ : $cgi->a({-href => ($arg{$_}{_href} ? $arg{$_}{_href} : href(%{$arg{$_}}))}, "$_")
        } @navs;
        print "<div class=\"page_nav\">\n" . join(" | ", @items);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4150
# Returns a submenu for the navigation of the refs views (tags, heads,
# remotes), joined with " | ".  The current view is plain text, the others
# are links; the remotes view is only offered when the 'remote_heads'
# feature is enabled.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                push @entries, ($view eq $current)
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view);
        }
        return join " | ", @entries;
}
4163
# Returns the "first . prev . next" pager as an HTML string.  Entries that
# do not apply (first/prev on page 0, next when there is no next page) are
# plain text, the others are links replaying the current parameters.
#   $action        - accepted for interface compatibility; not used here
#   $page          - current page number (0-based)
#   $has_next_link - true when a following page exists
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my ($first, $prev, $next) = ("first", "prev", "next");

        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                  -accesskey => "p", -title => "Alt-p"}, "prev");
        }
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
4189
4190## ......................................................................
4191## functions printing or outputting HTML: div
4192
# Print a <div class="header"> holding a single title link.
#   $action    - action the link points to; also the link text when
#                $title is false
#   $title     - link text (printed as given)
#   $hash      - added to the link as 'hash' when true
#   $hash_base - added to the link as 'hash_base' when true
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $label = $title ? $title : $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
4206
# Returns one "metadata_url" table row with $name in the first cell and
# $url in the second.  Both values are inserted as given.
sub format_repo_url {
        my ($name, $url) = @_;

        my @cells = ("<td>$name</td>", "<td>$url</td>");
        return '<tr class="metadata_url">' . join('', @cells) . "</tr>\n";
}
4211
# Group output by placing it in a DIV element and adding a header.
# Arguments, in order:
#   - optional hash reference: options for start_div()
#   - optional array reference: arguments for git_print_header_div()
#   - the content, handled according to its type:
#       code reference   - called with all remaining arguments
#       scalar reference - printed after HTML escaping
#       GLOB reference or IO::Handle object - read to the end and printed
#       plain defined scalar - printed as-is
sub git_print_section {
        my ($div_args, $header_args);

        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                ($div_args, $arg) = ($arg, shift);
        }
        if (ref($arg) eq 'ARRAY') {
                ($header_args, $arg) = ($arg, shift);
        }
        my $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        my $kind = ref($content);
        if ($kind eq 'CODE') {
                # whatever is left in @_ belongs to the content function
                $content->(@_);
        } elsif ($kind eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($kind eq 'GLOB' || $kind eq 'IO::Handle') {
                print <$content>;
        } elsif (!$kind && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4249
# Returns the HTML for a timestamp: the 'rfc2822' string (wrapped in a span
# carrying the class from the 'javascript-timezone' feature, when one is
# configured) followed by the local time in parentheses.  Local hours
# before 6 are wrapped in a span of class "atnight".
#   $date - hashref; the keys read here are 'rfc2822', 'hour_local',
#           'minute_local' and 'tz_local'
sub format_timestamp_html {
        my $date = shift;

        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');

        my $strtime = $date->{'rfc2822'};
        $strtime = qq!<span class="$datetime_class">$strtime</span>!
                if $datetime_class;

        my $localtime_format = ($date->{'hour_local'} < 6)
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';
        my $localtime = sprintf($localtime_format,
                                $date->{'hour_local'}, $date->{'minute_local'}, $date->{'tz_local'});

        return $strtime . ' ' . $localtime;
}
4270
# Outputs the author name and date in long form: a search link for the
# author, the timestamp in square brackets and the avatar, all wrapped in
# one element of class "author_date".
#   $co   - commit hashref; reads author_name, author_epoch, author_tz
#           and author_email
#   %opts - -tag selects the wrapping element (default 'div')
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $author_link = format_search_author($author, "author", esc_html($author));
        my $timestamp   = format_timestamp_html(\%ad);
        my $avatar      = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_link .
              " [" . $timestamp . "]" .
              $avatar .
              "</$tag>\n";
}
4285
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).  Each person gets
# two rows: role, name and e-mail search links plus a double-size avatar
# spanning both rows, then the timestamp.
# Parameters are a commit hash reference, followed by the list of people
# to output information for.  If the list is empty it defaults to both
# author and committer.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') unless @people;

        for my $who (@people) {
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link  = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar     = git_get_avatar($email, -size => 'double');
                my $timestamp  = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>" .
                      $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $timestamp .
                      "</td>" .
                      "</tr>\n";
        }
}
4313
# Print the page_path div: a link to the tree root labelled "[project]",
# then one "tree" link per leading directory of $name, then the last
# component.
#   $name - path of the object being shown (may be undefined: only the
#           root link is printed)
#   $type - 'blob' links the last component to blob_plain, 'tree' links it
#           to the tree view; anything else prints it as plain text
#   $hb   - hash_base used for every link
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth value: after a
                        # directory named "0" the prefix is still non-empty
                        # and needs its separator
                        $fullname .= (length $fullname ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # The last component links to the path this function was
                # given ($name), which is also what its title and label are
                # derived from, rather than to the global $file_name.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4351
# Print a commit message as HTML, one "<br/>"-terminated line per log line.
# Runs of empty lines are collapsed into one, and empty lines directly
# after a printed signoff line are dropped.
#   $log  - array reference of log lines; NOTE: it is modified in place
#           (the title and leading empty lines are shifted off)
#   %opts - -remove_title:     drop the first line
#           -remove_signoff:   drop signed-off-by / acked-by / cc lines
#                              instead of printing them in a "signoff" span
#           -final_empty_line: end the output with a single empty line
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        # One flag covers both rules below.  The former separate signoff
        # flag was cleared before it was ever tested, so empty lines after
        # a signoff were printed despite the stated intent.
        my $skip_blank_line = 0;
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                                $skip_blank_line = 1;
                        }
                        # removed signoff lines leave the flag untouched, so
                        # the empty lines around them still collapse into one
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if $skip_blank_line;
                        $skip_blank_line = 1;
                } else {
                        $skip_blank_line = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $skip_blank_line;
        }
}
4400
# Return the link target (what the link points to), i.e. the whole content
# of the blob $hash as printed by "git cat-file blob".  Returns nothing
# when the command cannot be started or closing the pipe fails.
sub git_get_link_target {
        my $hash = shift;

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;

        # slurp: no record separator while reading
        my $link_target = do { local $/ = undef; <$fd> };

        close $fd
                or return;

        return $link_target;
}
4418
# Given a link target and the directory (basedir) the link is in, return
# the target as a path relative to the top directory (top tree), with
# '//', '/./' and '/../' resolved.
# Returns nothing (undef in scalar context) when that is not possible:
# for absolute links, and for links leading outside the top directory.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # an empty/undefined basedir means we are in the top tree.
        # Compare by length so that a directory named "0" counts.
        my $path = (defined $basedir && length $basedir)
                ? $basedir . '/' . $link_target
                : $link_target;

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' -- but keep "0", which is a valid name
                next if ($part eq '' || $part eq '.');

                if ($part eq '..') {
                        # link leads outside repository (outside top dir)
                        return unless @path_parts;
                        pop @path_parts;
                        next;
                }
                push @path_parts, $part;
        }

        return join('/', @path_parts);
}
4458
# Print tree entry (row of git_tree), but without encompassing <tr> element.
# The row consists of: mode, optional size, the entry name ("list" cell)
# and the action links of the entry ("link" cell).
#   $t          - hashref for the entry; reads 'mode', 'type', 'hash',
#                 'name' and, when present, 'size'
#   $basedir    - prefix put verbatim in front of the name to form file_name
#   $hash_base  - when defined, passed along as hash_base and enables the
#                 "history" links
#   $have_blame - true to offer a "blame" link for blobs
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
        my $type = $t->{'type'};

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        if ($type eq "blob") {
                my $path = "$basedir$t->{'name'}";

                print "<td class=\"list\">" .
                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                               file_name=>$path, %base_key),
                                -class => "list"}, esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        # symbolic link: show where it points to
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                my $shown = defined $norm_target
                                        ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                 file_name=>$norm_target),
                                                   -title => $norm_target}, esc_path($link_target))
                                        : esc_path($link_target);
                                print " -> " . $shown;
                        }
                }
                print "</td>\n";

                # action links: blob [| blame] [| history] | raw
                my $blob_link = $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                                       file_name=>$path, %base_key)},
                                        "blob");
                my @links = ($blob_link);
                if ($have_blame) {
                        my $blame_link = $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                                file_name=>$path, %base_key)},
                                                 "blame");
                        push @links, $blame_link;
                }
                if (defined $hash_base) {
                        my $history_link = $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                                  hash=>$t->{'hash'}, file_name=>$path)},
                                                   "history");
                        push @links, $history_link;
                }
                my $raw_link = $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                                      file_name=>$path)},
                                       "raw");
                push @links, $raw_link;

                print "<td class=\"link\">";
                print join(" | ", @links);
                print "</td>\n";

        } elsif ($type eq "tree") {
                my $path = "$basedir$t->{'name'}";

                my $name_link = $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                                       file_name=>$path,
                                                       %base_key)},
                                        esc_path($t->{'name'}));
                print "<td class=\"list\">";
                print $name_link;
                print "</td>\n";

                my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                                       file_name=>$path,
                                                       %base_key)},
                                        "tree");
                print "<td class=\"link\">";
                print $tree_link;
                if (defined $hash_base) {
                        print " | " .
                              $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                     file_name=>$path)},
                                      "history");
                }
                print "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";
                print "<td class=\"link\">";
                print $cgi->a({-href => href(action=>"history",
                                             hash_base=>$hash_base,
                                             file_name=>"$basedir$t->{'name'}")},
                              "history")
                        if defined $hash_base;
                print "</td>\n";
        }
}
4551
4552## ......................................................................
4553## functions printing large fragments of HTML
4554
# Get pre-image filenames for merge (combined) diff.
# Sets $diff->{'from_file'} to an array with one slot per parent; a slot is
# filled (via git_get_path_by_hash) only where the status for that parent
# is 'R' or 'C', all others stay undefined.  Returns $diff.
#   $diff    - hashref; reads 'nparents', 'status' and 'from_id'
#   @parents - parent ids, in the same order as the status entries
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $last_parent = $diff->{'nparents'} - 1;

        $diff->{'from_file'} = [ ];
        # touch the last slot so the array covers every parent
        $diff->{'from_file'}[$last_parent] = undef;

        foreach my $i (0 .. $last_parent) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $diff->{'from_file'}[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4571
# Tell whether a raw difftree line describes a file deletion.
#
# $diffinfo - hashref of parsed raw diff format; only 'to_id' is read
#
# A deletion is marked by an all-zero post-image object id.  Both the
# 40-digit (SHA-1) and the 64-digit (SHA-256) null id are recognised, so
# the check keeps working in repositories using either object format.
# Returns a true value for a deletion, a false value otherwise.
sub is_deleted {
        my $diffinfo = shift;

        my $to_id = $diffinfo->{'to_id'};
        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4578
# Check whether a patch belongs to the same file as the [previous] raw
# difftree line, i.e. whether it is a continuation of a split patch.
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# Returns false when either argument is undefined, otherwise the result
# of comparing the two 'to_file' names.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_given = defined($diffinfo) && defined($patchinfo);
        return $both_given unless $both_given;

        return $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4589
4590
# Print the "difftree" table: one row per changed file, with links to the
# relevant blob / diff / blame / history views.
#
# $difftree - arrayref of raw difftree lines; each one is handed to
#             parsed_difftree_line()
# $hash     - id of the commit being shown; used as hash_base for links to
#             the post-image (result) of each file
# @parents  - parent commit ids; more than one parent selects the
#             "combined" table class, and the first parent is used as
#             hash_base for pre-image links of an ordinary diff
#
# Reads the global $action: in the 'commitdiff' view each row gets a link
# to its "patchN" anchor; in other views modified / renamed / copied rows
# get a "diff" (blobdiff) link instead when the content changed.
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1; # toggles between "dark" and "light" rows
        my $patchno = 0;   # running number of the "patchN" anchor
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent, then a summary cell whose
                        # contents depend on what was seen across all parents
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # an all-zero mode means "no such side" (creation or deletion),
                # in which case the corresponding variables stay undefined
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file exists only in the parent, so every link
                        # uses $parent as its base
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # the post-image (to_id / to_file) lives in the commit
                        # itself, not in its parent, so the base must be $hash,
                        # matching the filename link at the start of this row
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4898
# Print one diff chunk in side-by-side layout.
#
# @_ - list of [ $class, $html_line ] pairs making up the chunk, where
#      $class is one of 'chunk_header', 'ctx', 'rem', 'add' or 'incomplete'
#
# Consecutive context lines are emitted as one "ctx" block (shown on both
# sides); consecutive removed/added lines are emitted as one "rem", "add"
# or "chg" block, depending on which of the two kinds are present.
sub print_sidebyside_diff_chunk {
        my @chunk = @_;
        my (@ctx, @rem, @add);

        return unless @chunk;

        # an incomplete last line might be among removed or added lines,
        # or both, or among context lines: it takes the class of the
        # line that precedes it
        foreach my $idx (1 .. $#chunk) {
                next unless $chunk[$idx][0] eq 'incomplete';
                $chunk[$idx][0] = $chunk[$idx-1][0];
        }

        # the trailing empty pair is a guardian which flushes whatever is
        # still accumulated once the real lines are exhausted
        foreach my $entry (@chunk, ["", ""]) {
                my ($class, $line) = @$entry;

                # chunk headers are passed through untouched
                if ($class && $class eq 'chunk_header') {
                        print $line;
                        next;
                }

                my $at_end = !$class;

                ## flush accumulators when the kind of lines changes
                # context block ends where a rem/add block starts, or at end of chunk
                if (@ctx && ($at_end || $class eq 'rem' || $class eq 'add')) {
                        my $both_sides = join '', @ctx;
                        print '<div class="chunk_block ctx">' .
                              '<div class="old">' . $both_sides . '</div>' .
                              '<div class="new">' . $both_sides . '</div>' .
                              '</div>';
                        @ctx = ();
                }
                # rem/add block ends where a context block starts, or at end of chunk
                if ((@rem || @add) && ($at_end || $class eq 'ctx')) {
                        # pure removal, pure addition, or (assumed) change
                        my $kind = !@add ? 'rem'
                                 : !@rem ? 'add'
                                 :         'chg';
                        my $html = qq{<div class="chunk_block $kind">};
                        $html .= join('', '<div class="old">', @rem, '</div>') if @rem;
                        $html .= join('', '<div class="new">', @add, '</div>') if @add;
                        print $html . '</div>';
                        @rem = @add = ();
                }

                ## add the line to the matching accumulator
                # guardian value
                last unless $line;

                if ($class eq 'rem') {
                        push @rem, $line;
                } elsif ($class eq 'add') {
                        push @add, $line;
                } elsif ($class eq 'ctx') {
                        push @ctx, $line;
                }
        }
}
4987
# Print the whole patchset (all patches of a commitdiff) as HTML.
#
# $fd           - filehandle the patch output is read from, line by line
# $diff_style   - 'sidebyside' selects side-by-side rendering (never used
#                 for combined diffs); anything else is printed inline
# $difftree     - arrayref of raw difftree lines matching the patches
# $hash         - commit id (accepted for interface compatibility; not
#                 used in this function's body)
# @hash_parents - parent commit ids; more than one means combined diff
#
# Every raw difftree line gets a <div class="patch" id="patchN"> anchor,
# including entries that compact combined diff output skipped.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my ($patch_idx, $patch_number) = (0, 0);
        my ($patch_line, $diffinfo, $to_name);
        my (%from, %to);
        my @chunk; # for side-by-side diff

        # anchor plus simplified description for a raw difftree entry that
        # has no patch of its own; we index @$difftree from 0, but number
        # patches from 1
        my $print_simplified = sub {
                my ($info, $idx) = @_;
                print qq{<div class="patch" id="patch} . ($idx + 1) . qq{">\n} .
                      format_diff_cc_simplified($info, @hash_parents) .
                      "</div>\n";  # class="patch"
        };

        print qq{<div class="patchset">\n};

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if $patch_line =~ m/^diff /;
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print qq{<div class="patch cont">\n};
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        $print_simplified->($diffinfo, $patch_idx);

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        print qq{<div class="patch" id="patch} . ($patch_idx + 1) . qq{">\n};
                }

                # "git diff" header ($patch_line is already chomp-ed here)
                $patch_number++;
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # extended diff header: everything up to '--- ' or next 'diff '
                print qq{<div class="diff extended_header">\n};
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if $patch_line =~ m/^--- |^diff /;

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # input exhausted: 'last' skips the continue block, so the
                # patch div has to be closed here
                unless ($patch_line) {
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                # patch without from-file/to-file header
                next PATCH if $patch_line =~ m/^diff /;

                # from-file/to-file diff header: '---' line, then '+++' line
                my $from_header_line = $patch_line;
                $patch_line = <$fd>;
                chomp $patch_line;

                print format_diff_from_to_header($from_header_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if $patch_line =~ m/^diff /;

                        my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
                        my $diff_classes = $class ? "diff $class" : "diff";
                        $line = qq{<div class="$diff_classes">$line</div>\n};

                        unless ($diff_style eq 'sidebyside' && !$is_combined) {
                                # default 'inline' style and unknown styles
                                print $line;
                                next LINE;
                        }

                        # side-by-side: collect lines, flushing the previous
                        # chunk whenever a new chunk header starts
                        if ($class eq 'chunk_header') {
                                print_sidebyside_diff_chunk(@chunk);
                                @chunk = ( [ $class, $line ] );
                        } else {
                                push @chunk, [ $class, $line ];
                        }
                }

        } continue {
                # flush the last side-by-side chunk of the patch, if any
                if (@chunk) {
                        print_sidebyside_diff_chunk(@chunk);
                        @chunk = ();
                }
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        $patch_idx++ if $patch_number > 0;
        while ($patch_idx < @$difftree) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                $print_simplified->($diffinfo, $patch_idx);

                $patch_number++;
                $patch_idx++;
        }

        if ($patch_number == 0) {
                my $message = (@hash_parents > 1) ? "Trivial merge"
                                                  : "No differences found";
                print qq{<div class="diff nodifferences">$message</div>\n};
        }

        print "</div>\n"; # class="patchset"
}
5158
5159# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5160
# Fills in the details shown in the projects list (age, description,
# owner, and depending on configuration ctags and category) for every
# project referenced by $projlist.  Projects for which
# git_get_last_activity() returns nothing are left out of the returned
# list.
# NOTE: the project hashes are updated in place, but no entries are
# removed from $projlist itself
sub fill_project_list_info {
        my ($projlist) = @_;
        my @filled;

        my $want_ctags = gitweb_check_feature('ctags');
        foreach my $pr (@$projlist) {
                my @activity = git_get_last_activity($pr->{'path'});
                # nothing known about last activity: skip this project
                next unless @activity;
                @{$pr}{'age', 'age_string'} = @activity;

                # information already present in the entry is kept as is
                unless (defined $pr->{'descr'}) {
                        my $long = to_utf8(git_get_project_description($pr->{'path'}) || "");
                        $pr->{'descr_long'} = $long;
                        $pr->{'descr'} = chop_str($long, $projects_list_description_width, 5);
                }
                unless (defined $pr->{'owner'}) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }
                $pr->{'ctags'} = git_get_project_ctags($pr->{'path'})
                        if ($want_ctags);
                if ($projects_list_group_categories && !defined $pr->{'category'}) {
                        my $category = git_get_project_category($pr->{'path'}) ||
                                       $project_list_default_category;
                        $pr->{'category'} = to_utf8($category);
                }

                push @filled, $pr;
        }

        return @filled;
}
5200
# Returns the projects referenced by $projlist sorted according to $order
# ('project', 'descr', 'owner' or 'age'); for any other $order the
# projects are returned in their original order.  The array behind
# $projlist is not reordered.
sub sort_projects_list {
        my ($projlist, $order) = @_;

        # for each supported order: the hash key that is compared, and
        # whether values are compared as strings or as numbers
        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );
        my $oi = $order_info{$order};
        return @$projlist unless defined $oi;

        my $key = $oi->{'key'};
        my @sorted = ($oi->{'type'} eq 'str')
                ? (sort { $a->{$key} cmp $b->{$key} } @$projlist)
                : (sort { $a->{$key} <=> $b->{$key} } @$projlist);

        return @sorted;
}
5221
# Groups entries $from..$to of $projlist (the whole list by default) by
# their 'category' field.  Returns a hash mapping each category to an
# array reference with its projects, in their original relative order;
# in scalar context a reference to that hash is returned instead.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;
        my %by_category;

        my $last = $#$projlist;
        $from = 0 unless defined $from;
        # a missing or too large $to means "up to the end of the list"
        $to = $last unless (defined $to && $to <= $last);

        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                push @{ $by_category{ $pr->{'category'} } }, $pr;
        }

        return \%by_category unless wantarray;
        return %by_category;
}
5238
# print the 'sort by' <th> element built by format_sort_th(), which is
# a 'sort by $name' replay link unless that order is already selected;
# takes the same arguments as format_sort_th()
sub print_sort_th {
        my $sort_th = format_sort_th(@_);
        print $sort_th;
}
5244
# Returns the <th> element for the column that sorts by $name.  $order is
# the order currently in effect; $header is the text to show and
# defaults to $name with its first letter uppercased.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # the column the list is already sorted by gets a plain header
        return "<th>$header</th>\n" if ($order eq $name);

        # any other column links to the same page sorted by $name
        my $link = $cgi->a({-href => href(-replay=>1, order=>$name),
                            -class => "header"}, $header);
        return "<th>" . $link . "</th>\n";
}
5261
# Prints one table row per project for entries $from..$to of $projlist
# (the whole list by default), alternating the "dark" and "light" row
# classes.  With $check_forks set, a leading cell is printed which holds
# a "+" marker for projects that have a 'forks' entry.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist unless (defined $to && $to <= $#$projlist);

        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                # URL of the given action for the current project
                my $action_url = sub {
                        href(project=>$pr->{'path'}, action=>$_[0]);
                };

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                my $nforks = scalar @{$pr->{'forks'}};
                                my $title = "$nforks forks";
                                # the marker is a link only if there are forks to list
                                if ($nforks > 0) {
                                        print $cgi->a({-href => $action_url->("forks"),
                                                       -title => $title}, "+");
                                } else {
                                        print $cgi->span({-title => $title}, "+");
                                }
                        }
                        print "</td>\n";
                }

                # name, description and owner
                print "<td>" .
                      $cgi->a({-href => $action_url->("summary"),
                               -class => "list"}, esc_html($pr->{'path'})) .
                      "</td>\n" .
                      "<td>" .
                      $cgi->a({-href => $action_url->("summary"),
                               -class => "list", -title => $pr->{'descr_long'}},
                              esc_html($pr->{'descr'})) .
                      "</td>\n" .
                      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";

                # last change and per-project navigation links
                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                print "<td class=\"". age_class($pr->{'age'}) . "\">" .
                      $age_text . "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => $action_url->("summary")}, "summary") . " | " .
                      $cgi->a({-href => $action_url->("shortlog")}, "shortlog") . " | " .
                      $cgi->a({-href => $action_url->("log")}, "log") . " | " .
                      $cgi->a({-href => $action_url->("tree")}, "tree") .
                      ($pr->{'forks'} ? " | " . $cgi->a({-href => $action_url->("forks")}, "forks") : '') .
                      "</td>\n" .
                      "</tr>\n";
        }
}
5310
# Prints the projects list table for the projects referenced by $projlist.
#
#   $order     - sort order, defaults to $default_projects_order
#   $from, $to - window of the (filtered and sorted) projects to show,
#                defaults to the whole list
#   $extra     - if defined, printed as a final row spanning the table
#   $no_header - if true, the row with column headers is not printed
#
# Reads the globals $cgi, $searchtext, $default_projects_order and
# $projects_list_group_categories.
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $cgi->param('by_tag') : undef;
        # fork handling is turned off while searching or filtering by tag
        $check_forks = undef
                if ($tagfilter || $searchtext);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        @projects = fill_project_list_info(\@projects);
        # searching projects require filling to be run before it
        @projects = search_projects_list(\@projects,
                                         'searchtext' => $searchtext,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $searchtext);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds just that window, indexed from 0, so all
                # of it is grouped; passing $from/$to again would skip the
                # first $from projects of the window
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects in the "" category are listed without a heading row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5397
# Prints the 'log' view entries for commits $from..$to of $commitlist
# (the whole list by default): for each commit a header with age, title
# and ref markers, navigation links, authorship and the commit message.
# $refs is handed to format_ref_marker(); $extra, if true, is printed in
# a "page_nav" div after the last entry.
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from (not at 0), like the other *_body subroutines do
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                # skip empty commit entries
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5436
# Prints the "shortlog" table for commits $from..$to of $commitlist (the
# whole list by default): one row per commit with date, author, subject
# and navigation links.  $refs is handed to format_ref_marker(); $extra,
# if defined, is printed as a final row spanning the table.
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        my $last = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last unless (defined $to && $to <= $last);

        print "<table class=\"shortlog\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ",
                           $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
                           $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
                           scalar $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree"));

                # snapshot links are appended only when there are any
                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links
                        if (defined $snapshot_links);

                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5480
# Prints the "history" table for commits $from..$to of $commitlist (the
# whole list by default).  Each row links to $file_name as it was in that
# commit; for blobs a "diff to current" link against $file_hash is added
# when the two blobs differ.  $extra, if defined, is printed as a final
# row spanning the table.  Reads the global $hash_base.
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        my $last = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last if (!defined $to || $last < $to);

        print "<table class=\"history\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                # skip empty commit entries
                next unless %co;
                my $commit = $co{'id'};

                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # shortlog uses format_author_html('td', \%co, 10)
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype) . " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");

                if ($ftype eq 'blob') {
                        # blob of the file as of this commit, to compare
                        # with the blob the history was requested for
                        my $blob_parent = git_get_hash_by_path($commit, $file_name);
                        my $differs = defined $file_hash && defined $blob_parent &&
                                      $file_hash ne $blob_parent;
                        if ($differs) {
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$file_hash, hash_parent=>$blob_parent,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5540
# Prints the "tags" table for entries $from..$to of $taglist (the whole
# list by default): age, name, subject, a "tag" self link for tag
# objects, and links depending on the type of the tagged object.
# $extra, if defined, is printed as a final row spanning the table.
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;
        my $last = $#{$taglist};
        $from = 0 unless defined $from;
        $to = $last unless (defined $to && $to <= $last);

        print "<table class=\"tags\">\n";
        my $dark = 1;
        foreach my $idx ($from .. $to) {
                my %tag = %{ $taglist->[$idx] };
                my $comment = $tag{'subject'};
                my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # the age cell stays empty when the age is not known
                print defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n"
                                          : "<td></td>\n";
                print "<td>" .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                               -class => "list name"}, esc_html($tag{'name'})) .
                      "</td>\n" .
                      "<td>";
                if (defined $comment) {
                        print format_subject_html($comment, $comment_short,
                                                  href(action=>"tag", hash=>$tag{'id'}));
                }
                print "</td>\n" .
                      "<td class=\"selflink\">";
                # only tag objects have a "tag" view of their own
                if ($tag{'type'} eq "tag") {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                } else {
                        print "&nbsp;";
                }
                print "</td>\n" .
                      "<td class=\"link\">" . " | " .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});

                # further links depend on what kind of object is tagged
                my $reftype = $tag{'reftype'};
                if ($reftype eq "commit") {
                        print " | " . $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog") .
                              " | " . $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                } elsif ($reftype eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5603
# Prints the "heads" table for entries $from..$to of $headlist (the whole
# list by default): age, name and navigation links for each head.  The
# head whose id equals $head gets the "current_head" class; $head may be
# undefined, in which case no head is marked.  $extra, if defined, is
# printed as a final row spanning the table.
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

        print "<table class=\"heads\">\n";
        my $alternate = 1;
        for (my $i = $from; $i <= $to; $i++) {
                my $entry = $headlist->[$i];
                my %ref = %$entry;
                # guard against undefined $head, which would otherwise
                # trigger an "uninitialized value" warning for every row
                my $curr = defined $head && $ref{'id'} eq $head;
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td><i>$ref{'age'}</i></td>\n" .
                      ($curr ? "<td class=\"current_head\">" : "<td>") .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                               -class => "list name"},esc_html($ref{'name'})) .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
                      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5641
# Display a single remote block: a table with the URLs of the remote,
# followed by its heads.
#
#   $remote - name of the remote
#   $rdata  - hash reference with the 'heads', 'fetch' and 'push' entries
#             of the remote; 'fetch' and 'push' may be undefined
#   $limit  - if defined, the last index of the heads to show; when there
#             are more heads than $limit, a "..." link to the "remotes"
#             view of this remote is added
#   $head   - passed on to git_heads_body()
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # compare only when both URLs are known; comparing against an
                # undefined push URL would warn about an uninitialized value
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5675
# Display a list of remote names with the respective fetch and push URLs
#
#   $remotedata - hash reference mapping remote names to hash references
#                 with the (possibly undefined) 'fetch' and 'push' URLs
#   $limit      - if true, at most that many remotes (in name order) are
#                 shown, followed by a "..." link to the "remotes" view
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        # truncate the list to its first $limit entries
        $#remotes = $limit - 1 if $limited;

        # iterate over the names themselves; testing the result of shift()
        # for truth would stop at a remote named "0"
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # an unknown URL is shown as plain text instead of a link
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
5719
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
#   $remotedata - hash reference mapping remote names to their data
#   $limit      - if true and smaller than the number of remotes, only
#                 the list of remote names is shown; it is also passed on
#                 as the limit for the list or for each remote block
#   $head       - passed on to git_remote_block()
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # go through the remotes in name order, like git_remotes_list()
                # does; each() would give an unspecified order and depends on
                # the iterator state of the hash
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
5736
# Prints the page with results of a search in commit messages, authors or
# committers (selected by the global $searchtype) for $searchtext,
# starting from $hash.  Results are shown 100 per page, the page being
# selected by the global $page.  Takes the commit the search starts from
# as a flattened hash; its 'tree' and 'title' entries are used for the
# page navigation and header.
sub git_search_message {
        my %co = @_;

        # option of git-log selecting what is searched
        my $greptype;
        if ($searchtype eq 'commit') {
                $greptype = "--grep=";
        } elsif ($searchtype eq 'author') {
                $greptype = "--author=";
        } elsif ($searchtype eq 'committer') {
                $greptype = "--committer=";
        }
        $greptype .= $searchtext;

        # one commit more than fits on a page is requested, to find out
        # whether there is a next page
        my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $match_mode);

        # "first" and "prev" are links on all pages except the first one
        my $paging_nav;
        if ($page > 0) {
                my $first_link = $cgi->a({-href => href(-replay=>1, page=>undef)},
                                         "first");
                my $prev_link = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                $paging_nav = $first_link . " &sdot; " . $prev_link;
        } else {
                $paging_nav = "first &sdot; prev";
        }

        # "next" is a link only when there are more results to show
        my $next_link = '';
        my $has_next = ($#commitlist >= 100);
        if ($has_next) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        $paging_nav .= $has_next ? " &sdot; $next_link" : " &sdot; next";

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);
        if ($page == 0 && !@commitlist) {
                print "<p>No match.</p>\n";
        } else {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        }

        git_footer_html();
}
5786
# Prints the page with results of a "pickaxe" search: the commits found
# by running git-log with -S$searchtext (and --pickaxe-regex if
# $search_use_regexp is set), each with the files it touched.  Takes the
# commit shown in the page header as a flattened hash; its 'tree' and
# 'title' entries are used for the page navigation and header.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                ($search_use_regexp ? '--pickaxe-regex' : ())
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $alternate = 1;
        # from here on %co holds the commit whose row is being printed
        undef %co;

        # closes the cell with the list of files and the row of the commit
        # in %co, adding the cell with links for that commit
        my $finish_commit_row = sub {
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # a new commit starts: finish the row of the previous one
                        $finish_commit_row->() if (%co);

                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        # the last cell is left open; the files of this commit
                        # are printed into it as their lines are read
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                      -class => "list subject"},
                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
                } elsif (defined $set{'to_id'}) {
                        # an all-zero id has no blob to link to
                        next if ($set{'to_id'} =~ m/^0{40}$/);

                        print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                     hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                      -class => "list"},
                                      "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                              "<br/>\n";
                }
        }
        close $fd;

        # finish the row of the last commit
        $finish_commit_row->() if (%co);

        print "</table>\n";

        git_footer_html();
}
5869
# Run "git grep" on the tree of a commit and print the matches as an HTML
# page, one table row per file with one line per match.
#
# Parameters: a flattened commit hash (%co); the keys 'tree', 'id' and
# 'title' are used here.
# Also reads the file-level $searchtext, $search_use_regexp, $search_regexp,
# $hash and $cgi.  Output is cut off after roughly 1000 matching lines.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $lastfile = '';
        # Link to the "blob" view of the current file.  It is only recomputed
        # when the file changes, so it must outlive a single loop iteration;
        # otherwise second and later matches in a file get an undefined base.
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                last if ($matches++ > 1000);
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        # fields are NUL-separated: file, line number, text
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                        # strip the "<tree>:" prefix from the file name
                        $file =~ s/^$co{'tree'}://;
                }
                if ($file ne $lastfile) {
                        # first match in a new file: close the previous row
                        # (if any) and open a new one
                        $lastfile and print "</td></tr>\n";
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        # toggle, so that consecutive files really alternate
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # highlight the matched part of the line, if it can be found
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile) {
                print "</td></tr>\n";
                if ($matches > 1000) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
5946
# Print the "commit_search" table: one row for each commit of @$commitlist
# with an index in $from..$to, showing age, author, title, the comment lines
# matching $search_regexp (match highlighted) and commit/commitdiff/tree links.
#
# Parameters:
#   $commitlist - reference to an array of commit hash references
#   $from       - first index to show (defaults to 0)
#   $to         - last index to show (defaults to, and is capped at, the
#                 last index of the list)
#   $extra      - optional HTML printed in a final full-width row
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        my $last_idx = $#{$commitlist};
        $to = $last_idx if (!defined $to || $last_idx < $to);

        print qq{<table class="commit_search">\n};
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                my $row_class = $dark_row ? "dark" : "light";
                print qq{<tr class="$row_class">\n};
                $dark_row ^= 1;

                my $commit_href = href(action=>"commit", hash=>$co{'id'});
                print qq{<td title="$co{'age_string_age'}"><i>$co{'age_string_date'}</i></td>\n} .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => $commit_href,
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                # show every comment line containing the search text
                my $comment_lines = $co{'comment'};
                foreach my $line (@$comment_lines) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        # shorten the match first, then share what is left
                        # of an 80-column budget between both sides
                        $match = chop_str($match, 70, 5, 'center');
                        my $contextlen = int((80 - length($match))/2);
                        $contextlen = 30 if ($contextlen > 30);
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        ($lead, $match, $trail) =
                                (esc_html($lead), esc_html($match), esc_html($trail));

                        print qq{$lead<span class="match">$match</span>$trail<br />};
                }

                print "</td>\n" .
                      qq{<td class="link">} .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                print "</td>\n</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      qq{<td colspan="3">$extra</td>\n} .
                      "</tr>\n";
        }
        print "</table>\n";
}
6006
6007## ======================================================================
6008## ======================================================================
6009## actions
6010
# "project_list" action: print the page listing all projects, preceded by
# the optional $home_text include and a project search form.
#
# Reads the 'order' input parameter; dies with 400 when it is not exactly one
# of none/project/descr/owner/age, and with 404 when no projects are found.
sub git_project_list {
        my $order = $input_params{'order'};
        # anchored: the value has to BE one of the known orders, not merely
        # contain one of them as a substring
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        # start_form() rather than its deprecated alias startform(), which
        # newer CGI.pm releases no longer provide
        print $cgi->start_form(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6036
# "forks" action: print the list of projects found under the current
# project's path with a trailing ".git" removed.
#
# Reads the 'order' input parameter; dies with 400 when it is not exactly one
# of none/project/descr/owner/age, and with 404 when no forks are found.
sub git_forks {
        my $order = $input_params{'order'};
        # anchored: the value has to BE one of the known orders, not merely
        # contain one of them as a substring
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6056
# "project_index" action: print a text/plain list of projects, one
# "<path> <owner>" pair per line, both fields percent-encoded.
# Dies with 404 when no projects are found.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
        my $quote = sub {
                my ($field) = @_;
                $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                $field =~ s/ /\+/g;
                return $field;
        };

        foreach my $pr (@projects) {
                # look up the owner only when the list did not provide one
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                my $path  = $quote->($pr->{'path'});
                my $owner = $quote->($pr->{'owner'});

                print "$path $owner\n";
        }
}
6083
# "summary" action: print the project overview page.
#
# The page consists of a metadata table (description, owner, last change,
# repository URLs, optional content tags), the optional README.html, and
# abbreviated shortlog, tags, heads, remotes and forks sections.  The
# shortlog, tags, heads and forks sections get a "..." link to the full view
# when more than 16 entries are available.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # The get_*_list functions are asked for one entry more than is
        # shown, which tells us whether there is more to see.
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata;
        %remotedata = git_get_remotes_list() if $remote_heads;
        my @forklist;
        my $check_forks = gitweb_check_feature('forks');

        if ($check_forks) {
                # forks of a project live under its path without ".git"
                (my $filter = $project) =~ s/\.git$//;
                @forklist = git_get_projects_list($filter);
                # filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        print qq{<div class="title">&nbsp;</div>\n};
        print qq{<table class="projects_list">\n} .
              qq{<tr id="metadata_desc"><td>description</td><td>} . esc_html($descr) . "</td></tr>\n" .
              qq{<tr id="metadata_owner"><td>owner</td><td>} . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print qq{<tr id="metadata_lchange"><td>last change</td>} .
                      "<td>" . format_timestamp_html(\%cd) . "</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        unless (@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        # only the first printed URL row carries the "URL" label
        my $url_tag = "URL";
        foreach my $git_url (@url_list) {
                if ($git_url) {
                        print format_repo_url($url_tag, $git_url);
                        $url_tag = "";
                }
        }

        # Tag cloud
        if (gitweb_check_feature('ctags')) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        print qq{<tr id="metadata_ctags">} .
                              "<td>content tags</td>" .
                              "<td>" . git_show_project_tagcloud($cloud, 48) . "</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme) {
                print qq{<div class="title">readme</div>\n} .
                      qq{<div class="readme">\n};
                insert_file($readme);
                print "\n</div>\n"; # class="readme"
        }

        # 17 commits are requested so that we can tell whether the 16 shown
        # ones (0..15) are all there is
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  @commitlist > 16 ?
                                  $cgi->a({-href => href(action=>"shortlog")}, "...") :
                                  undef);
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              @taglist > 16 ?
                              $cgi->a({-href => href(action=>"tags")}, "...") :
                              undef);
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               @headlist > 16 ?
                               $cgi->a({-href => href(action=>"heads")}, "...") :
                               undef);
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      @forklist > 16 ?
                                      $cgi->a({-href => href(action=>"forks")}, "...") :
                                      undef,
                                      'no_header');
        }

        git_footer_html();
}
6199
# "tag" action: print the page for the tag object $hash, with a link to the
# tagged object, the authorship rows (when the tag has an author) and the
# tag message.  Dies with 404 when $hash cannot be parsed as a tag.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # the tagged object is linked twice: by its id and by its type
        my ($type, $object) = @tag{'type', 'object'};
        print qq{<div class="title_text">\n} .
              qq{<table class="object_header">\n} .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $cgi->a({-class => "list", -href => href(action=>$type, hash=>$object)},
                               $object) . "</td>\n" .
              qq{<td class="link">} . $cgi->a({-href => href(action=>$type, hash=>$object)},
                                              $type) . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n";

        # tag message, one line of the comment per output line
        print qq{<div class="page_body">};
        my $message = $tag{'comment'};
        foreach my $line (@$message) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6234
# Common implementation of the blame views.
#
# Parameter: $format (optional, defaults to 'porcelain'), one of
#   'porcelain'   - ordinary blame page built from "git blame -p"
#   'incremental' - page showing the plain file contents with empty commit
#                   and line links (the page itself states that it requires
#                   JavaScript)
#   'data'        - text/plain copy of "git blame --incremental" output,
#                   terminated by an "END" line
# A 'porcelain' request with the CGI parameter 'js' set is switched to
# 'incremental' (and $action is changed accordingly).
#
# Uses the file-level $file_name, $hash_base, $hash, $project, $action and
# $cgi; $hash_base and $hash are filled in when they are not set.
# Dies with 403 when the 'blame' feature is off, 400/404 for bad or unknown
# input, and 500 when the git command cannot be started.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact comparison instead of a substring pattern match, and
                # no pattern match against an undefined type
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # terminator line, optionally followed by timing information
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        # offer a link to the other flavour of the blame view
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                # every row gets the same class here
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        # not a header line: skip it rather than use an
                        # undefined revision as hash key and print a bogus row
                        next LINE unless defined $full_rev;
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        # read "<key> <value>" lines up to the TAB-prefixed
                        # line holding the contents
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        # the first value seen for a key wins
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a group size is only present on the first line of a
                        # group, so the colour switches once per group
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # commit cell, spanning all rows of the group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent
                        # commit when there is one, else of this commit
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6466
# "blame" action: ordinary blame view ('porcelain' is also what
# git_blame_common() falls back to when it gets no format).
sub git_blame {
        return git_blame_common('porcelain');
}
6470
# "blame_incremental" action: blame page in the 'incremental' format.
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6474
# "blame_data" action: blame output in the 'data' (text/plain) format.
sub git_blame_data {
        return git_blame_common('data');
}
6478
# "tags" action: print the page listing all tags of the project.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
        git_print_header_div('summary', $project);

        # the table is printed only when there is at least one tag
        my @tagslist = git_get_tags_list();
        git_tags_body(\@tagslist) if @tagslist;

        git_footer_html();
}
6491
# "heads" action: print the page listing all heads of the project.
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
        git_print_header_div('summary', $project);

        # the table is printed only when there is at least one head
        my @headslist = git_get_heads_list();
        git_heads_body(\@headslist, $head) if @headslist;

        git_footer_html();
}
6504
# "remotes" action; used both for single remote view and for list of all
# the remotes.  The remote to show, if any, comes from the 'hash' input
# parameter.
# Dies with 403 when the 'remote_heads' feature is off, 500 when the remote
# information cannot be read, and 404 when nothing matches.
sub git_remotes {
        unless (gitweb_check_feature('remote_heads')) {
                die_error(403, "Remote heads view is disabled");
        }

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        if (!defined $remotedata) {
                die_error(500, "Unable to get remote information");
        }

        if (!%$remotedata) {
                my $not_found = defined $remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $not_found);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        my $current_view = $remote ? '' : 'remotes';
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($current_view));

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                # list of all the remotes
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        } else {
                # single remote
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }

        git_footer_html();
}
6537
# Send the raw contents of a blob to the client ('blob_plain' view).
#
# The blob is taken from the global $hash.  When $hash is not defined it is
# looked up by $file_name in $hash_base (or in the project's HEAD commit when
# $hash_base is false); a 404 error is reported if that lookup fails and a
# 400 error if there is no $file_name either.
#
# Parameters:
#   $type - optional content type; it is handed to blob_contenttype()
#           together with the file handle and the file name, and the value
#           returned from there is the one that is actually used.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name is sent inside a quoted string of the Content-Disposition
        # header, so double quotes and backslashes must be backslash-escaped
        # (file names in a repository may contain both).
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* and textual */*+xml as text/plain, keeping whatever
        # follows the type name (e.g. the charset parameter)
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and pass it through without any output encoding
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6599
# Show a blob as an HTML page ('blob' view).
#
# The blob is taken from the global $hash or, when that is not defined,
# looked up by $file_name in $hash_base (or in the project's HEAD commit when
# $hash_base is false).  Content whose mimetype is neither text/* nor one of
# gif/png/jpeg images, and which tests as binary, is handed over to
# git_blob_plain() instead of being rendered here.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        # $file_name is optional when the blob is given by hash, so do not
        # interpolate it directly (that would warn about an undefined value)
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat " .
                        (defined $file_name ? $file_name : '') . ", $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable commit: print an empty navigation bar and use
                # the blob id as the title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                # images are embedded through the 'blob_plain' view
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                # the URL goes into an attribute value and is therefore
                # escaped, like the line-number links below
                print qq! src="! .
                      esc_attr(href(action=>"blob_plain", hash=>$hash,
                                    hash_base=>$hash_base, file_name=>$file_name)) .
                      qq!" />\n!;
        } else {
                # text: one <div> per line, each with a linkable line number
                my $nr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
6692
# Show the entries of a tree object as an HTML table ('tree' view).
#
# Works on the globals $hash, $hash_base and $file_name: $hash_base defaults
# to "HEAD", and when $hash is not defined the tree is found by $file_name
# inside $hash_base, or is $hash_base itself when there is no $file_name.
# A 404 error is reported when no tree id can be determined or when reading
# the tree fails.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # 'ls-tree -z' terminates entries with NUL, not with newline
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base does not name a commit that could be parsed;
                # forget it so that the code below does not link to it
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";

        # table rows alternate between the "dark" and "light" classes,
        # starting with "dark"
        my $alternate = 1;
        my $open_row = sub {
                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;
        };

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                $open_row->();

                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                # An empty string means that the parent is the top directory,
                # which is linked to without a file name.  Test for emptiness
                # rather than for truth, so that a parent directory named "0"
                # is not mistaken for the top directory.
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                $open_row->();

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
6802
# Builds the base name used for a snapshot, "<project>-<version>".
#
# Parameters:
#   $project - project path, e.g. "path/to/project.git"
#   $hash    - revision the snapshot is made of (object id or ref name)
#
# Returns the name; in list context the name is returned twice (the caller
# in this file uses the pair as file name and archive prefix).
sub snapshot_name {
        my ($project, $hash) = @_;

        # project part:
        #   path/to/project.git  -> project
        #   path/to/project/.git -> project
        my $project_part = to_utf8($project);
        $project_part =~ s,([^/])/*\.git$,$1,;
        $project_part = basename($project_part);
        # replace control characters
        $project_part =~ s/[[:cntrl:]]/?/g;

        # version part
        my $version = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # (possibly abbreviated) SHA-1: use the short form when
                # more than 7 digits of an existing object id were given
                my $full_hash = git_get_full_hash($project, $hash);
                $version = git_get_short_hash($project, $hash)
                        if ($full_hash =~ /^$hash/ && length($hash) > 7);
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tag name alone, without shortened SHA-1
                $version = $1;
        } else {
                # branches and everything else get the shortened SHA-1 appended
                $version = $1
                        if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!);
                $version .= '-' . git_get_short_hash($project, $hash);
        }
        # hierarchical names must not introduce directory separators
        $version =~ s!/!.!g;

        my $snapshot = "$project_part-$version";

        return ($snapshot, $snapshot) if wantarray;
        return $snapshot;
}
6839
# Send a snapshot (archive) of the tree-ish in the global $hash
# ('snapshot' view).
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  Errors are reported with
# 403 when snapshots or the requested format are not allowed, 400 for an
# invalid or unknown format or a blob object, and 404 when the object does
# not exist.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the command before any output is produced: if it cannot be
        # started, the error page must not follow an already sent
        # "200 OK" header.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # the name is sent inside a quoted string, so escape '"' and '\'
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        # Copy the archive in fixed-size chunks; it is binary data, so
        # reading it "line by line" would only build a huge list in memory.
        binmode STDOUT, ':raw';
        my $buffer;
        while (read($fd, $buffer, 65536)) {
                print $buffer;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6887
# Common implementation of the log-like views.
#
# Parameters:
#   $fmt_name  - name of the view, used for the page navigation and paging
#   $body_subr - code reference that prints the body; it is called with
#                (\@commitlist, 0, 99, $refs, $next_link,
#                 $file_name, $file_hash, $ftype)
#   $base      - revision to start from (defaults to the project's HEAD hash)
#   $parent    - optional; when defined the range "$parent..$base" is shown
#   $file_name - optional path limiting the history
#   $file_hash - optional id of the object at $file_name
#
# One page holds 100 commits; 101 are requested so that the presence of
# a following page can be detected.  The global $page is set to 0 when it
# is not defined.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0     unless defined $page;
        my $refs = git_get_references();

        my $revision   = defined $parent ? "$parent..$base" : $base;
        my @path_limit = defined $file_name ? ($file_name, "--full-history") : ();
        my @commitlist =
                parse_commits($revision, 101, (100 * $page), @path_limit);

        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }

        my $ftype;
        $ftype = git_get_type($file_hash)
                if defined $file_hash;
        die_error(500, "Unknown type of object")
                if (defined $file_name && !defined $ftype);

        # the base commit is needed only for the header of a path history
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }

        # more than 100 commits returned: there is a next page
        my $has_next_page = $#commitlist >= 100;
        my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
        my $next_link = '';
        if ($has_next_page) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        my $patch_max = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name &&
            ($patch_max < 0 || @commitlist <= $patch_max)) {
                $paging_nav .= " &sdot; " .
                        $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                "patches");
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (!defined $file_name) {
                git_print_header_div('summary', $project);
        } else {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
                git_print_page_path($file_name, $ftype, $hash_base);
        }

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6961
# 'log' view: git_log_generic() with git_log_body() as the body printer,
# for the revision in $hash (optionally limited by $hash_parent).
sub git_log {
        my @log_args = ('log', \&git_log_body, $hash, $hash_parent);
        return git_log_generic(@log_args);
}
6966
# 'commit' view: prints the header table of a commit (author rows, commit,
# tree and parent ids with their links), the commit message and the list of
# changed files.  The commit is taken from the global $hash, falling back to
# $hash_base and then to "HEAD".
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $first_parent = $co{'parent'};
        my $parent_ids   = $co{'parents'}; # array reference

        # link to the 'commit' view of a commit, labelled with its short id
        my $short_commit_link = sub {
                my ($id) = @_;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $first_parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parent_ids == 1) {
                # single parent commit
                $formats_nav = '(parent: ' . $short_commit_link->($first_parent) . ')';
        } else {
                # merge commit
                my @parent_links = map { $short_commit_link->($_) } @$parent_ids;
                $formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parent_ids <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # what to diff against: the only parent, "--root" for an initial
        # commit, or '-c' (combined diff) for a merge
        my $diff_against = '-c';
        if (@$parent_ids <= 1) {
                $diff_against = defined $first_parent ? $first_parent : "--root";
        }
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts, $diff_against, $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title = esc_html($co{'title'}) . $ref;
        if (!defined $co{'parent'}) {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        } else {
                git_print_header_div('commitdiff', $title, $hash);
        }

        # header table
        print qq{<div class="title_text">\n} .
              qq{<table class="object_header">\n};
        git_print_authorship_rows(\%co);
        print qq{<tr><td>commit</td><td class="sha1">$co{'id'}</td></tr>\n};

        # tree row
        print qq{<tr><td>tree</td><td class="sha1">} .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                       class => "list"}, $co{'tree'}) .
              qq{</td><td class="link">} .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td></tr>\n";

        # one row per parent
        foreach my $par (@$parent_ids) {
                my $id_cell =
                        $cgi->a({-href => href(action=>"commit", hash=>$par),
                                 class => "list"}, $par);
                my $link_cell =
                        $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit") .
                        " | " .
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
                print qq{<tr><td>parent</td><td class="sha1">} . $id_cell .
                      qq{</td><td class="link">} . $link_cell .
                      "</td></tr>\n";
        }
        print "</table></div>\n";

        # commit message
        print qq{<div class="page_body">\n};
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parent_ids);

        git_footer_html();
}
7080
# 'object' view: find out the type of an object and redirect (302) to the
# view named after that type.
#
# The object is defined by:
# - hash or hash_base alone
# - hash_base and file_name
# Anything else is reported as a 400 error; objects that cannot be found
# are reported as 404.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the command prints no type (e.g. for
                # a missing object); do not chomp an undefined value then,
                # the failed close below reports the error
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7127
# Show the difference between two versions of a blob ('blobdiff' view).
#
# Parameters:
#   $format - 'html' (default) or 'plain'; anything else is reported as
#             a 400 error
#
# The diff is defined by the globals $hash_parent_base and $hash_base plus
# either $file_name (optionally with $file_parent) or the 40-digit id of
# the resulting blob in $hash.  Requests that do not define both base
# commits are reported as a 404 error.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request did not specify from the
                # single raw diff line that was found
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        # The status is given as a bare number, like in every other
        # die_error() call.
        if (!%diffinfo) {
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # the name is sent inside a quoted string of the header, so
                # double quotes and backslashes must be backslash-escaped
                my $patch_name = "$file_name" . '.patch';
                $patch_name =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # Up to and including the '+++' line, replace object ids
                # used as names in "a/..." and "b/..." by the file names.
                # The ids may come from request parameters, so they are
                # quoted and matched literally.
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7262
# 'blobdiff_plain' view: git_blobdiff() with the 'plain' output format.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
7266
# Navigation fragment for switching between diff styles.
#
# It is meant to be appended to already existing navigation, which is why
# every item is preceded by " | " ("| foo | bar" rather than "foo | bar").
# The style that is currently selected (default: 'inline') is printed as
# plain text, the other one as a link that replays the current request with
# a different 'diff_style'.  For combined diffs the empty string is returned.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # styles in display order, and their labels
        my @style_order = ('inline', 'sidebyside');
        my %label_for = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my $nav = '';
        foreach my $style (@style_order) {
                $nav .= " | ";
                if ($style eq $diff_style) {
                        $nav .= $label_for{$style};
                } else {
                        $nav .= $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                        $label_for{$style});
                }
        }
        return $nav;
}
7287
# Action handler for the "commitdiff" family of views: shows the changes
# made by one commit, or the changes between $hash_parent and $hash.
#
# Named parameters (flat key => value list):
#   -format  'html' (default), 'plain' or 'patch'; any other value is
#            answered with a 400 error
#   -single  only consulted for the 'patch' format when no hash_parent is
#            set: if true, exactly one patch is requested
#
# Works on the request globals $hash, $hash_base, $hash_parent and $project.
# $hash is defaulted here, and $hash_parent is set to '--cc' for a merge
# commit when the request did not name a parent.
# Prints the HTTP header and the whole response body.
sub git_commitdiff {
	my %params = @_;
	my $format = $params{-format} || 'html';
	my $diff_style = $input_params{'diff_style'} || 'inline';

	my ($patch_max) = gitweb_get_feature('patches');
	if ($format eq 'patch') {
		die_error(403, "Patch view not allowed") unless $patch_max;
	}

	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
	    or die_error(404, "Unknown commit object");

	# choose format for commitdiff for merge
	if (! defined $hash_parent && @{$co{'parents'}} > 1) {
		$hash_parent = '--cc';
	}
	# we need to prepare $formats_nav before almost any parameter munging
	my $formats_nav;
	if ($format eq 'html') {
		$formats_nav =
			$cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
			        "raw");
		# the "patch" link is offered only for non-merge commits
		if ($patch_max && @{$co{'parents'}} <= 1) {
			$formats_nav .= " | " .
				$cgi->a({-href => href(action=>"patch", -replay=>1)},
				        "patch");
		}
		$formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

		if (defined $hash_parent &&
		    $hash_parent ne '-c' && $hash_parent ne '--cc') {
			# commitdiff with two commits given
			my $hash_parent_short = $hash_parent;
			if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
				$hash_parent_short = substr($hash_parent, 0, 7);
			}
			$formats_nav .=
				' (from';
			# say which parent it is, if it is a parent of this commit at all
			for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
				if ($co{'parents'}[$i] eq $hash_parent) {
					$formats_nav .= ' parent ' . ($i+1);
					last;
				}
			}
			$formats_nav .= ': ' .
				$cgi->a({-href => href(-replay=>1,
				                       hash=>$hash_parent, hash_base=>undef)},
				        esc_html($hash_parent_short)) .
				')';
		} elsif (!$co{'parent'}) {
			# --root commitdiff
			$formats_nav .= ' (initial)';
		} elsif (scalar @{$co{'parents'}} == 1) {
			# single parent commit
			$formats_nav .=
				' (parent: ' .
				$cgi->a({-href => href(-replay=>1,
				                       hash=>$co{'parent'}, hash_base=>undef)},
				        esc_html(substr($co{'parent'}, 0, 7))) .
				')';
		} else {
			# merge commit: offer a link to the other combined-diff flavour
			if ($hash_parent eq '--cc') {
				$formats_nav .= ' | ' .
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$hash, hash_parent=>'-c')},
					        'combined');
			} else { # $hash_parent eq '-c'
				$formats_nav .= ' | ' .
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$hash, hash_parent=>'--cc')},
					        'compact');
			}
			$formats_nav .=
				' (merge: ' .
				join(' ', map {
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$_, hash_base=>undef)},
					        esc_html(substr($_, 0, 7)));
				} @{$co{'parents'}} ) .
				')';
		}
	}

	my $hash_parent_param = $hash_parent;
	if (!defined $hash_parent_param) {
		# --cc for multiple parents, --root for parentless
		$hash_parent_param =
			@{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
	}

	# read commitdiff
	my $fd;
	my @difftree;
	if ($format eq 'html') {
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			"--no-commit-id", "--patch-with-raw", "--full-index",
			$hash_parent_param, $hash, "--"
			or die_error(500, "Open git-diff-tree failed");

		# consume only the raw part here; the patch part stays in $fd
		# and is rendered further down
		while (my $line = <$fd>) {
			chomp $line;
			# empty line ends raw part of diff-tree output
			last unless $line;
			push @difftree, scalar parse_difftree_raw_line($line);
		}

	} elsif ($format eq 'plain') {
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			'-p', $hash_parent_param, $hash, "--"
			or die_error(500, "Open git-diff-tree failed");
	} elsif ($format eq 'patch') {
		# For commit ranges, we limit the output to the number of
		# patches specified in the 'patches' feature.
		# For single commits, we limit the output to a single patch,
		# diverging from the git-format-patch default.
		#
		# NOTE(review): for a merge commit requested without hash_parent,
		# $hash_parent was set to '--cc' above, so the range built here is
		# "--cc..$hash" -- confirm whether 'patch' of a merge is meant to
		# be supported.
		my @commit_spec = ();
		if ($hash_parent) {
			if ($patch_max > 0) {
				push @commit_spec, "-$patch_max";
			}
			push @commit_spec, '-n', "$hash_parent..$hash";
		} else {
			if ($params{-single}) {
				push @commit_spec, '-1';
			} else {
				if ($patch_max > 0) {
					push @commit_spec, "-$patch_max";
				}
				push @commit_spec, "-n";
			}
			push @commit_spec, '--root', $hash;
		}
		open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
			'--encoding=utf8', '--stdout', @commit_spec
			or die_error(500, "Open git-format-patch failed");
	} else {
		die_error(400, "Unknown commitdiff format");
	}

	# non-textual hash id's can be cached
	my $expires;
	if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		$expires = "+1d";
	}

	# write commit message
	if ($format eq 'html') {
		my $refs = git_get_references();
		my $ref = format_ref_marker($refs, $co{'id'});

		git_header_html(undef, $expires);
		git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
		git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
		print "<div class=\"title_text\">\n" .
		      "<table class=\"object_header\">\n";
		git_print_authorship_rows(\%co);
		print "</table>".
		      "</div>\n";
		print "<div class=\"page_body\">\n";
		# more than one comment line: there is more to show than the title
		if (@{$co{'comment'}} > 1) {
			print "<div class=\"log\">\n";
			git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
			print "</div>\n"; # class="log"
		}

	} elsif ($format eq 'plain') {
		my $tagname = git_get_rev_name_tags($hash);
		my $filename = basename($project) . "-$hash.patch";

		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => qq(inline; filename="$filename"));
		# mail-like preamble in front of the diff
		my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
		print "From: " . to_utf8($co{'author'}) . "\n";
		print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
		print "Subject: " . to_utf8($co{'title'}) . "\n";

		print "X-Git-Tag: $tagname\n" if $tagname;
		print "X-Git-Url: " . $cgi->self_url() . "\n\n";

		foreach my $line (@{$co{'comment'}}) {
			print to_utf8($line) . "\n";
		}
		print "---\n\n";
	} elsif ($format eq 'patch') {
		my $filename = basename($project) . "-$hash.patch";

		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => qq(inline; filename="$filename"));
	}

	# write patch
	if ($format eq 'html') {
		# without an explicit parent (or with a combined diff) compare
		# against all parents of the commit
		my $use_parents = !defined $hash_parent ||
			$hash_parent eq '-c' || $hash_parent eq '--cc';
		git_difftree_body(\@difftree, $hash,
		                  $use_parents ? @{$co{'parents'}} : $hash_parent);
		print "<br/>\n";

		git_patchset_body($fd, $diff_style,
		                  \@difftree, $hash,
		                  $use_parents ? @{$co{'parents'}} : $hash_parent);
		close $fd;
		print "</div>\n"; # class="page_body"
		git_footer_html();

	} elsif ($format eq 'plain') {
		# slurp the rest of the command output in one go
		local $/ = undef;
		print <$fd>;
		close $fd
			or print "Reading git-diff-tree failed\n";
	} elsif ($format eq 'patch') {
		local $/ = undef;
		print <$fd>;
		close $fd
			or print "Reading git-format-patch failed\n";
	}
}
7515
# Action handler: the commitdiff view in its plain-text form.
# Delegates to git_commitdiff with -format set to 'plain'.
sub git_commitdiff_plain {
	return git_commitdiff(-format => 'plain');
}
7519
7520# format-patch-style patches
# Action handler: commitdiff in 'patch' format, with -single set so that
# only one patch is requested.
sub git_patch {
	my %options = (
		-format => 'patch',
		-single => 1,
	);
	return git_commitdiff(%options);
}
7524
# Action handler: commitdiff in 'patch' format without the -single
# restriction.
sub git_patches {
	return git_commitdiff(-format => 'patch');
}
7528
# Action handler: the 'history' log view. Hands the request globals and
# git_history_body as the body renderer to git_log_generic.
sub git_history {
	return git_log_generic(
		'history', \&git_history_body,
		$hash_base, $hash_parent_base,
		$file_name, $hash,
	);
}
7534
# Action handler: entry point for all kinds of search.
#
# Validates the request (enabled features, search text, commit to start
# from), fills in defaults for the $searchtype, $hash and $page globals and
# then hands over to the routine implementing the requested search type.
sub git_search {
	$searchtype ||= 'commit';

	# check if appropriate features are enabled
	die_error(403, "Search is disabled")
		unless gitweb_check_feature('search');
	# pickaxe may take all resources of your box and run for several minutes
	# with every query - so decide by yourself how public you make this feature
	die_error(403, "Pickaxe search is disabled")
		if $searchtype eq 'pickaxe' && !gitweb_check_feature('pickaxe');
	# grep search might be potentially CPU-intensive, too
	die_error(403, "Grep search is disabled")
		if $searchtype eq 'grep' && !gitweb_check_feature('grep');

	die_error(400, "Text field is empty")
		unless defined $searchtext;

	# search from the project's head unless a starting point was given
	$hash = git_get_head_hash($project)
		unless defined $hash;
	my %co = parse_commit($hash);
	die_error(404, "Unknown commit object")
		unless %co;

	$page = 0
		unless defined $page;

	# search type => routine doing the actual work
	my %search_sub_for = (
		'commit'    => \&git_search_message,
		'author'    => \&git_search_message,
		'committer' => \&git_search_message,
		'pickaxe'   => \&git_search_changes,
		'grep'      => \&git_search_files,
	);
	my $search_sub = $search_sub_for{$searchtype};
	if (defined $search_sub) {
		$search_sub->(%co);
	} else {
		die_error(400, "Unknown search type");
	}
}
7579
# Action handler: static help page describing the available search types.
# The 'grep' and 'pickaxe' entries are shown only when the corresponding
# feature is enabled.
sub git_search_help {
	git_header_html();
	git_print_page_nav('','', $hash,$hash,$hash);

	# general introduction and the always available 'commit' search
	print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

	if (gitweb_check_feature('grep')) {
		print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
	}

	print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

	if (gitweb_check_feature('pickaxe')) {
		print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
	}

	print "</dl>\n";
	git_footer_html();
}
7623
# Action handler: the 'shortlog' log view. Hands $hash, $hash_parent and
# git_shortlog_body as the body renderer to git_log_generic.
sub git_shortlog {
	return git_log_generic(
		'shortlog', \&git_shortlog_body,
		$hash, $hash_parent,
	);
}
7628
7629## ......................................................................
7630## feeds (RSS, Atom; OPML)
7631
# Generate a web feed of recent commits for the current project.
#
# Parameters:
#   $format - 'rss' or 'atom' (default: 'atom'); anything else is answered
#             with a 400 error
#
# Uses the request globals $hash (start of the log, 'HEAD' when unset) and
# $file_name (to limit the feed to the history of a path).
# Prints the HTTP header followed by the feed document. Answers with
# "304 Not Modified" when the request carries an If-Modified-Since date that
# can be parsed and the newest commit is not newer than it; prints only the
# header for HEAD requests.
sub git_feed {
	my $format = shift || 'atom';
	my $have_blame = gitweb_check_feature('blame');

	# Atom: http://www.atomenabled.org/developers/syndication/
	# RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
	if ($format ne 'rss' && $format ne 'atom') {
		die_error(400, "Unknown web feed format");
	}

	# log/feed of current (HEAD) branch, log of given branch, history of file/directory
	my $head = $hash || 'HEAD';
	my @commitlist = parse_commits($head, 150, 0, $file_name);

	my %latest_commit;
	my %latest_date;
	my $content_type = "application/$format+xml";
	if (defined $cgi->http('HTTP_ACCEPT') &&
		 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
		# browser (feed reader) prefers text/xml
		$content_type = 'text/xml';
	}
	if (defined($commitlist[0])) {
		%latest_commit = %{$commitlist[0]};
		my $latest_epoch = $latest_commit{'committer_epoch'};
		%latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
		my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
		if (defined $if_modified) {
			# date parsing needs an optional module; without one the
			# conditional request is simply answered in full
			my $since;
			if (eval { require HTTP::Date; 1; }) {
				$since = HTTP::Date::str2time($if_modified);
			} elsif (eval { require Time::ParseDate; 1; }) {
				$since = Time::ParseDate::parsedate($if_modified, GMT => 1);
			}
			if (defined $since && $latest_epoch <= $since) {
				print $cgi->header(
					-type => $content_type,
					-charset => 'utf-8',
					-last_modified => $latest_date{'rfc2822'},
					-status => '304 Not Modified');
				return;
			}
		}
		print $cgi->header(
			-type => $content_type,
			-charset => 'utf-8',
			-last_modified => $latest_date{'rfc2822'});
	} else {
		print $cgi->header(
			-type => $content_type,
			-charset => 'utf-8');
	}

	# Optimization: skip generating the body if client asks only
	# for Last-Modified date.
	return if ($cgi->request_method() eq 'HEAD');

	# header variables
	my $title = "$site_name - $project/$action";
	my $feed_type = 'log';
	if (defined $hash) {
		$title .= " - '$hash'";
		$feed_type = 'branch log';
		if (defined $file_name) {
			$title .= " :: $file_name";
			$feed_type = 'history';
		}
	} elsif (defined $file_name) {
		$title .= " - $file_name";
		$feed_type = 'history';
	}
	$title .= " $feed_type";
	# the title is built from request parameters and ends up as XML
	# character data, so it has to be escaped
	$title = esc_html($title);
	my $descr = git_get_project_description($project);
	if (!defined $descr) {
		$descr = "$project " .
		         ($format eq 'rss' ? 'RSS' : 'Atom') .
		         " feed";
	}
	$descr = esc_html($descr);
	my $owner = git_get_project_owner($project);
	$owner = esc_html($owner);

	#header
	my $alt_url;
	if (defined $file_name) {
		$alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
	} elsif (defined $hash) {
		$alt_url = href(-full=>1, action=>"log", hash=>$hash);
	} else {
		$alt_url = href(-full=>1, action=>"summary");
	}
	print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
	if ($format eq 'rss') {
		print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
		print "<title>$title</title>\n" .
		      "<link>$alt_url</link>\n" .
		      "<description>$descr</description>\n" .
		      "<language>en</language>\n" .
		      # project owner is responsible for 'editorial' content
		      "<managingEditor>$owner</managingEditor>\n";
		if (defined $logo || defined $favicon) {
			# prefer the logo to the favicon, since RSS
			# doesn't allow both
			my $img = esc_url($logo || $favicon);
			print "<image>\n" .
			      "<url>$img</url>\n" .
			      "<title>$title</title>\n" .
			      "<link>$alt_url</link>\n" .
			      "</image>\n";
		}
		if (%latest_date) {
			print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
			print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
		}
		print "<generator>gitweb v.$version/$git_version</generator>\n";
	} elsif ($format eq 'atom') {
		print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
		print "<title>$title</title>\n" .
		      "<subtitle>$descr</subtitle>\n" .
		      '<link rel="alternate" type="text/html" href="' .
		      $alt_url . '" />' . "\n" .
		      '<link rel="self" type="' . $content_type . '" href="' .
		      $cgi->self_url() . '" />' . "\n" .
		      "<id>" . href(-full=>1) . "</id>\n" .
		      # use project owner for feed author
		      "<author><name>$owner</name></author>\n";
		if (defined $favicon) {
			print "<icon>" . esc_url($favicon) . "</icon>\n";
		}
		if (defined $logo) {
			# not twice as wide as tall: 72 x 27 pixels
			print "<logo>" . esc_url($logo) . "</logo>\n";
		}
		if (! %latest_date) {
			# dummy date to keep the feed valid until commits trickle in:
			print "<updated>1970-01-01T00:00:00Z</updated>\n";
		} else {
			print "<updated>$latest_date{'iso-8601'}</updated>\n";
		}
		print "<generator version='$version/$git_version'>gitweb</generator>\n";
	}

	# contents
	foreach my $i (0 .. $#commitlist) {
		my %co = %{$commitlist[$i]};
		my $commit = $co{'id'};
		# we read 150, we always show the first 20 and, beyond those,
		# the ones more recent than 48 hours
		if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
			last;
		}
		my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

		# get list of changed files; a commit whose diff-tree cannot be
		# read is left out of the feed
		open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			$co{'parent'} || "--root",
			$co{'id'}, "--", (defined $file_name ? $file_name : ())
			or next;
		my @difftree = map { chomp; $_ } <$fd>;
		close $fd
			or next;

		# print element (entry, item)
		my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
		if ($format eq 'rss') {
			print "<item>\n" .
			      "<title>" . esc_html($co{'title'}) . "</title>\n" .
			      "<author>" . esc_html($co{'author'}) . "</author>\n" .
			      "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
			      "<guid isPermaLink=\"true\">$co_url</guid>\n" .
			      "<link>$co_url</link>\n" .
			      "<description>" . esc_html($co{'title'}) . "</description>\n" .
			      "<content:encoded>" .
			      "<![CDATA[\n";
		} elsif ($format eq 'atom') {
			print "<entry>\n" .
			      "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
			      "<updated>$cd{'iso-8601'}</updated>\n" .
			      "<author>\n" .
			      "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
			if ($co{'author_email'}) {
				print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
			}
			print "</author>\n" .
			      # use committer for contributor
			      "<contributor>\n" .
			      "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
			if ($co{'committer_email'}) {
				print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
			}
			print "</contributor>\n" .
			      "<published>$cd{'iso-8601'}</published>\n" .
			      "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
			      "<id>$co_url</id>\n" .
			      "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
			      "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
		}
		# commit message; escaped on output so that the parsed commit
		# data itself is left untouched
		print "<pre>\n";
		foreach my $line (@{$co{'comment'}}) {
			print esc_html($line) . "\n";
		}
		print "</pre><ul>\n";
		# one list item per changed file, with short links to its views
		foreach my $difftree_line (@difftree) {
			my %difftree = parse_difftree_raw_line($difftree_line);
			next if !$difftree{'from_id'};

			my $file = $difftree{'file'} || $difftree{'to_file'};

			print "<li>" .
			      "[" .
			      $cgi->a({-href => href(-full=>1, action=>"blobdiff",
			                             hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
			                             hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
			                             file_name=>$file, file_parent=>$difftree{'from_file'}),
			              -title => "diff"}, 'D');
			if ($have_blame) {
				print $cgi->a({-href => href(-full=>1, action=>"blame",
				                             file_name=>$file, hash_base=>$commit),
				              -title => "blame"}, 'B');
			}
			# if this is not a feed of a file history
			if (!defined $file_name || $file_name ne $file) {
				print $cgi->a({-href => href(-full=>1, action=>"history",
				                             file_name=>$file, hash=>$commit),
				              -title => "history"}, 'H');
			}
			$file = esc_path($file);
			print "] ".
			      "$file</li>\n";
		}
		if ($format eq 'rss') {
			print "</ul>]]>\n" .
			      "</content:encoded>\n" .
			      "</item>\n";
		} elsif ($format eq 'atom') {
			print "</ul>\n</div>\n" .
			      "</content>\n" .
			      "</entry>\n";
		}
	}

	# end of feed
	if ($format eq 'rss') {
		print "</channel>\n</rss>\n";
	} elsif ($format eq 'atom') {
		print "</feed>\n";
	}
}
7887
# Action handler: the project feed in RSS format (see git_feed).
sub git_rss {
	return git_feed('rss');
}
7891
# Action handler: the project feed in Atom format (see git_feed).
sub git_atom {
	return git_feed('atom');
}
7895
# Action handler: OPML document listing the RSS feed of every project.
#
# The list comes from git_get_projects_list, restricted by $project_filter;
# an empty list is answered with a 404 error. Projects for which no head
# hash or no head commit can be obtained are left out.
# Assigns the $git_dir global for each project it looks at.
sub git_opml {
	my @projects = git_get_projects_list($project_filter, $strict_export);
	die_error(404, "No projects found")
		unless @projects;

	print $cgi->header(
		-type => 'text/xml',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="opml.xml"');

	my $site_title = esc_html($site_name);
	# mention the subdirectory in the title when the list is filtered
	my $scope = defined $project_filter
		? " within subdirectory " . esc_html($project_filter)
		: "";
	print <<OPML_HEAD;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$site_title OPML Export$scope</title>
</head>
<body>
<outline text="git RSS feeds">
OPML_HEAD

	foreach my $entry (@projects) {
		my %info = %{$entry};
		my $proj_path = $info{'path'};

		my $head = git_get_head_hash($proj_path);
		next unless defined $head;

		# point at this project before parsing its head commit
		$git_dir = "$projectroot/$proj_path";
		my %co = parse_commit($head);
		next unless %co;

		my $label    = esc_html(chop_str($proj_path, 25, 5));
		my $rss_url  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
		my $html_url = href('project' => $proj_path, 'action' => 'summary', -full => 1);
		print "<outline type=\"rss\" text=\"$label\" title=\"$label\" xmlUrl=\"$rss_url\" htmlUrl=\"$html_url\"/>\n";
	}

	print <<OPML_TAIL;
</outline>
</body>
</opml>
OPML_TAIL
}