gitweb / gitweb.perlon commit gitweb: add project_filter to limit project list to a subdirectory (19d2d23)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
# Wall-clock timestamp taken when this statement runs, stored as the
# [seconds, microseconds] pair returned by Time::HiRes::gettimeofday().
# Presumably consumed together with tv_interval() when reporting page
# generation time -- the consumer is not in this part of the file.
our $t0 = [ gettimeofday() ];
# Running count of git commands executed so far; incremented by the code
# that runs them (see evaluate_git_version() for an example).
our $number_of_git_cmds = 0;

BEGIN {
        # Only when running under mod_perl (MOD_PERL set in the environment):
        # ask CGI.pm to compile its methods up front.
        CGI->compile() if $ENV{'MOD_PERL'};
}

# gitweb version string.  The ++GIT_VERSION++ token looks like a build-time
# placeholder that is substituted when gitweb.cgi is generated -- confirm
# against the build rules.
our $version = "++GIT_VERSION++";
  31
  32our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  33sub evaluate_uri {
  34        our $cgi;
  35
  36        our $my_url = $cgi->url();
  37        our $my_uri = $cgi->url(-absolute => 1);
  38
  39        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  40        # needed and used only for URLs with nonempty PATH_INFO
  41        our $base_url = $my_url;
  42
  43        # When the script is used as DirectoryIndex, the URL does not contain the name
  44        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  45        # have to do it ourselves. We make $path_info global because it's also used
  46        # later on.
  47        #
  48        # Another issue with the script being the DirectoryIndex is that the resulting
  49        # $my_url data is not the full script URL: this is good, because we want
  50        # generated links to keep implying the script name if it wasn't explicitly
  51        # indicated in the URL we're handling, but it means that $my_url cannot be used
  52        # as base URL.
  53        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  54        # to build the base URL ourselves:
  55        our $path_info = $ENV{"PATH_INFO"};
  56        if ($path_info) {
  57                if ($my_url =~ s,\Q$path_info\E$,, &&
  58                    $my_uri =~ s,\Q$path_info\E$,, &&
  59                    defined $ENV{'SCRIPT_NAME'}) {
  60                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  61                }
  62        }
  63
  64        # target of the home link on top of all pages
  65        our $home_link = $my_uri || "/";
  66}
  67
# NOTE(review): the "++NAME++" strings in this section look like build-time
# placeholders that get substituted when gitweb.cgi is generated; confirm
# against the build rules.  All of these variables are package globals so
# that a configuration file can override them.

# core git executable to use
# this can just be "git" if your webserver has a sensible PATH
our $GIT = "++GIT_BINDIR++/git";

# absolute fs-path which will be prepended to the project path
#our $projectroot = "/pub/scm";
our $projectroot = "++GITWEB_PROJECTROOT++";

# fs traversing limit for getting project list
# the number is relative to the projectroot
our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";

# string of the home link on top of all pages
our $home_link_str = "++GITWEB_HOME_LINK_STR++";

# name of your site or organization to appear in page titles
# replace this with something more descriptive for clearer bookmarks
# (falls back to "<SERVER_NAME> Git", or "Untitled Git" when the
# SERVER_NAME environment variable is not set either)
our $site_name = "++GITWEB_SITENAME++"
                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";

# html snippet to include in the <head> section of each page
our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
# filename of html text to include at top of each page
our $site_header = "++GITWEB_SITE_HEADER++";
# html text to include at home page
our $home_text = "++GITWEB_HOMETEXT++";
# filename of html text to include at bottom of each page
our $site_footer = "++GITWEB_SITE_FOOTER++";

# URI of stylesheets
our @stylesheets = ("++GITWEB_CSS++");
# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
our $stylesheet = undef;
# URI of GIT logo (72x27 size)
our $logo = "++GITWEB_LOGO++";
# URI of GIT favicon, assumed to be image/png type
our $favicon = "++GITWEB_FAVICON++";
# URI of gitweb.js (JavaScript code for gitweb)
our $javascript = "++GITWEB_JS++";

# URI and label (title) of GIT logo link
#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
#our $logo_label = "git documentation";
our $logo_url = "http://git-scm.com/";
our $logo_label = "git homepage";

# source of projects list
our $projects_list = "++GITWEB_LIST++";

# the width (in characters) of the projects list "Description" column
our $projects_list_description_width = 25;

# group projects by category on the projects list
# (enabled if this variable evaluates to true)
our $projects_list_group_categories = 0;

# default category if none specified
# (leave the empty string for no category)
our $project_list_default_category = "";

# default order of projects list
# valid values are none, project, descr, owner, and age
our $default_projects_order = "project";

# show repository only if this file exists
# (only effective if this variable evaluates to true)
our $export_ok = "++GITWEB_EXPORT_OK++";

# show repository only if this subroutine returns true
# when given the path to the project, for example:
#    sub { return -e "$_[0]/git-daemon-export-ok"; }
our $export_auth_hook = undef;

# only allow viewing of repositories also shown on the overview page
our $strict_export = "++GITWEB_STRICT_EXPORT++";

# list of git base URLs used for URL to where fetch project from,
# i.e. full URL is "$git_base_url/$project"
# (an empty placeholder value is filtered out, leaving the list empty)
our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");

# default blob_plain mimetype and default charset for text/plain blob
our $default_blob_plain_mimetype = 'text/plain';
our $default_text_plain_charset  = undef;

# file to use for guessing MIME types before trying /etc/mime.types
# (relative to the current git repository)
our $mimetypes_file = undef;

# assume this charset if a line contains non-UTF-8 characters;
# it should be a valid encoding (see Encode::Supported(3pm) for the list)
# in which all byte sequences are valid, for example
# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
# could even be 'utf-8' for the old behavior)
our $fallback_encoding = 'latin1';

# rename detection options for git-diff and git-diff-tree
# - default is '-M', with the cost proportional to
#   (number of removed files) * (number of new files).
# - more costly is '-C' (which implies '-M'), with the cost proportional to
#   (number of changed files + number of removed files) * (number of new files)
# - even more costly is '-C', '--find-copies-harder' with cost
#   (number of files in the original tree) * (number of new files)
# - one might want to include '-B' option, e.g. '-B', '-M'
our @diff_opts = ('-M'); # taken from git_commit

# Disables features that would allow repository owners to inject script into
# the gitweb domain.
our $prevent_xss = 0;

# Path to the highlight executable to use (must be the one from
# http://www.andre-simon.de due to assumptions about parameters and output).
# Useful if highlight is not installed on your webserver's PATH.
# [Default: highlight]
our $highlight_bin = "++HIGHLIGHT_BIN++";
 182
# information about snapshot formats that gitweb is capable of serving
# (filter_snapshot_fmts() only lets through names that are keys of this
# hash and whose entry is not marked 'disabled')
our %known_snapshot_formats = (
        # name => {
        #       'display' => display name,
        #       'type' => mime type,
        #       'suffix' => filename suffix,
        #       'format' => --format for git-archive,
        #       'compressor' => [compressor command and arguments]
        #                       (array reference, optional)
        #       'disabled' => boolean (optional)}
        #
        'tgz' => {
                'display' => 'tar.gz',
                'type' => 'application/x-gzip',
                'suffix' => '.tar.gz',
                'format' => 'tar',
                'compressor' => ['gzip', '-n']},

        'tbz2' => {
                'display' => 'tar.bz2',
                'type' => 'application/x-bzip2',
                'suffix' => '.tar.bz2',
                'format' => 'tar',
                'compressor' => ['bzip2']},

        # xz is known but switched off by default via 'disabled'
        'txz' => {
                'display' => 'tar.xz',
                'type' => 'application/x-xz',
                'suffix' => '.tar.xz',
                'format' => 'tar',
                'compressor' => ['xz'],
                'disabled' => 1},

        # no 'compressor' entry for zip
        'zip' => {
                'display' => 'zip',
                'type' => 'application/x-zip',
                'suffix' => '.zip',
                'format' => 'zip'},
);

# Aliases so we understand old gitweb.snapshot values in repository
# configuration.  filter_snapshot_fmts() replaces an alias by the value
# given here.
our %known_snapshot_format_aliases = (
        'gzip'  => 'tgz',
        'bzip2' => 'tbz2',
        'xz'    => 'txz',

        # backward compatibility: legacy gitweb config support
        # (these names are recognized but map to no format at all, so they
        # end up being dropped by filter_snapshot_fmts())
        'x-gzip' => undef, 'gz' => undef,
        'x-bzip2' => undef, 'bz2' => undef,
        'x-zip' => undef, '' => undef,
);
 235
# Pixel sizes for icons and avatars. If the default font sizes or line
# heights are changed, it may be appropriate to change these values too via
# $GITWEB_CONFIG.
our %avatar_size = (
        'default' => 16,
        'double'  => 32
);

# Used to set the maximum load that we will still respond to gitweb queries.
# If the server load exceeds this value then return a "503 server busy" error.
# If gitweb cannot determine the server load, it is taken to be 0.
# Leave it undefined (or set to 'undef') to turn off load checking.
our $maxload = 300;

# configuration for 'highlight' (http://www.andre-simon.de/)
# match by basename: file basename => name of syntax
our %highlight_basename = (
        #'Program' => 'py',
        #'Library' => 'py',
        'SConstruct' => 'py', # SCons equivalent of Makefile
        'Makefile' => 'make',
);
# match by extension: file extension => name of syntax
our %highlight_ext = (
        # main extensions, defining name of syntax;
        # see files in /usr/share/highlight/langDefs/ directory
        # (each of these extensions maps to itself)
        map { $_ => $_ }
                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
        # alternate extensions, see /etc/highlight/filetypes.conf
        'h' => 'c',
        map { $_ => 'sh'  } qw(bash zsh ksh),
        map { $_ => 'cpp' } qw(cxx c++ cc),
        map { $_ => 'php' } qw(php3 php4 php5 phps),
        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
        map { $_ => 'make'} qw(mak mk),
        map { $_ => 'xml' } qw(xhtml html htm),
);
 273
# You define site-wide feature defaults here; override them with
# $GITWEB_CONFIG as necessary.
our %feature = (
        # feature => {
        #       'sub' => feature-sub (subroutine),
        #       'override' => allow-override (boolean),
        #       'default' => [ default options...] (array reference)}
        #
        # if a feature is overridable (meaning that allow-override has a true
        # value) and a project is selected, then feature-sub will be called
        # with the default options as parameters; the return value of
        # feature-sub is the effective value of the feature for that project
        #
        # if there is no 'sub' key (no feature-sub), then the feature cannot
        # be overridden
        #
        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
        # is enabled

        # Enable the 'blame' blob view, showing the last commit that modified
        # each line in the file. This can be very CPU-intensive.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'blame'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'blame'}{'override'} = 1;
        # and in project config gitweb.blame = 0|1;
        'blame' => {
                'sub' => sub { feature_bool('blame', @_) },
                'override' => 0,
                'default' => [0]},

        # Enable the 'snapshot' link, providing a compressed archive of any
        # tree. This can potentially generate high traffic if you have large
        # projects.

        # Value is a list of formats defined in %known_snapshot_formats that
        # you wish to offer.
        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'snapshot'}{'default'} = [];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'snapshot'}{'override'} = 1;
        # and in project config, a comma-separated list of formats or "none"
        # to disable.  Example: gitweb.snapshot = tbz2,zip;
        'snapshot' => {
                'sub' => \&feature_snapshot,
                'override' => 0,
                'default' => ['tgz']},

        # Enable text search, which will list the commits which match author,
        # committer or commit text to a given string.  Enabled by default.
        # Project specific override is not supported.
        #
        # Note that this controls all search features, which means that if
        # it is disabled, then 'grep' and 'pickaxe' search would also be
        # disabled.
        'search' => {
                'override' => 0,
                'default' => [1]},

        # Enable grep search, which will list the files in currently selected
        # tree containing the given string. Enabled by default. This can be
        # potentially CPU-intensive, of course.
        # Note that you need to have 'search' feature enabled too.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'grep'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'grep'}{'override'} = 1;
        # and in project config gitweb.grep = 0|1;
        'grep' => {
                'sub' => sub { feature_bool('grep', @_) },
                'override' => 0,
                'default' => [1]},

        # Enable the pickaxe search, which will list the commits that modified
        # a given string in a file. This can be a practical and quite a bit
        # faster alternative to 'blame', but still potentially CPU-intensive.
        # Note that you need to have 'search' feature enabled too.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'override'} = 1;
        # and in project config gitweb.pickaxe = 0|1;
        'pickaxe' => {
                'sub' => sub { feature_bool('pickaxe', @_) },
                'override' => 0,
                'default' => [1]},

        # Enable showing size of blobs in a 'tree' view, in a separate
        # column, similar to what 'ls -l' does.  This costs a bit of IO.

        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'default'} = [0];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'override'} = 1;
        # and in project config gitweb.showsizes = 0|1;
        # (note: the config key is 'showsizes', without the dash)
        'show-sizes' => {
                'sub' => sub { feature_bool('showsizes', @_) },
                'override' => 0,
                'default' => [1]},

        # Make gitweb use an alternative format of the URLs which can be
        # more readable and natural-looking: project name is embedded
        # directly in the path and the query string contains other
        # auxiliary information. All gitweb installations recognize
        # URL in either format; this configures in which formats gitweb
        # generates links.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'pathinfo'}{'default'} = [1];
        # Project specific override is not supported.

        # Note that you will need to change the default location of CSS,
        # favicon, logo and possibly other files to an absolute URL. Also,
        # if gitweb.cgi serves as your indexfile, you will need to force
        # $my_uri to contain the script name in your $GITWEB_CONFIG.
        'pathinfo' => {
                'override' => 0,
                'default' => [0]},

        # Make gitweb consider projects in project root subdirectories
        # to be forks of existing projects. Given project $projname.git,
        # projects matching $projname/*.git will not be shown in the main
        # projects list, instead a '+' mark will be added to $projname
        # there and a 'forks' view will be enabled for the project, listing
        # all the forks. If project list is taken from a file, forks have
        # to be listed after the main project.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'forks'}{'default'} = [1];
        # Project specific override is not supported.
        'forks' => {
                'override' => 0,
                'default' => [0]},

        # Insert custom links to the action bar of all project pages.
        # This enables you mainly to link to third-party scripts integrating
        # into gitweb; e.g. git-browser for graphical history representation
        # or custom web-based repository administration interface.

        # The 'default' value consists of a list of triplets in the form
        # (label, link, position) where position is the label after which
        # to insert the link and link is a format string where %n expands
        # to the project name, %f to the project path within the filesystem,
        # %h to the current hash (h gitweb parameter) and %b to the current
        # hash base (hb gitweb parameter); %% expands to %.

        # To enable system wide have in $GITWEB_CONFIG e.g.
        # $feature{'actions'}{'default'} = [('graphiclog',
        #       '/git-browser/by-commit.html?r=%n', 'summary')];
        # Project specific override is not supported.
        'actions' => {
                'override' => 0,
                'default' => []},

        # Allow gitweb to scan project content tags of project repository,
        # and display the popular Web 2.0-ish "tag cloud" near the projects
        # list.  Note that this is something COMPLETELY different from the
        # normal Git tags.

        # gitweb by itself can show existing tags, but it does not handle
        # tagging itself; you need to do it externally, outside gitweb.
        # The format is described in git_get_project_ctags() subroutine.
        # You may want to install the HTML::TagCloud Perl module to get
        # a pretty tag cloud instead of just a list of tags.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'ctags'}{'default'} = [1];
        # Project specific override is not supported.

        # In the future whether ctags editing is enabled might depend
        # on the value, but using 1 should always mean no editing of ctags.
        'ctags' => {
                'override' => 0,
                'default' => [0]},

        # The maximum number of patches in a patchset generated in patch
        # view. Set this to 0 or undef to disable patch view, or to a
        # negative number to remove any limit.

        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'patches'}{'default'} = [0];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'patches'}{'override'} = 1;
        # and in project config gitweb.patches = 0|n;
        # where n is the maximum number of patches allowed in a patchset.
        'patches' => {
                'sub' => \&feature_patches,
                'override' => 0,
                'default' => [16]},

        # Avatar support. When this feature is enabled, views such as
        # shortlog or commit will display an avatar associated with
        # the email of the committer(s) and/or author(s).

        # Currently available providers are gravatar and picon.
        # If an unknown provider is specified, the feature is disabled.

        # Gravatar depends on Digest::MD5.
        # Picon currently relies on the indiana.edu database.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'avatar'}{'default'} = ['<provider>'];
        # where <provider> is either gravatar or picon.
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'avatar'}{'override'} = 1;
        # and in project config gitweb.avatar = <provider>;
        'avatar' => {
                'sub' => \&feature_avatar,
                'override' => 0,
                'default' => ['']},

        # Enable displaying how much time and how many git commands
        # it took to generate and display page.  Disabled by default.
        # Project specific override is not supported.
        'timed' => {
                'override' => 0,
                'default' => [0]},

        # Enable turning some links into links to actions which require
        # JavaScript to run (like 'blame_incremental').  Not enabled by
        # default.  Project specific override is currently not supported.
        'javascript-actions' => {
                'override' => 0,
                'default' => [0]},

        # Enable and configure ability to change common timezone for dates
        # in gitweb output via JavaScript.  Enabled by default.
        # Project specific override is not supported.
        'javascript-timezone' => {
                'override' => 0,
                'default' => [
                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
                                     # or undef to turn off this feature
                        'gitweb_tz', # name of cookie where to store selected timezone
                        'datetime',  # CSS class used to mark up dates for manipulation
                ]},

        # Syntax highlighting support. This is based on Daniel Svensson's
        # and Sham Chukoury's work in gitweb-xmms2.git.
        # It requires the 'highlight' program present in $PATH,
        # and therefore is disabled by default.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'highlight'}{'default'} = [1];
        # (a feature-sub is defined, so setting
        # $feature{'highlight'}{'override'} = 1 hands the decision to
        # feature_bool('highlight', ...) for the selected project)

        'highlight' => {
                'sub' => sub { feature_bool('highlight', @_) },
                'override' => 0,
                'default' => [0]},

        # Enable displaying of remote heads in the heads list

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'remote_heads'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'remote_heads'}{'override'} = 1;
        # and in project config gitweb.remote_heads = 0|1;
        'remote_heads' => {
                'sub' => sub { feature_bool('remote_heads', @_) },
                'override' => 0,
                'default' => [0]},
);
 539
 540sub gitweb_get_feature {
 541        my ($name) = @_;
 542        return unless exists $feature{$name};
 543        my ($sub, $override, @defaults) = (
 544                $feature{$name}{'sub'},
 545                $feature{$name}{'override'},
 546                @{$feature{$name}{'default'}});
 547        # project specific override is possible only if we have project
 548        our $git_dir; # global variable, declared later
 549        if (!$override || !defined $git_dir) {
 550                return @defaults;
 551        }
 552        if (!defined $sub) {
 553                warn "feature $name is not overridable";
 554                return @defaults;
 555        }
 556        return $sub->(@defaults);
 557}
 558
 559# A wrapper to check if a given feature is enabled.
 560# With this, you can say
 561#
 562#   my $bool_feat = gitweb_check_feature('bool_feat');
 563#   gitweb_check_feature('bool_feat') or somecode;
 564#
 565# instead of
 566#
 567#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 568#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 569#
 570sub gitweb_check_feature {
 571        return (gitweb_get_feature(@_))[0];
 572}
 573
 574
 575sub feature_bool {
 576        my $key = shift;
 577        my ($val) = git_get_project_config($key, '--bool');
 578
 579        if (!defined $val) {
 580                return ($_[0]);
 581        } elsif ($val eq 'true') {
 582                return (1);
 583        } elsif ($val eq 'false') {
 584                return (0);
 585        }
 586}
 587
 588sub feature_snapshot {
 589        my (@fmts) = @_;
 590
 591        my ($val) = git_get_project_config('snapshot');
 592
 593        if ($val) {
 594                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 595        }
 596
 597        return @fmts;
 598}
 599
 600sub feature_patches {
 601        my @val = (git_get_project_config('patches', '--int'));
 602
 603        if (@val) {
 604                return @val;
 605        }
 606
 607        return ($_[0]);
 608}
 609
 610sub feature_avatar {
 611        my @val = (git_get_project_config('avatar'));
 612
 613        return @val ? @val : @_;
 614}
 615
 616# checking HEAD file with -e is fragile if the repository was
 617# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 618# and then pruned.
 619sub check_head_link {
 620        my ($dir) = @_;
 621        my $headfile = "$dir/HEAD";
 622        return ((-e $headfile) ||
 623                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 624}
 625
 626sub check_export_ok {
 627        my ($dir) = @_;
 628        return (check_head_link($dir) &&
 629                (!$export_ok || -e "$dir/$export_ok") &&
 630                (!$export_auth_hook || $export_auth_hook->($dir)));
 631}
 632
 633# process alternate names for backward compatibility
 634# filter out unsupported (unknown) snapshot formats
 635sub filter_snapshot_fmts {
 636        my @fmts = @_;
 637
 638        @fmts = map {
 639                exists $known_snapshot_format_aliases{$_} ?
 640                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 641        @fmts = grep {
 642                exists $known_snapshot_formats{$_} &&
 643                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 644}
 645
# Controls how configuration is handled across requests:
# - if set to a code reference, that code is to be run once per request,
#   allowing configuration that changes with each request to be updated,
#   while the rest of the config file is run only once;
# - otherwise, if it is false, gitweb processes the config file only once;
# - if it is true, the gitweb config is run for each request.
our $per_request_config = 1;
 653
 654# read and parse gitweb config file given by its parameter.
 655# returns true on success, false on recoverable error, allowing
 656# to chain this subroutine, using first file that exists.
 657# dies on errors during parsing config file, as it is unrecoverable.
 658sub read_config_file {
 659        my $filename = shift;
 660        return unless defined $filename;
 661        # die if there are errors parsing config file
 662        if (-e $filename) {
 663                do $filename;
 664                die $@ if $@;
 665                return 1;
 666        }
 667        return;
 668}
 669
 670our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
 671sub evaluate_gitweb_config {
 672        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 673        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 674        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
 675
 676        # Protect agains duplications of file names, to not read config twice.
 677        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
 678        # there possibility of duplication of filename there doesn't matter.
 679        $GITWEB_CONFIG = ""        if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
 680        $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
 681
 682        # Common system-wide settings for convenience.
 683        # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
 684        read_config_file($GITWEB_CONFIG_COMMON);
 685
 686        # Use first config file that exists.  This means use the per-instance
 687        # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
 688        read_config_file($GITWEB_CONFIG) and return;
 689        read_config_file($GITWEB_CONFIG_SYSTEM);
 690}
 691
 692# Get loadavg of system, to compare against $maxload.
 693# Currently it requires '/proc/loadavg' present to get loadavg;
 694# if it is not present it returns 0, which means no load checking.
 695sub get_loadavg {
 696        if( -e '/proc/loadavg' ){
 697                open my $fd, '<', '/proc/loadavg'
 698                        or return 0;
 699                my @load = split(/\s+/, scalar <$fd>);
 700                close $fd;
 701
 702                # The first three columns measure CPU and IO utilization of the last one,
 703                # five, and 10 minute periods.  The fourth column shows the number of
 704                # currently running processes and the total number of processes in the m/n
 705                # format.  The last column displays the last process ID used.
 706                return $load[0] || 0;
 707        }
 708        # additional checks for load average should go here for things that don't export
 709        # /proc/loadavg
 710
 711        return 0;
 712}
 713
 714# version of the core git binary
 715our $git_version;
 716sub evaluate_git_version {
 717        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 718        $number_of_git_cmds++;
 719}
 720
 721sub check_loadavg {
 722        if (defined $maxload && get_loadavg() > $maxload) {
 723                die_error(503, "The load average on the server is too high");
 724        }
 725}
 726
 727# ======================================================================
 728# input validation and dispatch
 729
# Input parameters can be collected from a variety of sources (presently, CGI
# query parameters and PATH_INFO), so we define an %input_params hash that
# collects them all together during validation: this allows subsequent uses
# (e.g. href()) to be agnostic of the parameter origin.
#
# Keys are the long parameter names listed in @cgi_param_mapping; the hash is
# filled by evaluate_query_params() and then by evaluate_path_info().

our %input_params = ();
 736
# Input parameters are stored with the long parameter name as key. This will
# also be used in the href subroutine to convert parameters to their CGI
# equivalent, and since the href() usage is the most frequent one, we store
# the name -> CGI key mapping here, instead of the reverse.
#
# The mapping is kept both as an ordered list (@cgi_param_mapping, which
# href() walks pairwise so query parameters come out in this order) and as a
# hash (%cgi_param_mapping, for lookup by long name).
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
        project => "p",
        action => "a",
        file_name => "f",
        file_parent => "fp",
        hash => "h",
        hash_parent => "hp",
        hash_base => "hb",
        hash_parent_base => "hpb",
        page => "pg",
        order => "o",
        searchtext => "s",
        searchtype => "st",
        snapshot_format => "sf",
        extra_options => "opt",
        search_use_regexp => "sr",
        ctag => "by_tag",
        diff_style => "ds",
        project_filter => "pf",
        # this must be last entry (for manipulation from JavaScript)
        javascript => "js"
);
our %cgi_param_mapping = @cgi_param_mapping;
 768
# We will also need to know the possible actions, for validation.
# This is the dispatch table: it maps each action name (as it appears in the
# 'a' CGI parameter or in PATH_INFO) to the subroutine implementing it.
# validate_action() and evaluate_path_info() consult its keys, and dispatch()
# calls the selected handler.
our %actions = (
        "blame" => \&git_blame,
        "blame_incremental" => \&git_blame_incremental,
        "blame_data" => \&git_blame_data,
        "blobdiff" => \&git_blobdiff,
        "blobdiff_plain" => \&git_blobdiff_plain,
        "blob" => \&git_blob,
        "blob_plain" => \&git_blob_plain,
        "commitdiff" => \&git_commitdiff,
        "commitdiff_plain" => \&git_commitdiff_plain,
        "commit" => \&git_commit,
        "forks" => \&git_forks,
        "heads" => \&git_heads,
        "history" => \&git_history,
        "log" => \&git_log,
        "patch" => \&git_patch,
        "patches" => \&git_patches,
        "remotes" => \&git_remotes,
        "rss" => \&git_rss,
        "atom" => \&git_atom,
        "search" => \&git_search,
        "search_help" => \&git_search_help,
        "shortlog" => \&git_shortlog,
        "summary" => \&git_summary,
        "tag" => \&git_tag,
        "tags" => \&git_tags,
        "tree" => \&git_tree,
        "snapshot" => \&git_snapshot,
        "object" => \&git_object,
        # those below don't need $project
        # (dispatch() exempts exactly these three from its "Project needed" check)
        "opml" => \&git_opml,
        "project_list" => \&git_project_list,
        "project_index" => \&git_project_index,
);
 804
# Finally, we have the hash of allowed extra_options for the commands that
# allow them: each key is an option string accepted in the 'opt' parameter,
# and its value is the list of action names the option may be combined with
# (checked in evaluate_and_validate_params()).
our %allowed_options = (
        "--no-merges" => [ qw(rss atom log shortlog history) ],
);
 810
 811# fill %input_params with the CGI parameters. All values except for 'opt'
 812# should be single values, but opt can be an array. We should probably
 813# build an array of parameters that can be multi-valued, but since for the time
 814# being it's only this one, we just single it out
 815sub evaluate_query_params {
 816        our $cgi;
 817
 818        while (my ($name, $symbol) = each %cgi_param_mapping) {
 819                if ($symbol eq 'opt') {
 820                        $input_params{$name} = [ $cgi->param($symbol) ];
 821                } else {
 822                        $input_params{$name} = $cgi->param($symbol);
 823                }
 824        }
 825}
 826
 827# now read PATH_INFO and update the parameter list for missing parameters
 828sub evaluate_path_info {
 829        return if defined $input_params{'project'};
 830        return if !$path_info;
 831        $path_info =~ s,^/+,,;
 832        return if !$path_info;
 833
 834        # find which part of PATH_INFO is project
 835        my $project = $path_info;
 836        $project =~ s,/+$,,;
 837        while ($project && !check_head_link("$projectroot/$project")) {
 838                $project =~ s,/*[^/]*$,,;
 839        }
 840        return unless $project;
 841        $input_params{'project'} = $project;
 842
 843        # do not change any parameters if an action is given using the query string
 844        return if $input_params{'action'};
 845        $path_info =~ s,^\Q$project\E/*,,;
 846
 847        # next, check if we have an action
 848        my $action = $path_info;
 849        $action =~ s,/.*$,,;
 850        if (exists $actions{$action}) {
 851                $path_info =~ s,^$action/*,,;
 852                $input_params{'action'} = $action;
 853        }
 854
 855        # list of actions that want hash_base instead of hash, but can have no
 856        # pathname (f) parameter
 857        my @wants_base = (
 858                'tree',
 859                'history',
 860        );
 861
 862        # we want to catch, among others
 863        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 864        my ($parentrefname, $parentpathname, $refname, $pathname) =
 865                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 866
 867        # first, analyze the 'current' part
 868        if (defined $pathname) {
 869                # we got "branch:filename" or "branch:dir/"
 870                # we could use git_get_type(branch:pathname), but:
 871                # - it needs $git_dir
 872                # - it does a git() call
 873                # - the convention of terminating directories with a slash
 874                #   makes it superfluous
 875                # - embedding the action in the PATH_INFO would make it even
 876                #   more superfluous
 877                $pathname =~ s,^/+,,;
 878                if (!$pathname || substr($pathname, -1) eq "/") {
 879                        $input_params{'action'} ||= "tree";
 880                        $pathname =~ s,/$,,;
 881                } else {
 882                        # the default action depends on whether we had parent info
 883                        # or not
 884                        if ($parentrefname) {
 885                                $input_params{'action'} ||= "blobdiff_plain";
 886                        } else {
 887                                $input_params{'action'} ||= "blob_plain";
 888                        }
 889                }
 890                $input_params{'hash_base'} ||= $refname;
 891                $input_params{'file_name'} ||= $pathname;
 892        } elsif (defined $refname) {
 893                # we got "branch". In this case we have to choose if we have to
 894                # set hash or hash_base.
 895                #
 896                # Most of the actions without a pathname only want hash to be
 897                # set, except for the ones specified in @wants_base that want
 898                # hash_base instead. It should also be noted that hand-crafted
 899                # links having 'history' as an action and no pathname or hash
 900                # set will fail, but that happens regardless of PATH_INFO.
 901                if (defined $parentrefname) {
 902                        # if there is parent let the default be 'shortlog' action
 903                        # (for http://git.example.com/repo.git/A..B links); if there
 904                        # is no parent, dispatch will detect type of object and set
 905                        # action appropriately if required (if action is not set)
 906                        $input_params{'action'} ||= "shortlog";
 907                }
 908                if ($input_params{'action'} &&
 909                    grep { $_ eq $input_params{'action'} } @wants_base) {
 910                        $input_params{'hash_base'} ||= $refname;
 911                } else {
 912                        $input_params{'hash'} ||= $refname;
 913                }
 914        }
 915
 916        # next, handle the 'parent' part, if present
 917        if (defined $parentrefname) {
 918                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 919                # someproject/blobdiff/oldrev..newrev:/filename
 920                if ($parentpathname) {
 921                        $parentpathname =~ s,^/+,,;
 922                        $parentpathname =~ s,/$,,;
 923                        $input_params{'file_parent'} ||= $parentpathname;
 924                } else {
 925                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 926                }
 927                # we assume that hash_parent_base is wanted if a path was specified,
 928                # or if the action wants hash_base instead of hash
 929                if (defined $input_params{'file_parent'} ||
 930                        grep { $_ eq $input_params{'action'} } @wants_base) {
 931                        $input_params{'hash_parent_base'} ||= $parentrefname;
 932                } else {
 933                        $input_params{'hash_parent'} ||= $parentrefname;
 934                }
 935        }
 936
 937        # for the snapshot action, we allow URLs in the form
 938        # $project/snapshot/$hash.ext
 939        # where .ext determines the snapshot and gets removed from the
 940        # passed $refname to provide the $hash.
 941        #
 942        # To be able to tell that $refname includes the format extension, we
 943        # require the following two conditions to be satisfied:
 944        # - the hash input parameter MUST have been set from the $refname part
 945        #   of the URL (i.e. they must be equal)
 946        # - the snapshot format MUST NOT have been defined already (e.g. from
 947        #   CGI parameter sf)
 948        # It's also useless to try any matching unless $refname has a dot,
 949        # so we check for that too
 950        if (defined $input_params{'action'} &&
 951                $input_params{'action'} eq 'snapshot' &&
 952                defined $refname && index($refname, '.') != -1 &&
 953                $refname eq $input_params{'hash'} &&
 954                !defined $input_params{'snapshot_format'}) {
 955                # We loop over the known snapshot formats, checking for
 956                # extensions. Allowed extensions are both the defined suffix
 957                # (which includes the initial dot already) and the snapshot
 958                # format key itself, with a prepended dot
 959                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 960                        my $hash = $refname;
 961                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 962                                next;
 963                        }
 964                        my $sfx = $1;
 965                        # a valid suffix was found, so set the snapshot format
 966                        # and reset the hash parameter
 967                        $input_params{'snapshot_format'} = $fmt;
 968                        $input_params{'hash'} = $hash;
 969                        # we also set the format suffix to the one requested
 970                        # in the URL: this way a request for e.g. .tgz returns
 971                        # a .tgz instead of a .tar.gz
 972                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 973                        last;
 974                }
 975        }
 976}
 977
 978our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 979     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 980     $searchtext, $search_regexp, $project_filter);
 981sub evaluate_and_validate_params {
 982        our $action = $input_params{'action'};
 983        if (defined $action) {
 984                if (!validate_action($action)) {
 985                        die_error(400, "Invalid action parameter");
 986                }
 987        }
 988
 989        # parameters which are pathnames
 990        our $project = $input_params{'project'};
 991        if (defined $project) {
 992                if (!validate_project($project)) {
 993                        undef $project;
 994                        die_error(404, "No such project");
 995                }
 996        }
 997
 998        our $project_filter = $input_params{'project_filter'};
 999        if (defined $project_filter) {
1000                if (!validate_pathname($project_filter)) {
1001                        die_error(404, "Invalid project_filter parameter");
1002                }
1003        }
1004
1005        our $file_name = $input_params{'file_name'};
1006        if (defined $file_name) {
1007                if (!validate_pathname($file_name)) {
1008                        die_error(400, "Invalid file parameter");
1009                }
1010        }
1011
1012        our $file_parent = $input_params{'file_parent'};
1013        if (defined $file_parent) {
1014                if (!validate_pathname($file_parent)) {
1015                        die_error(400, "Invalid file parent parameter");
1016                }
1017        }
1018
1019        # parameters which are refnames
1020        our $hash = $input_params{'hash'};
1021        if (defined $hash) {
1022                if (!validate_refname($hash)) {
1023                        die_error(400, "Invalid hash parameter");
1024                }
1025        }
1026
1027        our $hash_parent = $input_params{'hash_parent'};
1028        if (defined $hash_parent) {
1029                if (!validate_refname($hash_parent)) {
1030                        die_error(400, "Invalid hash parent parameter");
1031                }
1032        }
1033
1034        our $hash_base = $input_params{'hash_base'};
1035        if (defined $hash_base) {
1036                if (!validate_refname($hash_base)) {
1037                        die_error(400, "Invalid hash base parameter");
1038                }
1039        }
1040
1041        our @extra_options = @{$input_params{'extra_options'}};
1042        # @extra_options is always defined, since it can only be (currently) set from
1043        # CGI, and $cgi->param() returns the empty array in array context if the param
1044        # is not set
1045        foreach my $opt (@extra_options) {
1046                if (not exists $allowed_options{$opt}) {
1047                        die_error(400, "Invalid option parameter");
1048                }
1049                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1050                        die_error(400, "Invalid option parameter for this action");
1051                }
1052        }
1053
1054        our $hash_parent_base = $input_params{'hash_parent_base'};
1055        if (defined $hash_parent_base) {
1056                if (!validate_refname($hash_parent_base)) {
1057                        die_error(400, "Invalid hash parent base parameter");
1058                }
1059        }
1060
1061        # other parameters
1062        our $page = $input_params{'page'};
1063        if (defined $page) {
1064                if ($page =~ m/[^0-9]/) {
1065                        die_error(400, "Invalid page parameter");
1066                }
1067        }
1068
1069        our $searchtype = $input_params{'searchtype'};
1070        if (defined $searchtype) {
1071                if ($searchtype =~ m/[^a-z]/) {
1072                        die_error(400, "Invalid searchtype parameter");
1073                }
1074        }
1075
1076        our $search_use_regexp = $input_params{'search_use_regexp'};
1077
1078        our $searchtext = $input_params{'searchtext'};
1079        our $search_regexp;
1080        if (defined $searchtext) {
1081                if (length($searchtext) < 2) {
1082                        die_error(403, "At least two characters are required for search parameter");
1083                }
1084                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
1085        }
1086}
1087
# path to the current git repository
our $git_dir;

# Set $git_dir to "$projectroot/$project" for the current request.
# When the request has no project, $git_dir is reset to undef, so that a
# process serving several requests never keeps pointing at the repository
# of an earlier one.
sub evaluate_git_dir {
        our $git_dir = $project ? "$projectroot/$project" : undef;
}
1093
our (@snapshot_fmts, $git_avatar);

# Evaluate the features whose settings are cached in globals:
# - @snapshot_fmts: the 'snapshot' feature value passed through
#   filter_snapshot_fmts()
# - $git_avatar: the 'avatar' feature value, or the empty string if it does
#   not name a usable provider
sub configure_gitweb_features {
        # list of supported snapshot formats
        our @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # are available; anything else resets $git_avatar to the empty string.
        #   gravatar - needs Digest::MD5
        #   picon    - no dependencies
        our ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'gravatar') {
                my $have_md5 = eval { require Digest::MD5; 1; };
                $git_avatar = '' if !$have_md5;
        } elsif ($git_avatar ne 'picon') {
                $git_avatar = '';
        }
}
1113
# custom error handler: 'die <message>' is Internal Server Error
#
# Registered with CGI::Carp::set_message() below; receives the error
# message, which is already HTML escaped.
sub handle_errors_html {
        my ($msg) = @_;

        # Switch back to a plain-text message first: should another error
        # occur inside die_error, this keeps us from re-entering this handler
        # in an infinite loop.
        set_message("Error occured when inside die_error:\n$msg");

        # You cannot jump out of die_error when called as error handler, and
        # the subroutine set via CGI::Carp::set_message is called _after_
        # HTTP headers are already written, so it cannot write them itself.
        my @handler_opts = (-error_handler => 1, -no_http_header => 1);
        die_error(undef, undef, $msg, @handler_opts);
}
set_message(\&handle_errors_html);
1128
# dispatch
#
# Pick the action to run and call its handler from %actions.
# When no action was requested it is derived from the other parameters:
# the type of the object named by $hash, or by "$hash_base:$file_name",
# else 'summary' if there is a project and 'project_list' otherwise.
# Errors are reported through die_error().
sub dispatch {
        if (!defined $action) {
                if (defined $hash) {
                        $action = git_get_type($hash);
                        # presumably git_get_type() yields a false value when the
                        # object cannot be resolved -- report that as "not found"
                        # rather than as an unknown action
                        $action or die_error(404, "Object does not exist");
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name");
                        $action or die_error(404, "File or directory does not exist");
                } elsif (defined $project) {
                        $action = 'summary';
                } else {
                        $action = 'project_list';
                }
        }
        # the definedness test keeps an unresolved action from being used as
        # a hash key
        if (!defined $action || !defined($actions{$action})) {
                die_error(400, "Unknown action");
        }
        if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
            !$project) {
                die_error(400, "Project needed");
        }
        $actions{$action}->();
}
1151
# Restart the per-request bookkeeping: take a fresh timestamp in $t0 (only
# if $t0 is defined, i.e. timing is in use) and zero the counter of git
# commands run.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1157
our $first_request = 1;

# Handle one request from start to finish: reset the timer, work out our
# own URLs, load configuration, check the server load, collect and validate
# the input parameters, and finally dispatch to the requested action.
sub run_request {
        reset_timer();

        evaluate_uri();

        # configuration and git version are always evaluated on the first
        # request
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }

        # $per_request_config may be a subroutine to call on every request,
        # or a true value asking for the configuration to be re-read on
        # every request after the first
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }

        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1188
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: request objects are created from CGI::Fast
# instead of CGI, and $is_last_request is replaced by a counter that
# reports true once more than 100 requests have been seen.
sub configure_as_fcgi {
        require CGI::Fast;
        $CGI = 'CGI::Fast';

        # let each child service 100 requests
        my $requests_seen = 0;
        $is_last_request = sub {
                $requests_seen++;
                return $requests_seen > 100;
        };
}
# Decide how to run based on the script name and command-line arguments.
#
# A script name ending in '.fcgi' selects FastCGI mode.  If there are
# command-line arguments, these options are recognized:
#   --fastcgi, --fcgi, -f   select FastCGI mode
#   --nproc=N, -n N         use FCGI::ProcManager with N processes, if that
#                           module can be loaded
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # option handler for 'nproc': install the process manager hooks,
        # silently doing nothing when FCGI::ProcManager is unavailable
        my $setup_proc_manager = sub {
                my ($opt_name, $n_processes) = @_;
                my $have_proc_manager = eval { require FCGI::ProcManager; 1; };
                return unless $have_proc_manager;
                my $manager = FCGI::ProcManager->new({
                        n_processes => $n_processes,
                });
                our $pre_listen_hook    = sub { $manager->pm_manage()        };
                our $pre_dispatch_hook  = sub { $manager->pm_pre_dispatch()  };
                our $post_dispatch_hook = sub { $manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        return Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $setup_proc_manager,
        );
}
1223
# Main loop: evaluate the command line, then serve requests.
#
# Each iteration creates a request object from the class named in $CGI
# ('CGI' by default, 'CGI::Fast' after configure_as_fcgi()) and handles it
# with run_request(), bracketed by the optional pre/post dispatch hooks.
# The loop ends when the constructor returns a false value or when
# $is_last_request->() returns true (by default, after the first request).
sub run {
        evaluate_argv();

        $first_request = 1;
        # optional hook, set up by the 'nproc' option in evaluate_argv()
        $pre_listen_hook->()
                if $pre_listen_hook;

 REQUEST:
        while ($cgi = $CGI->new()) {
                $pre_dispatch_hook->()
                        if $pre_dispatch_hook;

                run_request();

                $post_dispatch_hook->()
                        if $post_dispatch_hook;
                # from now on run_request() skips the first-request-only setup
                $first_request = 0;

                last REQUEST if ($is_last_request->());
        }

        # NOTE(review): nothing visible in this part of the file jumps to this
        # label; presumably it is a 'goto' target used elsewhere -- confirm
        # before renaming or removing it.
 DONE_GITWEB:
        1;
}
1248
# Start serving requests; everything below only runs once run() returns.
run();

# 'caller' is defined only when this file is being executed from within
# some other code rather than as the top-level program.
if (defined caller) {
        # wrapped in a subroutine processing requests,
        # e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
        return;
} else {
        # pure CGI script, serving single request
        exit;
}
1259
1260## ======================================================================
1261## action links
1262
# Build a gitweb URL from named parameters.
#
# Parameters are given as a list of name => value pairs, where the names
# are the long parameter names of @cgi_param_mapping (project, action,
# hash, ...).  The project defaults to the current $project unless a
# 'project' key is passed explicitly.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# Returns the URL as a string.
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot
                # (the action is optional, so check that it is there before
                # comparing it)
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        # a file name containing '..' cannot go into PATH_INFO, where
                        # '..' separates the parent part; it stays a query parameter
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly
        # (walking the ordered list, so that the query string always lists
        # parameters in the order of @cgi_param_mapping)
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1392
1393
1394## ======================================================================
1395## validation, quoting/unquoting and escaping
1396
# Return the given action name if it is a key of %actions, undef otherwise
# (also for a missing or false argument).
sub validate_action {
        my ($input) = @_;
        return undef unless $input;
        return exists $actions{$input} ? $input : undef;
}
1402
# Return the given project name if it is acceptable, undef otherwise.
# A project is acceptable when its name is a valid pathname, it is a
# directory below $projectroot, check_export_ok() approves it, and -- with
# $strict_export set -- project_in_list() approves it as well.
sub validate_project {
        my ($input) = @_;
        return undef unless $input;

        return undef unless validate_pathname($input);
        return undef unless -d "$projectroot/$input";
        return undef unless check_export_ok("$projectroot/$input");
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1414
# Return the given pathname if it is safe to use, undef otherwise (also for
# a missing or false argument).
#
# Rejected are pathnames with an empty, '.' or '..' element -- which covers
# a leading or trailing slash and doubled slashes -- and pathnames that
# contain a null character.
sub validate_pathname {
        my ($input) = @_;
        return undef unless $input;

        # empty, '.' or '..' at the beginning, at the end, or between slashes
        my $has_bad_element = $input =~ m!(^|/)(|\.|\.\.)(/|$)!;
        return undef if $has_bad_element;

        # no null characters
        return undef if $input =~ m!\0!;

        return $input;
}
1430
# Return the given ref name if it is acceptable, undef otherwise (also for
# a missing or false argument).
#
# A string of exactly 40 hexadecimal digits is accepted as is.  Anything
# else has to pass validate_pathname() and must not contain any of the
# sequences or characters rejected by the pattern below.
sub validate_refname {
        my ($input) = @_;
        return undef unless $input;

        # textual hashes are O.K.
        return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

        # it must be correct pathname
        $input = validate_pathname($input);
        return undef unless $input;

        # restrictions on ref name according to git-check-ref-format
        return undef if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

        return $input;
}
1447
# Decode a sequence of octets into Perl's internal string form (utf-8 with
# the utf8 flag set if needed).  gitweb writes its output as utf-8 thanks to
# "binmode STDOUT, ':utf8'" at the beginning of the script.
#
# A string that already carries the utf8 flag, or whose octets are valid
# utf-8, is returned decoded as utf-8; anything else is decoded using
# $fallback_encoding.  Returns undef for an undefined argument.
sub to_utf8 {
        my ($str) = @_;
        return undef unless defined $str;

        return $str
                if utf8::is_utf8($str) || utf8::decode($str);

        return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1461
# Escape a value for use in the query string of a URL.
# Unsafe characters are URI-escaped and spaces become '+'.  The slash is
# kept as it is, even though that is not strictly correct, because quoted
# slashes look too horrible in bookmarks.
# Returns undef for an undefined argument.
sub esc_param {
        my ($str) = @_;
        defined $str or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1471
# Escape a value for use in the PATH_INFO part of a URL.
# The quoting rules differ slightly from those for query parameters:
# path_info doesn't treat '+' as space (specially), so both are left alone,
# but '?' must be escaped.
# Returns undef for an undefined argument.
sub esc_path_info {
        my ($str) = @_;
        defined $str or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

        return $str;
}
1482
# Quote unsafe characters in a whole URL.  Because the argument is a
# complete URL, characters with structural meaning (such as '?', '&',
# '=', ';' and '/') cannot be quoted.  Spaces become '+'.
# Returns undef when given undef.
sub esc_url {
        my ($url) = @_;
        return undef unless defined $url;

        $url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $url =~ tr/ /+/;
        return $url;
}
1491
# Quote unsafe characters in HTML attributes.
# For XHTML conformance escaping '"' to '&quot;' is not enough, so
# the arguments are handed to esc_html() unchanged.
sub esc_attr {
        my @args = @_;
        return esc_html(@args);
}
1498
# Escape a string for inclusion in HTML text.
# The string is converted with to_utf8() and HTML-escaped via
# $cgi->escapeHTML().  With the option -nbsp => 1 every space is
# turned into '&nbsp;'.  Control characters other than tab are made
# visible with quot_cec().  Returns undef when given undef.
sub esc_html {
        my ($text, %opts) = @_;

        return undef unless defined $text;

        $text = to_utf8($text);
        $text = $cgi->escapeHTML($text);
        $text =~ s/ /&nbsp;/g if $opts{'-nbsp'};

        # tab is the only control character that is passed through
        $text =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
        return $text;
}
1514
# Quote control characters and escape a filename for HTML.
# Works like esc_html(), except that every control character,
# tab included, is made visible with quot_cec().  The option
# -nbsp => 1 turns spaces into '&nbsp;'.  Returns undef when
# given undef.
sub esc_path {
        my ($path, %opts) = @_;

        return undef unless defined $path;

        $path = to_utf8($path);
        $path = $cgi->escapeHTML($path);
        $path =~ s/ /&nbsp;/g if $opts{'-nbsp'};

        $path =~ s|([[:cntrl:]])|quot_cec($1)|eg;
        return $path;
}
1530
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0).
# The string is converted with to_utf8(); tab, line feed and carriage
# return are kept, every other control character is made visible with
# quot_cec().  Returns undef when given undef.
sub sanitize {
        my $str = shift;

        return undef unless defined $str;

        $str = to_utf8($str);
        # index() is used instead of a nested pattern match on purpose:
        # a successful inner match without capture groups would leave $1
        # undefined, and the character that was meant to be kept would
        # be replaced by nothing.
        $str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
        return $str;
}
1541
# Make control characters "printable", using character escape codes (CEC).
# Characters with a well-known C escape are shown as that escape; all
# others are shown as a backslash followed by two hexadecimal digits.
# By default the result is wrapped in <span class="cntrl">...</span>;
# pass -nohtml => 1 to get the bare escape text.
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # zero-pad the hex code: '%2x' would pad with a space and render
        # e.g. chr(1) as backslash, space, '1'
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1566
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR).
# Returns a decimal numeric character reference for the picture that
# corresponds to the given control character, wrapped in
# <span class="cntrl">...</span> unless -nohtml => 1 is passed.
sub quot_upr {
        my $cntrl = shift;
        my %opts = @_;

        my $code = ord($cntrl);
        # The pictures for C0 controls sit at U+2400 + code, but the
        # picture for DEL (0x7F) is U+2421, not U+247F.
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1580
# git may return quoted and escaped filenames.
# A string enclosed in double quotes has the quotes removed and its
# backslash escapes expanded with unq(); any other string is returned
# unchanged.
sub unquote {
        my ($name) = @_;

        # nothing to do unless the whole string is wrapped in quotes
        return $name unless $name =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}

# Helper for unquote(): expand the text that followed a backslash.
# One to three octal digits give the character with that code, a
# known C escape letter gives its control character, and any other
# character stands for itself.
sub unq {
        my $seq = shift;
        my %es = ( # character escape codes, aka escape sequences
                't' => "\t",   # tab            (HT, TAB)
                'n' => "\n",   # newline        (NL)
                'r' => "\r",   # return         (CR)
                'f' => "\f",   # form feed      (FF)
                'b' => "\b",   # backspace      (BS)
                'a' => "\a",   # alarm (bell)   (BEL)
                'e' => "\e",   # escape         (ESC)
                'v' => "\013", # vertical tab   (VT)
        );

        # octal char sequence
        return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

        # C escape sequence, aka character escape code
        return $es{$seq} if exists $es{$seq};

        # quoted ordinary character
        return $seq;
}
1616
# escape tabs (convert tabs to spaces)
# Each tab is replaced by as many spaces as are needed to reach the
# next multiple of 8 columns, working from left to right.
sub untabify {
        my ($text) = @_;
        my $tab_width = 8;

        for (;;) {
                my $at = index($text, "\t");
                last if $at == -1;
                # the padding is always between 1 and 8 spaces
                substr($text, $at, 1, ' ' x ($tab_width - ($at % $tab_width)));
        }

        return $text;
}
1630
# Count the entries returned by git_get_projects_list() whose 'path'
# equals $project.  The result is 0 (false) when the list is empty or
# contains no such entry.
sub project_in_list {
        my ($project) = @_;
        my @known = git_get_projects_list();
        my $matches = grep { $_->{'path'} eq $project } @known;
        return $matches;
}
1636
1637## ----------------------------------------------------------------------
1638## HTML aware string manipulation
1639
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# $add_len defaults to 10.  $where selects which part is dropped and
# replaced by the filler: 'left', 'center' or 'right' (the default).
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # return early if chopping wouldn't make string shorter;
        # the filler is 5 characters in the middle and 4 at either end
        my $centered   = ($where eq 'center');
        my $filler_len = $centered ? 5 : 4;
        return $str if ($len + $filler_len >= length($str));

        # when chopping in the middle, distribute $len into left and right part
        $len = int($len/2) if $centered;

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                $str =~ m/^(.*?)($begre)$/;
                my ($lead, $body) = ($1, $2);
                $lead = " ..." if length($lead) > 4;
                return $lead . $body;
        }

        if ($centered) {
                $str =~ m/^($endre)(.*)$/;
                my ($left, $rest) = ($1, $2);
                $rest =~ m/^(.*?)($begre)$/;
                my ($mid, $right) = ($1, $2);
                $mid = " ... " if length($mid) > 5;
                return $left . $mid . $right;
        }

        # default: keep the beginning, drop the end
        $str =~ m/^($endre)(.*)$/;
        my ($body, $tail) = ($1, $2);
        $tail = "... " if length($tail) > 4;
        return $body . $tail;
}
1699
# takes the same arguments as chop_str, but also wraps a <span> around the
# result with a title attribute if it does get chopped. Additionally, the
# string is HTML-escaped.  In the title, control characters of the full
# string are replaced by '?'.
sub chop_and_escape_str {
        my ($full) = @_;

        my $chopped = chop_str(@_);
        $full = to_utf8($full);

        # nothing was cut off: no title needed
        return esc_html($chopped) if $chopped eq $full;

        $full =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$full}, esc_html($chopped));
}
1715
1716## ----------------------------------------------------------------------
1717## functions returning short strings
1718
# CSS class for given age value (in seconds):
# "noage" for undef, "age0" below two hours, "age1" below two days,
# and "age2" for anything older.
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1733
# convert age in seconds to "nn units ago" string
# The largest unit of which the age spans more than two is used:
# years, months (a twelfth of 365 days), weeks, days, hours, minutes
# or seconds.  Ages of two seconds or less give " right now".
sub age_string {
        my ($age) = @_;

        return int($age/60/60/24/365) . " years ago"
                if $age > 60*60*24*365*2;
        return int($age/60/60/24/(365/12)) . " months ago"
                if $age > 60*60*24*(365/12)*2;
        return int($age/60/60/24/7) . " weeks ago"
                if $age > 60*60*24*7*2;
        return int($age/60/60/24) . " days ago"
                if $age > 60*60*24*2;
        return int($age/60/60) . " hours ago"
                if $age > 60*60*2;
        return int($age/60) . " min ago"
                if $age > 60*2;
        return int($age) . " sec ago"
                if $age > 2;

        return " right now";
}
1765
# file type bit patterns used by git in addition to those from Fcntl
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference
# True when the file type bits of $mode equal S_IFGITLINK.
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = $mode & S_IFMT();
        return $type_bits == S_IFGITLINK;
}
1777
# convert file mode in octal to symbolic file mode string
# The argument is a string of octal digits.  The result is a fixed
# ten-character string chosen by file type; for regular files only
# the owner's executable bit makes a difference.
sub mode_str {
        my $mode = oct shift;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
        return 'lrwxrwxrwx' if S_ISLNK($mode);

        if (S_ISREG($mode)) {
                # git cares only about the executable bit
                return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
        }

        return '----------';
}
1799
# convert file mode in octal to file type string
# An argument that does not consist solely of octal digits is
# returned unchanged.  Otherwise the result is one of "submodule",
# "directory", "symlink", "file" or "unknown".
sub file_type {
        my ($mode) = @_;

        # not an octal mode: hand it back as it is
        return $mode if $mode !~ m/^[0-7]+$/;

        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT());
        return "symlink"   if S_ISLNK($mode);
        return "file"      if S_ISREG($mode);
        return "unknown";
}
1822
# convert file mode in octal to file type description string
# Like file_type(), except that a regular file with the owner's
# executable bit set is described as "executable".  An argument that
# does not consist solely of octal digits is returned unchanged.
sub file_type_long {
        my ($mode) = @_;

        # not an octal mode: hand it back as it is
        return $mode if $mode !~ m/^[0-7]+$/;

        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT());
        return "symlink"   if S_ISLNK($mode);

        if (S_ISREG($mode)) {
                return ($mode & S_IXUSR) ? "executable" : "file";
        }

        return "unknown";
}
1849
1850
1851## ----------------------------------------------------------------------
1852## functions returning short HTML fragments, or transforming HTML fragments
1853## which don't belong to other sections
1854
# format line of commit message.
# The line is HTML-escaped with spaces turned into '&nbsp;', and every
# run of 8 to 40 hexadecimal digits standing as a word of its own is
# turned into a link to the "object" action for that hash.
sub format_log_line_html {
        my ($line) = @_;

        my $html = esc_html($line, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                $cgi->a({-href  => href(action=>"object", hash=>$1),
                         -class => "text"},
                        $1);
        }eg;

        return $html;
}
1867
# format marker of refs pointing to given object
#
# $refs maps object ids to lists of ref names (for example
# "tags/v2.6.11" or "heads/next"; a trailing "^{}" marks an indirect
# ref).  Returns one <span> per ref of $id, all wrapped in
# <span class="refs">, or an empty string when $id has no refs.
# The lists in $refs are left unmodified.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $entry (@{$refs->{$id}}) {
                        # Work on a copy: the loop variable aliases the element
                        # of the caller's list, and stripping "^{}" from it
                        # would make a later call for the same id treat an
                        # annotated tag as an ordinary ref.
                        my $ref = $entry;

                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name);
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, $name);

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1927
# format, perhaps shortened and with markers, title line
# Produces a link to $href with class "list subject".  When $short is
# shorter than $long, the link text is $short and the full text (with
# control characters replaced by '?') goes into the title attribute;
# otherwise the link text is $long.  $extra, if given, is appended
# after the link as it is.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my $shortened = (length($short) < length($long));

        unless ($shortened) {
                return $cgi->a({-href => $href, -class => "list subject"},
                               esc_html($long)) . $extra;
        }

        $long =~ s/[[:cntrl:]]/?/g;
        return $cgi->a({-href  => $href,
                        -class => "list subject",
                        -title => to_utf8($long)},
                       esc_html($short)) . $extra;
}
1943
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines, which are free to use it as
# preferred. Since only one avatar engine is used for any given page,
# there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first; the resulting URL is stored in
# %avatar_cache under the lowercased email.
sub picon_url {
        my $email = lc shift;

        # already computed for this email
        return $avatar_cache{$email} if $avatar_cache{$email};

        my ($user, $domain) = split('@', $email);
        my $url = "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/"
                . "$domain/$user/"
                . "users+domains+unknown/up/single";
        $avatar_cache{$email} = $url;

        return $avatar_cache{$email};
}
1965
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
# The email is lowercased before it is hashed and used as cache key.
sub gravatar_url {
        my ($email, $size) = @_;
        $email = lc $email;

        unless ($avatar_cache{$email}) {
                $avatar_cache{$email} = "http://www.gravatar.com/avatar/"
                        . Digest::MD5::md5_hex($email)
                        . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1978
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
# Options: -size names an entry of %avatar_size ('default' is used when
# it is missing or unknown); -pad_before / -pad_after add a '&nbsp;'
# before / after the image.  Returns an <img> element, or an empty
# string when $git_avatar selects no known provider.
sub git_get_avatar {
        my ($email, %opts) = @_;
        my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
        my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

        # Other providers can be added by extending the if chain, defining $url
        # as needed. If no variant puts something in $url, we assume avatars
        # are completely disabled/unavailable.
        my $url = "";
        if ($git_avatar eq 'gravatar') {
                $url = gravatar_url($email, $size);
        } elsif ($git_avatar eq 'picon') {
                $url = picon_url($email);
        }

        return "" unless $url;

        my $img = "<img width=\"$size\" "
                . "class=\"avatar\" "
                . "src=\"" . esc_url($url) . "\" "
                . "alt=\"\" "
                . "/>";
        return $pre_white . $img . $post_white;
}
2007
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype is passed on as the search type; 'author' and
# 'committer' also choose the verb used in the link title.  When the
# 'search' feature is not enabled, $displaytext is returned as it is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        return $displaytext unless gitweb_check_feature('search');

        my $performed = "";
        if ($searchtype eq 'author') {
                $performed = "authored";
        } elsif ($searchtype eq 'committer') {
                $performed = "committed";
        }

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                                      searchtext=>$author,
                                      searchtype=>$searchtype),
                        class => "list",
                        title => "Search for commits $performed by $author"},
                       $displaytext);
}
2030
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str).
# The result is a <$tag class="author"> element holding the author's
# avatar followed by the name, both passed through
# format_search_author().
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $author = chop_and_escape_str($co->{'author_name'}, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $linked = format_search_author($co->{'author_name'}, "author",
                                          $avatar . $author);

        return "<$tag class=\"author\">" . $linked . "</$tag>";
}
2044
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
# The file names at the end of the line are replaced by escaped names
# taken from $from and $to, each linked when the respective 'href' is
# set.  The result is wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # link $text to the href of the given side, if it has one
        my $path_html = sub {
                my ($side, $text) = @_;
                return $text unless $side->{'href'};
                return $cgi->a({-href => $side->{'href'}, -class => "path"},
                               $text);
        };

        if ($diffinfo->{'nparents'}) {
                # combined diff; without href the file was deleted
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $path_html->($to, esc_path($to->{'file'}));
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                # without href the file was added
                $line .= $path_html->($from, 'a/' . esc_path($from->{'file'}));
                $line .= ' ';
                # without href the file was deleted
                $line .= $path_html->($to, 'b/' . esc_path($to->{'file'}));
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2080
# format extended diff header line, before patch itself
# Handles three kinds of content: the path on "copy/rename from/to"
# lines, a trailing six-digit mode, and the hashes on "index" lines
# (which are shortened to 7 characters and linked where an href is
# available).  The returned line ends with "<br/>\n".
sub format_extended_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                 esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }

        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }

        # match <hash>
        my $no_hash = '0' x 7;
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                my @parent_links;
                for my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $link = $no_hash;
                        if ($from->{'href'}[$i]) {
                                $link = $cgi->a({-href=>$from->{'href'}[$i],
                                                 -class=>"hash"},
                                                substr($diffinfo->{'from_id'}[$i],0,7));
                        }
                        push @parent_links, $link;
                }

                my $to_link = $no_hash;
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                }

                $line = 'index ' . join(',', @parent_links) . '..' . $to_link;

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff
                my $from_link = $no_hash;
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                }
                my $to_link = $no_hash;
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2146
# format from-file/to-file diff header
# Returns one <div class="diff from_file"> per parent (a single one for
# an ordinary diff) followed by one <div class="diff to_file">.
# File names are escaped and linked where an href is available;
# "/dev/null" lines get no extra formatting.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my $result = '';

        #assert($from_line =~ m/^---/) if DEBUG;
        if ($diffinfo->{'nparents'}) {
                # combined diff (merge commit): one line per parent
                for my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $line = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                $line = '--- ' .
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1) .
                                        '/' .
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                        }
                        $result .= qq!<div class="diff from_file">$line</div>\n!;
                }
        } else {
                # ordinary (single parent) diff
                my $line = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($line =~ m!^--- "?a/!) {
                        my $path = esc_path($from->{'file'});
                        if ($from->{'href'}) {
                                $path = $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                                $path);
                        }
                        $line = '--- a/' . $path;
                }
                $result .= qq!<div class="diff from_file">$line</div>\n!;
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        my $line = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($line =~ m!^\+\+\+ "?b/!) {
                my $path = esc_path($to->{'file'});
                if ($to->{'href'}) {
                        $path = $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                        $path);
                }
                $line = '+++ b/' . $path;
        }
        $result .= qq!<div class="diff to_file">$line</div>\n!;

        return $result;
}
2212
# create note for patch simplified by combined diff
# Emits a "diff --cc <file>" header followed by a "Simple merge" note.
# The file name links to the blob unless is_deleted() reports the
# file as deleted.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $path;
        if (is_deleted($diffinfo)) {
                $path = esc_path($diffinfo->{'to_file'});
        } else {
                $path = $cgi->a({-href => href(action=>"blob",
                                               hash_base=>$hash,
                                               hash=>$diffinfo->{'to_id'},
                                               file_name=>$diffinfo->{'to_file'}),
                                 -class => "path"},
                                esc_path($diffinfo->{'to_file'}));
        }

        my $header = "<div class=\"diff header\">" .
                     "diff --cc " .
                     $path .
                     "</div>\n"; # class="diff header"
        my $note   = "<div class=\"diff nodifferences\">" .
                     "Simple merge" .
                     "</div>\n"; # class="diff nodifferences"

        return $header . $note;
}
2237
# Return the CSS class for a line of diff output: "chunk_header",
# "incomplete", "ctx", "add" or "rem", or an empty string when nothing
# matches.  For a combined diff ($from->{'href'} is an array reference)
# the number of leading sign columns equals the number of entries in
# that array; for an ordinary diff it is 1.
sub diff_line_class {
        my ($line, $from, $to) = @_;

        # ordinary diff
        my $num_sign = 1;
        # combined diff
        if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
                $num_sign = scalar @{$from->{'href'}};
        }

        # (pattern, class) pairs, tried in this order
        my @rules = (
                [ qr/^\@\@{$num_sign} /, "chunk_header" ],
                [ qr/^\\/,               "incomplete"   ],
                [ qr/^ {$num_sign}/,     "ctx"          ],
                # classifier for context must come before classifier add/rem,
                # or we would have to use more complicated regexp, for example
                # qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
                [ qr/^[+ ]{$num_sign}/,  "add"          ],
                [ qr/^[- ]{$num_sign}/,  "rem"          ],
        );
        foreach my $rule (@rules) {
                my ($regexp, $class) = @{$rule};
                return $class if ($line =~ $regexp);
        }

        # fallback
        return "";
}
2266
# assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for unified diff
#
# The "-start,count" and "+start,count" ranges are each linked to the
# "#l<start>" anchor of the respective file when an href is available;
# the text after the closing "@@" is HTML-escaped into a separate
# <span class="section">.
sub format_unidiff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($from_text, $from_start, $from_lines,
            $to_text,   $to_start,   $to_lines,
            $section) =
                $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

        $from_lines = 0 unless defined $from_lines;
        $to_lines   = 0 unless defined $to_lines;

        if ($from->{'href'}) {
                $from_text = $cgi->a({-href  => $from->{'href'} . "#l" . $from_start,
                                      -class => "list"},
                                     $from_text);
        }
        if ($to->{'href'}) {
                $to_text = $cgi->a({-href  => $to->{'href'} . "#l" . $to_start,
                                    -class => "list"},
                                   $to_text);
        }

        my $info = '<span class="chunk_info">@@ ' . $from_text . ' ' . $to_text . ' @@</span>';
        my $rest = '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
        return $info . $rest;
}
2290
# Format the chunk header line of a combined diff
# ("@@@ -<range> -<range> +<range> @@@<section>") as HTML.
#
# The caller must pass a $line that really is such a header, together
# with defined and correctly filled $from and $to hashes.  The last range
# belongs to the "to" side; every earlier range is linked through the
# entry of $from->{'href'} with the same index, when that entry is set.
sub format_cc_diff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

        # split every range into start line and line count; the leading
        # sign is dropped and a missing count defaults to 0
        my @range_text = split(' ', $ranges);
        my (@range_start, @range_nlines);
        foreach my $idx (0 .. $#range_text) {
                ($range_start[$idx], $range_nlines[$idx]) =
                        (split(',', substr($range_text[$idx], 1)), 0);
        }

        # the last range describes the "to" side
        my $to_text   = pop @range_text;
        my $to_start  = pop @range_start;
        my $to_nlines = pop @range_nlines;

        my @pieces;
        foreach my $idx (0 .. $#range_text) {
                my $parent_href = $from->{'href'}[$idx];
                push @pieces, $parent_href
                        ? scalar($cgi->a({-href=>"$parent_href#l$range_start[$idx]",
                                          -class=>"list"}, $range_text[$idx]))
                        : $range_text[$idx];
        }
        push @pieces, $to->{'href'}
                ? scalar($cgi->a({-href=>"$to->{'href'}#l$to_start",
                                  -class=>"list"}, $to_text))
                : $to_text;

        return "<span class=\"chunk_info\">$prefix " . join(' ', @pieces) . " $prefix</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2329
# Process one line of a patch body (not meant for diff headers).
#
# Returns a two-element list: the CSS class of the line, as given by
# diff_line_class(), and the HTML-formatted (but not wrapped) line.
# Chunk headers are only formatted specially when both $from and $to
# are given.
sub process_diff_line {
        my ($line, $from, $to) = @_;

        # classify the raw line, before it is chomped and untabified
        my $diff_class = diff_line_class($line, $from, $to);

        chomp $line;
        $line = untabify($line);

        if ($from && $to) {
                if ($line =~ m/^\@{2} /) {
                        my $header = format_unidiff_chunk_header($line, $from, $to);
                        return ($diff_class, $header);
                }
                if ($line =~ m/^\@{3}/) {
                        my $header = format_cc_diff_chunk_header($line, $from, $to);
                        return ($diff_class, $header);
                }
        }

        return ($diff_class, esc_html($line, -nbsp=>1));
}
2352
# Build the snapshot link(s) for the tree or commit given by $hash.
#
# Depending on how many formats are listed in @snapshot_fmts, returns
#  - undef when there are none,
#  - a single "_snapshot_" link whose tooltip names the format, or
#  - "snapshot (_tar.gz_ _zip_)", a parenthesized list of links each
#    labelled with the display name of its format.
sub format_snapshot_links {
        my ($hash) = @_;
        my $num_fmts = @snapshot_fmts;

        # no snapshot formats at all
        return undef unless ($num_fmts >= 1);

        if ($num_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                my $fmt = $snapshot_fmts[0];
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # Several formats: one link per format, bearing the format name.
        my @links;
        foreach my $fmt (@snapshot_fmts) {
                push @links, $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                )
                        }, $known_snapshot_formats{$fmt}{'display'});
        }
        return "snapshot (" . join(' ', @links) . ")";
}
2387
2388## ......................................................................
2389## functions returning values to be passed, perhaps after some
2390## transformation, to other functions; e.g. returning arguments to href()
2391
# Return a hash of parameters to be passed to href() in order to build
# the URL of a feed; the '-title' key holds a description of the link.
#
# The optional argument is the feed format (default 'Atom'); its
# lowercased form becomes the 'action'.  Returns nothing when no project
# is selected or when the current action has no specific feed.
sub get_feed_info {
        my $format = shift || 'Atom';

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use the 'refs/heads/' prefix (full name) to tell them
        # apart from tag links; this also makes it possible to detect
        # branch links
        my $branch;
        if (defined $hash_base && $hash_base =~ m!^refs/heads/(.*)$!) {
                $branch = $1;
        } elsif (defined $hash && $hash =~ m!^refs/heads/(.*)$!) {
                $branch = $1;
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type  = "history of $file_name";
                $type .= "/" if ($action eq 'tree');
                $type .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $type = "log of $branch";
        } else {
                $type = 'log';
        }

        my %res = (
                action      => lc($format),
                -title      => $type,
                'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
                'file_name' => $file_name,
        );
        return %res;
}
2427
2428## ----------------------------------------------------------------------
2429## git utility subroutines, invoking git commands
2430
# Return, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Every call is counted
# in $number_of_git_cmds.
sub git_cmd {
        ++$number_of_git_cmds;
        return ($GIT, "--git-dir=$git_dir");
}
2436
# Quote the given arguments so that they can be passed to the shell as
# one command line.  Each argument is wrapped in single quotes; embedded
# "'" and "!" characters are moved outside the quotes and backslashed:
#   quote_command("command", "arg 1", "arg with ' and ! characters")
#   => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $arg (@_) {
                (my $word = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$word'";
        }
        return join(' ', @quoted);
}
2445
# Resolve HEAD of the given project to a hash; thin wrapper around
# git_get_full_hash().
sub git_get_head_hash {
        my $proj = shift;
        return git_get_full_hash($proj, 'HEAD');
}
2450
# Resolve a revision of a project to a hash; all arguments are handed
# unchanged to git_get_hash().
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2454
# Like git_get_full_hash(), but appends '--short=7' to the arguments
# handed to git_get_hash().
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2458
# Run "git rev-parse --verify -q <options> <hash>" in the repository of
# $project (a path below $projectroot) and return the first line of its
# output without the trailing newline, or undef when the command cannot
# be started or prints nothing.
#
# $git_dir is pointed at the project for the duration of the call and is
# put back afterwards, but only if it was defined beforehand.
sub git_get_hash {
        my ($project, $hash, @options) = @_;

        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        my $resolved;
        my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @cmd) {
                $resolved = <$fd>;
                chomp $resolved if defined $resolved;
                close $fd;
        }

        $git_dir = $saved_git_dir if (defined $saved_git_dir);
        return $resolved;
}
2475
# Return the type of the given object, i.e. the first output line of
# "git cat-file -t <hash>" without the trailing newline.  Returns
# nothing when the command cannot be started or when closing its pipe
# reports a failure.
sub git_get_type {
        my $hash = shift;

        my $fd;
        unless (open $fd, "-|", git_cmd(), "cat-file", '-t', $hash) {
                return;
        }
        my $type = <$fd>;
        return unless (close $fd);

        chomp $type;
        return $type;
}
2486
# repository configuration cache: %config holds the parsed configuration
# and $config_file the name of the config file it was loaded for
# (both are maintained by git_get_project_config)
our ($config_file, %config);
$config_file = '';
2490
# Store $value under $key in the hash referenced by $hash, keeping any
# value that is already there.  The first value of a key is stored
# directly (not as [ <value> ]); a second value turns the entry into an
# anonymous array, and further values are appended to that array.
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key} && ref $hash->{$key}) {
                # already multi-valued: append
                push @{$hash->{$key}}, $value;
        } elsif (exists $hash->{$key}) {
                # second value: promote the single value to a list
                $hash->{$key} = [ $hash->{$key}, $value ];
        } else {
                # first value: store as is
                $hash->{$key} = $value;
        }
}
2504
# Return the configuration of the current repository as a hash, read
# from "git config -z -l".  Keys that occur more than once are stored as
# array references (see hash_set_multi).
#
# The optional $section_regexp limits the result to keys of matching
# sections, e.g. 'gitweb'.  Returns nothing when the git command cannot
# be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  The /o modifier must
        # not be used here: it would freeze the regexp of the very first
        # call for the lifetime of the process, so a later call with a
        # different section would silently filter with the old one.
        my $section_re;
        $section_re = qr/^(?:$section_regexp)\./
                if (defined $section_regexp);

        # records of "git config -z" are NUL-terminated
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline;
                # a key without a value has no newline at all
                my ($key, $value) = split(/\n/, $keyval, 2);

                hash_set_multi(\%config, $key, $value)
                        if (!defined $section_re || $key =~ $section_re);
        }
        close $fh;

        return %config;
}
2527
# Convert a config value to a Perl boolean (a true or a false value).
# No value at all (undef), a number greater than zero, and 'true' or
# 'yes' in any letter case are true; every other value is treated as
# false (never as an error).  Surrounding whitespace is ignored.
sub config_to_bool {
        my $val = shift;

        return 1 if !defined $val;             # section.key

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        # section.key = 1
        # The comparison has to be numeric: a string such as "00" is a
        # true value for Perl although it denotes zero.
        return $val if ($val =~ /^\d+$/ && $val != 0);

        # section.key = true
        return scalar($val =~ /^(?:true|yes)$/i);
}
2543
# Convert a config value to a simple decimal number.  An optional
# suffix of 'k', 'm' or 'g' (in either letter case) causes the number
# to be multiplied by 1024, 1048576 or 1073741824.  Surrounding
# whitespace is stripped; a value without such a suffix is returned
# otherwise unchanged.
sub config_to_int {
        my $val = shift;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier = (
                k =>       1024,
                m =>    1048576,
                g => 1073741824,
        );
        if ($val =~ /^([0-9]*)([kmg])$/i) {
                return $1 * $multiplier{lc($2)};
        }
        return $val;
}
2563
# Convert a config value to an array reference, if needed: a reference
# is returned as is, a defined plain value is wrapped in a one-element
# array, and undef becomes an empty array.
sub config_to_multi {
        my $val = shift;

        return $val     if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2570
# Return the value of the gitweb.<key> configuration variable of the
# current repository ($git_dir).
#
# $key may be given with or without the 'gitweb.' prefix.  $type may be
# 'bool' or 'int' (optionally written '--bool' / '--int'); any other
# type is ignored.  With 'bool' the string 'true' or 'false' is
# returned, with 'int' the result of config_to_int(), otherwise the
# stored value as is.  Returns nothing when $git_dir is not set, when
# the key is empty or malformed, or when the variable does not exist.
#
# The parsed 'gitweb' section is cached in %config and reloaded only
# when $git_dir changes.
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        # only subsection, if exists, is case sensitive,
        # and not lowercased by 'git config -z -l'
        if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
                $key = join(".", lc($1), $2, lc($3));
        } else {
                $key = lc($key);
        }
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        unless ($type eq 'bool' || $type eq 'int');
        }

        # (re)load the config when it was read for another repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $name = "gitweb.$key";
        return unless exists $config{$name};
        my $value = $config{$name};

        # ensure given type
        return $value unless (defined $type);
        # backward compatibility: 'git config --bool' returns true/false
        return config_to_bool($value) ? 'true' : 'false'
                if ($type eq 'bool');
        # the only type left is 'int'
        return config_to_int($value);
}
2616
# Get the hash of the entry at the given path in the given ref.
#
# $base is the tree-ish to look in and $path the path of the entry
# (trailing slashes are ignored).  When $type is given, the entry must
# be of that type.  Returns the hash, or undef when no path was given,
# when "git ls-tree" fails or finds nothing, when its output cannot be
# parsed, or when the type does not match.  Calls die_error() when the
# command cannot be started.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Take the captures straight from the match: reading $2 and $3
        # after a failed match would yield leftovers of an earlier one.
        my ($entry_type, $entry_hash) =
                ($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/);
        if (!defined $entry_hash) {
                # unexpected output format
                return undef;
        }

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2643
# Get the path of the entry with the given hash in the given tree-ish
# (ref), by scanning the output of "git ls-tree -r -t -z".  Used to get
# the 'from' filename of renames in a combined diff (merge commit).
# Returns the path of the first matching entry, or undef when there is
# none or the command cannot be started; returns nothing when $base or
# $hash is missing.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # entries of "ls-tree -z" are NUL-terminated
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;

        my $found;
        while (my $entry = <$fd>) {
                chomp $entry;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                next unless ($entry =~ m/(?:[0-9]+) (?:.+) $hash\t(.+)$/);
                $found = $1;
                last;
        }
        close $fd;

        return $found;
}
2667
2668## ......................................................................
2669## git utility functions, directly accessing git repository
2670
# Get the value of a config variable of the project at $path, either
# from the first line of the file named like the variable in the
# repository ($GIT_DIR/$name), or, when that file cannot be opened,
# from the gitweb.$name variable of the repository config file.
# Sets $git_dir to the repository of the project.
sub git_get_file_or_project_config {
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/$name") {
                return git_get_project_config($name);
        }
        my $conf = <$fd>;
        close $fd;

        chomp $conf if (defined $conf);
        return $conf;
}
2687
# Return the 'description' of the project at the given path, as found
# by git_get_file_or_project_config().
sub git_get_project_description {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'description');
}
2692
# Return the 'category' of the project at the given path, as found
# by git_get_file_or_project_config().
sub git_get_project_category {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'category');
}
2697
2698
# Return a hash reference mapping the content tags ('ctags') of the
# given project to their weights.  Sets $git_dir to the repository of
# the project.
#
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        my $val = <$ct>;
                        chomp $val if defined $val;
                        close $ct;

                        # the tag is named after the file
                        (my $ctag = $tagfile) =~ s#.*/##;
                        # an empty file yields no line at all, so $val
                        # may be undefined here
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2745
# Return a hash reference whose keys are content tags ('ctags') and
# whose values are the sums of the weights of that tag over all the
# given projects.  $projects is a reference to a list of project hashes,
# each holding its own tags under 'ctags'.
sub git_gather_all_ctags {
        my $projects = shift;
        my %weight_of;

        for my $proj (@$projects) {
                $weight_of{$_} += $proj->{'ctags'}->{$_}
                        for (keys %{$proj->{'ctags'}});
        }

        return \%weight_of;
}
2760
# Build a tag cloud out of a { <tag> => <weight> } hash reference.
#
# Tags that differ only in letter case are merged: their weights are
# added up and the spelling with the largest weight is displayed.  The
# tag equal to the 'by_tag' CGI parameter is wrapped in
# <span class="match">.
#
# Returns an HTML::TagCloud object when that module can be loaded;
# otherwise a hash reference keyed by lowercased tag, each entry holding
# the total 'count' and the link HTML under 'ctag'.
sub git_populate_project_tagcloud {
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $merged = ($ctags_lc{lc $tag} ||= {});
                $merged->{count} += $weight;
                unless ($merged->{topcount} && $merged->{topcount} >= $weight) {
                        $merged->{topcount} = $weight;
                        $merged->{topname}  = $tag;
                }
        }

        my $matched = $cgi->param('by_tag');
        # mark up the title of the currently selected tag, if there is one
        my $mark_match = sub {
                my ($ctag, $title) = @_;
                return $title unless (defined $matched && $matched eq $ctag);
                return qq(<span class="match">$title</span>);
        };

        my $cloud;
        if (eval { require HTML::TagCloud; 1; }) {
                $cloud = HTML::TagCloud->new;
                foreach my $ctag (sort keys %ctags_lc) {
                        # Pad the title with spaces so that the cloud looks
                        # less crammed.
                        my $title = esc_html($ctags_lc{$ctag}->{topname});
                        $title =~ s/ /&nbsp;/g;
                        $title =~ s/^/&nbsp;/g;
                        $title =~ s/$/&nbsp;/g;
                        $cloud->add($mark_match->($ctag, $title),
                                    href(project=>undef, ctag=>$ctag),
                                    $ctags_lc{$ctag}->{count});
                }
        } else {
                $cloud = {};
                foreach my $ctag (keys %ctags_lc) {
                        my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
                        $title = $mark_match->($ctag, $title);
                        $cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
                        $cloud->{$ctag}{ctag} =
                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                }
        }
        return $cloud;
}
2806
# Render a tag cloud built by git_populate_project_tagcloud() as HTML,
# limited to $count tags.
#
# An HTML::TagCloud object renders itself.  The fallback hash is shown
# as a comma-separated list of the tag links inside a
# <div id="htmltagcloud">, centered when no project is selected.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                # Sort by descending weight, so that cutting the list down
                # to $count entries keeps the most used tags, not the
                # least used ones.
                my @tags = sort { $cloud->{$b}->{'count'} <=> $cloud->{$a}->{'count'} } keys %$cloud;
                return
                        '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
                        join (', ', map {
                                $cloud->{$_}->{'ctag'}
                        } splice(@tags, 0, $count)) .
                        '</div>';
        }
}
2821
# Return the URLs of the project at the given path: the lines of its
# $GIT_DIR/cloneurl file or, when that file cannot be opened, the values
# of the gitweb.url config variable.  Returns a list in list context
# and an array reference otherwise.  Sets $git_dir to the repository of
# the project.
sub git_get_project_url_list {
        my $path = shift;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/cloneurl") {
                my $config_urls = config_to_multi(git_get_project_config('url'));
                return wantarray ? @$config_urls : $config_urls;
        }
        my @git_project_url_list = <$fd>;
        chomp @git_project_url_list;
        close $fd;

        return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2835
# Return the list of projects as hashes with a 'path' key (and an
# 'owner' key when the list is read from a file).
#
# When $projects_list is a directory it is searched for repositories
# that pass check_export_ok(); when it is a file, the projects are read
# from it, one url-encoded "<path> <owner>" entry per line.
#
# $filter   - optional; only projects below this subdirectory are listed
# $paranoid - optional; when searching a directory, do not start the
#             search in the $filter subdirectory but search everything
#             and match each path found against $filter
sub git_get_projects_list {
        my $filter = shift || '';
        my $paranoid = shift;
        my @list;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter && !$paranoid) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # paranoidly only filter here
                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
                                        # this is a subroutine, not a loop body:
                                        # leave it with 'return', not 'next'
                                        return;
                                }
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next PROJECT;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next PROJECT;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
2917
# Return the given projects without those that are forks of another
# project in the list.  A project is a fork when its path lies below the
# directory of another project, e.g. 'repo/fork.git' is a fork of
# 'repo.git' provided the directory 'repo' exists under $projectroot.
# As a side effect, the 'forks' field of every project that can have
# forks is set to the list of its forks.
#
# Written with the help of the Tree::Trie module (Perl Artistic License,
# GPL compatible).
sub filter_forks_from_projects_list {
        my $projects = shift;

        my %trie; # prefix tree of directories (path components)
        # generate trie out of those directories that might contain forks
        foreach my $pr (@$projects) {
                my $path = $pr->{'path'};
                $path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
                next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
                next unless ($path);      # skip '.git' repository: tests, git-instaweb
                next unless (-d "$projectroot/$path"); # containing directory exists
                $pr->{'forks'} = [];      # there can be 0 or more forks of project

                # add to trie: follow the nodes that are already there and
                # create the missing ones on the way down
                my $node = \%trie;
                foreach my $dir (split('/', $path)) {
                        $node = ($node->{$dir} ||= {});
                }
                # create end marker, store $pr as a data
                $node->{''} = $pr unless (exists $node->{''});
        }

        # filter out forks, by finding shortest prefix match for paths
        my @filtered;
        foreach my $pr (@$projects) {
                # trie lookup
                my $node = \%trie;
                my $parent; # the project that $pr is a fork of, if any
                foreach my $dir (split('/', $pr->{'path'})) {
                        if (exists $node->{''}) {
                                # found [shortest] prefix, is a fork
                                $parent = $node->{''};
                                last;
                        }
                        # not in trie, cannot have prefix, not a fork
                        last unless (exists $node->{$dir});
                        # If the dir is there, we just walk one step down the trie.
                        $node = $node->{$dir};
                }

                if ($parent) {
                        # a fork is recorded with its parent and left out
                        push @{$parent->{'forks'}}, $pr;
                } else {
                        # no match, or we ran out of trie
                        # (shouldn't happen: it's either no match, or end marker)
                        push @filtered, $pr;
                }
        }

        return @filtered;
}
2977
# Return the projects from the list referenced by $projlist that pass
# the given filters; without any filter the whole list is returned.
#
#   tagfilter  => keep projects having this content tag (letter case
#                 is ignored)
#   searchtext => keep projects whose 'path' or 'descr_long' matches
#                 this regular expression
#
# note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my ($tagfilter, $searchtext) = @opts{qw(tagfilter searchtext)};

        return @$projlist
                unless ($tagfilter || $searchtext);

        my @projects;
        foreach my $pr (@$projlist) {

                if ($tagfilter) {
                        my $tags = $pr->{'ctags'};
                        next unless (ref($tags) eq 'HASH');
                        my $wanted = lc($tagfilter);
                        next unless (grep { lc($_) eq $wanted } keys %$tags);
                }

                if ($searchtext) {
                        next if ($pr->{'path'} !~ /$searchtext/ &&
                                 $pr->{'descr_long'} !~ /$searchtext/);
                }

                push @projects, $pr;
        }

        return @projects;
}
3009
# cache of project owners read from the $projects_list file:
# undef until the file has been looked at, then { <path> => <owner> }
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list file, unless that
# has been done already.  The cache is left empty when $projects_list is
# not a plain file or cannot be opened.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # an unreadable list simply provides no owners
                open(my $fd, '<', $projects_list)
                        or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # blank lines carry no project
                        next unless (defined $pr);
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
}
3032
# Return the owner of the given project, taken from the first of these
# sources that provides one: the $projects_list file, the gitweb.owner
# config variable, and finally get_file_owner() for the repository
# directory.  Returns undef when no project is given.  Sets $git_dir to
# the repository of the project.
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # make sure the owners listed in $projects_list have been loaded
        git_get_project_list_from_file()
                unless (defined $gitweb_project_owner);

        my $owner = exists $gitweb_project_owner->{$project}
                ? $gitweb_project_owner->{$project}
                : undef;
        $owner = git_get_project_config('owner')
                unless (defined $owner);
        $owner = get_file_owner("$git_dir")
                unless (defined $owner);

        return $owner;
}
3056
# Find out when the project at the given path was last committed to,
# using the committer line of the most recently committed ref under
# refs/heads.  Returns the list (<age in seconds>, <age string>), or
# (undef, undef) when no committer timestamp is found; returns nothing
# when the git command cannot be started or fails.  Sets $git_dir to
# the repository of the project.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        if (defined $most_recent) {
                # the committer line ends in "<timestamp> <timezone>"
                my ($timestamp) = ($most_recent =~ / (\d+) [-+][01]\d\d\d$/);
                if (defined $timestamp) {
                        my $age = time - $timestamp;
                        return ($age, age_string($age));
                }
        }
        return (undef, undef);
}
3077
# Return the remotes listed by 'git remote -v' as a hash (a hash reference
# in scalar context) keyed by remote name. Each value is a hash mapping the
# parenthesised kind printed by git (e.g. 'fetch', 'push') to the URL, plus
# a 'heads' slot that starts out undefined. When $wanted is given, only the
# remote of that name is returned.
# Returns an empty list when git cannot be run or exits with an error.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find if that
# particular remote is defined is to walk the list provided by
# 'git remote -v' and stop if and when we find what we want.
sub git_get_remotes_list {
	my $wanted = shift;
	my %remotes = ();

	# test open() itself: the lexical handle is autovivified even when
	# open() fails, so checking $fd would never detect the failure
	open my $fd, '-|' , git_cmd(), 'remote', '-v'
		or return;
	while (my $remote = <$fd>) {
		chomp $remote;
		# "<name>\t<url> (<kind>)": cut everything after the name; skip
		# lines of any other shape rather than reuse stale captures
		$remote =~ s!\t(.*?)\s+\((\w+)\)$!!
			or next;
		my ($url, $key) = ($1, $2);
		next if $wanted and not $remote eq $wanted;

		# same value the odd-element "{ 'heads' => () }" produced,
		# without the "Odd number of elements" warning
		$remotes{$remote} ||= { 'heads' => undef };
		$remotes{$remote}{$key} = $url;
	}
	close $fd or return;
	return wantarray ? %remotes : \%remotes;
}
3102
# Takes a reference to a hash of remotes as first parameter and fills it by
# adding the available remote heads for each of the indicated remotes.
#
# The heads are fetched in one git_get_heads_list() call for all
# "remotes/<name>" classes; each remote then gets, under 'heads', a
# reference to the list of entries whose 'name' starts with "<name>/".
# That prefix is removed from the entry's 'name' in place.
sub fill_remote_heads {
	my $remotes = shift;
	my @heads = map { "remotes/$_" } keys %$remotes;
	my @remoteheads = git_get_heads_list(undef, @heads);
	foreach my $remote (keys %$remotes) {
		# \Q..\E: a remote name may contain regexp metacharacters
		# ('.', '+', ...) and has to be matched literally
		$remotes->{$remote}{'heads'} = [ grep {
			$_->{'name'} =~ s!^\Q$remote\E/!!
			} @remoteheads ];
	}
}
3115
# Collect the refs reported by 'git show-ref --dereference'.
#
# With a non-empty $type only "refs/$type" is requested from git. Returns a
# reference to a hash that maps each 40-digit object id to an array
# reference of the ref names pointing at it, with the leading "refs/"
# removed. Returns an empty list when git cannot be run or exits with an
# error.
sub git_get_references {
	my $type = shift || "";
	my %refs;
	# use -- <pattern> if $type
	my @pattern = $type ? ("--", "refs/$type") : ();

	# sample output:
	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
		or return;

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
		# autovivification creates the list the first time an id is seen
		push @{$refs{$1}}, $2;
	}
	close $fd or return;
	return \%refs;
}
3138
# Return the name 'git name-rev --tags' gives to $hash, i.e. the part that
# follows "tags/" on the first output line.
#
# Returns undef when $hash is false, when git printed nothing, or when the
# output does not name $hash after a tag. Returns an empty list when git
# cannot be started.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# $name_rev is undef when git wrote nothing to its output; $hash is
	# quoted so that it is compared literally
	if (defined $name_rev && $name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
		return $1;
	} else {
		# catches also '$hash undefined' output
		return undef;
	}
}
3154
3155## ----------------------------------------------------------------------
3156## parse to hash functions
3157
# Break the timestamp $epoch (seconds since the epoch) into display fields.
#
# $tz is a timezone of the form "+HHMM" / "-HHMM" and defaults to "-0000".
# Returns a hash with
#   hour, minute, mday, day, month       - UTC components
#   rfc2822, mday-time, iso-8601         - UTC formatted in various ways
#   hour_local, minute_local             - time of day shifted by $tz
#   tz_local                             - $tz as given
#   iso-tz                               - shifted date and time followed by $tz
# A $tz that is not of the expected form is treated as a zero offset.
sub parse_date {
	my $epoch = shift;
	my $tz = shift || "-0000";

	my %date;
	my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
	my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
	$date{'hour'} = $hour;
	$date{'minute'} = $min;
	$date{'mday'} = $mday;
	$date{'day'} = $days[$wday];
	$date{'month'} = $months[$mon];
	$date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
	                     $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
	$date{'mday-time'} = sprintf "%d %s %02d:%02d",
	                     $mday, $months[$mon], $hour ,$min;
	$date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
	                     1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

	# start from a zero offset so that an unparsable timezone does not
	# leave undefined values in the arithmetic below
	my ($tz_sign, $tz_hour, $tz_min) = (+1, 0, 0);
	if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
		($tz_sign, $tz_hour, $tz_min) = (($1 eq '-' ? -1 : +1), $2, $3);
	}
	my $local = $epoch + $tz_sign*((($tz_hour*60) + $tz_min)*60);
	# gmtime() of the shifted epoch yields the wall-clock time in $tz
	($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
	$date{'hour_local'} = $hour;
	$date{'minute_local'} = $min;
	$date{'tz_local'} = $tz;
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$year, $mon+1, $mday,
	                          $hour, $min, $sec, $tz);
	return %date;
}
3191
# Read the tag object $tag_id with 'git cat-file tag' and return it as a
# hash:
#   id                  - $tag_id as given
#   object, type, name  - from the "object", "type" and "tag" header lines
#   author, author_epoch, author_tz, author_name, author_email
#                       - from the "tagger" header line
#   comment             - array reference with the lines after the header
# Returns an empty list when git cannot be run or exits with an error, or
# when the object has no "tag" header line.
sub parse_tag {
	my $tag_id = shift;

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

	my %tag = ('id' => $tag_id);
	my @comment;
	while (my $line = <$fd>) {
		chomp $line;
		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
		} elsif ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
		} elsif ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
		} elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@tag{'author_name', 'author_email'} = ($1, $2);
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
		} elsif ($line =~ m/--BEGIN/) {
			# the marker line itself becomes the first comment line
			push @comment, $line;
			last;
		} elsif ($line eq "") {
			# empty line: end of the header
			last;
		}
	}
	# whatever is left on the pipe is the comment, line endings included
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag;
}
3232
# Parse one record of 'git rev-list --header' output into a hash.
#
# $commit_text is the record including its trailing "\0" terminator. The
# first word of its first line becomes 'id', any further words on that line
# are parents. "parent" header lines are added to the parents only when
# $withparents is not defined.
#
# Returns an empty list when the text has no lines, does not start with a
# 40-digit hex id, or has no "tree" header line. Otherwise returns a hash:
#   id, tree, parents (array ref), parent (first parent)
#   author, author_epoch, author_tz, author_name, author_email
#   committer, committer_epoch, committer_tz, committer_name, committer_email
#   title        - first non-empty message line, cut by chop_str(.., 80, 5)
#   title_short  - same line with common merge noise removed, cut to 50
#   comment      - array ref of message lines without the 4-space indent
#   age, age_string, age_string_date, age_string_age
sub parse_commit_text {
	my ($commit_text, $withparents) = @_;
	my @commit_lines = split '\n', $commit_text;
	my %co;

	pop @commit_lines; # Remove '\0'

	if (! @commit_lines) {
		return;
	}

	my $header = shift @commit_lines;
	if ($header !~ m/^[0-9a-fA-F]{40}/) {
		return;
	}
	($co{'id'}, my @parents) = split ' ', $header;
	# the header lines run up to the first empty line; the lines carry
	# no newline any more, so compare against the empty string
	while (defined(my $line = shift @commit_lines)) {
		last if $line eq "";
		if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
			$co{'tree'} = $1;
		} elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
			push @parents, $1;
		} elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
			$co{'author'} = to_utf8($1);
			$co{'author_epoch'} = $2;
			$co{'author_tz'} = $3;
			if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'author_name'}  = $1;
				$co{'author_email'} = $2;
			} else {
				$co{'author_name'} = $co{'author'};
			}
		} elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
			$co{'committer'} = to_utf8($1);
			$co{'committer_epoch'} = $2;
			$co{'committer_tz'} = $3;
			if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'committer_name'}  = $1;
				$co{'committer_email'} = $2;
			} else {
				$co{'committer_name'} = $co{'committer'};
			}
		}
	}
	if (!defined $co{'tree'}) {
		return;
	};
	$co{'parents'} = \@parents;
	$co{'parent'} = $parents[0];

	foreach my $line (@commit_lines) {
		# work on a copy: foreach aliases the array elements, and the
		# shortening below is meant for 'title_short' only, not for the
		# message line that ends up in 'comment'
		(my $title = $line) =~ s/^    //;
		if ($title ne "") {
			$co{'title'} = chop_str($title, 80, 5);
			# remove leading stuff of merges to make the interesting part visible
			if (length($title) > 50) {
				$title =~ s/^Automatic //;
				$title =~ s/^merge (of|with) /Merge ... /i;
				if (length($title) > 50) {
					$title =~ s/(http|rsync):\/\///;
				}
				if (length($title) > 50) {
					$title =~ s/(master|www|rsync)\.//;
				}
				if (length($title) > 50) {
					$title =~ s/kernel.org:?//;
				}
				if (length($title) > 50) {
					$title =~ s/\/pub\/scm//;
				}
			}
			$co{'title_short'} = chop_str($title, 50, 5);
			last;
		}
	}
	if (! defined $co{'title'} || $co{'title'} eq "") {
		$co{'title'} = $co{'title_short'} = '(no commit message)';
	}
	# remove added spaces
	foreach my $line (@commit_lines) {
		$line =~ s/^    //;
	}
	$co{'comment'} = \@commit_lines;

	my $age = time - $co{'committer_epoch'};
	$co{'age'} = $age;
	$co{'age_string'} = age_string($age);
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
	# commits older than two weeks lead with the date, newer ones with
	# the relative age
	if ($age > 60*60*24*7*2) {
		$co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
		$co{'age_string_age'} = $co{'age_string'};
	} else {
		$co{'age_string_date'} = $co{'age_string'};
		$co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
	}
	return %co;
}
3330
# Return the parsed commit $commit_id as a hash (see parse_commit_text),
# read from 'git rev-list --parents --header --max-count=1'.
# The hash is empty when git printed nothing or the output could not be
# parsed. Calls die_error(500, ...) when git cannot be started.
sub parse_commit {
	my ($commit_id) = @_;
	my %co;

	# rev-list --header terminates every record with a NUL byte
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "rev-list",
		"--parents",
		"--header",
		"--max-count=1",
		$commit_id,
		"--"
		or die_error(500, "Open git-rev-list failed");
	# read the record in scalar context: a list-context <$fd> inside
	# the argument list disappears on empty output and would let the
	# trailing 1 slide into the $commit_text position
	my $commit_text = <$fd>;
	close $fd;

	%co = parse_commit_text($commit_text, 1)
		if defined $commit_text;

	return %co;
}
3349
# Run 'git rev-list --header' starting at $commit_id and return the parsed
# commits as a list of hash references (an array reference in scalar
# context), one per record, each built by parse_commit_text().
#
# $maxcount defaults to 1 and $skip to 0; a true $filename limits the walk
# to that path; @args and the global @extra_options are passed to git.
# Calls die_error(500, ...) when git cannot be started.
sub parse_commits {
	my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

	$maxcount ||= 1;
	$skip ||= 0;

	# rev-list --header terminates every record with a NUL byte
	local $/ = "\0";

	my @rev_list = (
		"rev-list",
		"--header",
		@args,
		("--max-count=" . $maxcount),
		("--skip=" . $skip),
		@extra_options,
		$commit_id,
		"--",
	);
	push @rev_list, $filename if $filename;

	open my $fd, "-|", git_cmd(), @rev_list
		or die_error(500, "Open git-rev-list failed");
	my @cos;
	while (my $record = <$fd>) {
		# a record that does not parse still contributes an empty hash
		push @cos, +{ parse_commit_text($record) };
	}
	close $fd;

	return wantarray ? @cos : \@cos;
}
3377
# parse line of git-diff-tree "raw" output
#
# Three line shapes are recognized; any other line gives an empty result:
#  - ordinary diff: from_mode, to_mode, from_id, to_id, status, similarity,
#    from_file, to_file (and 'file' unless the status is R or C)
#  - combined diff of a merge: nparents, from_mode / from_id (array refs,
#    one entry per parent), to_mode, to_id, status (array ref), to_file
#  - a bare 40-digit hex id: commit
# Returns a hash, or a hash reference in scalar context.
sub parse_difftree_raw_line {
	my $line = shift;
	my %res;

	# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
	# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
	if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
		my $names = $7;
		@res{qw(from_mode to_mode from_id to_id status similarity)} =
			($1, $2, $3, $4, $5, $6);
		if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
			# two tab-separated names: source and destination
			($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $names);
		} else {
			$res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
		}
	}
	# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
	# combined diff (for merge commit)
	elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
		my ($colons, $modes, $ids, $statuses, $name) = ($1, $2, $3, $4, $5);
		my @modes = split(' ', $modes);
		my @ids   = split(' ', $ids);

		$res{'nparents'}  = length($colons);
		# the last mode / id describes the result, the others the parents
		$res{'to_mode'}   = pop @modes;
		$res{'from_mode'} = \@modes;
		$res{'to_id'}     = pop @ids;
		$res{'from_id'}   = \@ids;
		$res{'status'}    = [ split('', $statuses) ];
		$res{'to_file'}   = unquote($name);
	}
	# 'c512b523472485aef4fff9e57b229d9d243c967f'
	elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
		$res{'commit'} = $1;
	}

	return wantarray ? %res : \%res;
}
3416
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
sub parsed_difftree_line {
	my ($line_or_ref) = @_;

	# pre-parsed (or generated by hand): hand it back untouched
	return $line_or_ref
		if ref($line_or_ref) eq "HASH";

	return parse_difftree_raw_line($line_or_ref);
}
3429
# parse line of git-ls-tree output
#
# Options (passed as key => value pairs after the line):
#   -l  the line has a size column; adds 'size' to the result
#   -z  the name is used as is; otherwise it is passed through unquote()
# Returns a hash (a hash reference in scalar context) with mode, type,
# hash, name and, with -l, size. All of them are undefined when the line
# does not have the expected shape.
sub parse_ls_tree_line {
	my $line = shift;
	my %opts = @_;
	my %res;
	my $name;

	# The fields are captured in list context so that a line which does
	# not match yields undefined fields instead of whatever $1.. still
	# hold from an earlier, unrelated match.
	if ($opts{'-l'}) {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717	panic.c'
		(@res{qw(mode type hash size)}, $name) =
			($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s);
	} else {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
		(@res{qw(mode type hash)}, $name) =
			($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);
	}

	$res{'name'} = ($opts{'-z'} || !defined $name)
		? $name
		: unquote($name);

	return wantarray ? %res : \%res;
}
3465
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# $diffinfo is a parsed difftree line. $from and $to receive 'file' and
# 'href' describing the pre-image and the post-image. For a combined diff
# ($diffinfo->{'nparents'} is true) the $from entries are array references
# with one element per parent, taken from @parents. The 'href' is undefined
# (combined diff) or absent (ordinary diff, $to) where no blob exists.
sub parse_from_to_diffinfo {
	my ($diffinfo, $from, $to, @parents) = @_;

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$from->{'file'} = [];
		$from->{'href'} = [];
		unless (exists $diffinfo->{'from_file'}) {
			fill_from_file_info($diffinfo, @parents);
		}
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			# fall back on the result name where a parent has none
			my $from_file = $diffinfo->{'from_file'}[$i];
			$from_file = $diffinfo->{'to_file'}
				unless defined $from_file;
			$from->{'file'}[$i] = $from_file;

			if ($diffinfo->{'status'}[$i] eq "A") { # new (added) file
				$from->{'href'}[$i] = undef;
			} else {
				$from->{'href'}[$i] = href(action=>"blob",
				                           hash_base=>$parents[$i],
				                           hash=>$diffinfo->{'from_id'}[$i],
				                           file_name=>$from->{'file'}[$i]);
			}
		}
	} else {
		# ordinary (not combined) diff
		$from->{'file'} = $diffinfo->{'from_file'};
		if ($diffinfo->{'status'} eq "A") { # new (added) file
			delete $from->{'href'};
		} else {
			$from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
			                       hash=>$diffinfo->{'from_id'},
			                       file_name=>$from->{'file'});
		}
	}

	$to->{'file'} = $diffinfo->{'to_file'};
	if (is_deleted($diffinfo)) { # no file in result
		delete $to->{'href'};
	} else {
		$to->{'href'} = href(action=>"blob", hash_base=>$hash,
		                     hash=>$diffinfo->{'to_id'},
		                     file_name=>$to->{'file'});
	}
}
3511
3512## ......................................................................
3513## parse to array of hashes functions
3514
# List refs with 'git for-each-ref', sorted by committer date, newest first.
#
# @classes names the subdirectories of refs/ to list and defaults to
# ('heads'). With a true $limit git is asked for $limit+1 entries.
# Returns a list of hash references (an array reference in scalar context)
# with the keys fullname, name, id, title, epoch and age, or an empty list
# when git cannot be started.
sub git_get_heads_list {
	my ($limit, @classes) = @_;
	@classes = ('heads') unless @classes;
	my @patterns = map { "refs/$_" } @classes;
	my @headslist;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
		'--format=%(objectname) %(refname) %(subject)%00%(committer)',
		@patterns
		or return;
	while (my $line = <$fd>) {
		chomp $line;
		# a NUL byte separates the ref part from the committer part
		my ($refinfo, $committerinfo) = split(/\0/, $line);
		my ($hash, $name, $title) = split(' ', $refinfo, 3);
		my ($committer, $epoch, $tz) =
			($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

		(my $short_name = $name) =~ s!^refs/(?:head|remote)s/!!;
		my %ref_item = (
			'fullname' => $name,
			'name'     => $short_name,
			'id'       => $hash,
			'epoch'    => $epoch,
		);
		$ref_item{'title'} = $title || '(no commit message)';
		$ref_item{'age'} = $epoch
			? age_string(time - $epoch)
			: "unknown";

		push @headslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @headslist : \@headslist;
}
3553
# List refs/tags with 'git for-each-ref', sorted by creator date, newest
# first. With a true $limit git is asked for $limit+1 entries.
#
# Returns a list of hash references (an array reference in scalar context)
# with the keys fullname, name, type, id, reftype and refid. Entries of
# type "tag" also carry 'subject'; entries of type "tag" or "commit" also
# carry 'epoch' and 'age'. Returns an empty list when git cannot be started.
sub git_get_tags_list {
	my $limit = shift;
	my @tagslist;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
		'--format=%(objectname) %(objecttype) %(refname) '.
		'%(*objectname) %(*objecttype) %(subject)%00%(creator)',
		'refs/tags'
		or return;
	while (my $line = <$fd>) {
		chomp $line;
		# a NUL byte separates the ref part from the creator part
		my ($refinfo, $creatorinfo) = split(/\0/, $line);
		my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
		my ($creator, $epoch, $tz) =
			($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
		my $is_tag_object = ($type eq "tag");

		(my $short_name = $name) =~ s!^refs/tags/!!;
		my %ref_item = (
			'fullname' => $name,
			'type'     => $type,
			'id'       => $id,
			'name'     => $short_name,
		);
		if ($is_tag_object) {
			# a tag object refers to another object
			$ref_item{'subject'} = $title;
			$ref_item{'reftype'} = $reftype;
			$ref_item{'refid'}   = $refid;
		} else {
			# anything else stands for itself
			$ref_item{'reftype'} = $type;
			$ref_item{'refid'}   = $id;
		}

		if ($is_tag_object || $type eq "commit") {
			$ref_item{'epoch'} = $epoch;
			$ref_item{'age'} = $epoch
				? age_string(time - $epoch)
				: "unknown";
		}

		push @tagslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @tagslist : \@tagslist;
}
3602
3603## ----------------------------------------------------------------------
3604## filesystem-related functions
3605
# Return the owner of $path as a display name: the GECOS field of the
# passwd entry of the file's uid, cut at the first ',' or ';' and passed
# through to_utf8().
# Returns undef when $path cannot be stat()ed or the passwd entry has no
# GECOS field.
sub get_file_owner {
	my $path = shift;

	# stat() returns an empty list on failure; without this check the
	# undefined uid would be looked up as uid 0
	my @st = stat($path)
		or return undef;
	my $st_uid = $st[4];

	my ($name, $passwd, $uid, $gid, $quota, $comment, $gcos, $dir, $shell) = getpwuid($st_uid);
	if (!defined $gcos) {
		return undef;
	}
	my $owner = $gcos;
	$owner =~ s/[,;].*$//;
	return to_utf8($owner);
}
3618
# Print the contents of $filename, every line passed through to_utf8(), to
# the currently selected output handle.
# The caller is expected to have checked that the file exists; when it
# cannot be opened anyway, nothing is printed.
sub insert_file {
	my $filename = shift;

	# do not read from a handle that was never opened
	open my $fd, '<', $filename
		or return;
	print map { to_utf8($_) } <$fd>;
	close $fd;
}
3627
3628## ......................................................................
3629## mimetype related functions
3630
# Look up the MIME type of $filename in the mime.types style file $mimemap.
#
# Each line of that file that does not start with '#' is split on
# whitespace into a MIME type followed by the extensions it covers. The
# extension of $filename is the text after its last '.', compared as is.
# Returns the MIME type, or undef when the map file is not readable, the
# file name has no '.', or the extension is not listed.
sub mimetype_guess_file {
	my $filename = shift;
	my $mimemap = shift;
	-r $mimemap or return undef;

	my %mimemap;
	open(my $mh, '<', $mimemap) or return undef;
	# read into a lexical so that the caller's $_ is left alone
	while (my $line = <$mh>) {
		next if $line =~ m/^#/; # skip comments
		my ($mimetype, @exts) = split(/\s+/, $line);
		foreach my $ext (@exts) {
			$mimemap{$ext} = $mimetype;
		}
	}
	close($mh);

	# take the extension from this match only; a name without a dot
	# must not pick up $1 from an earlier, unrelated match
	my ($ext) = ($filename =~ /\.([^.]*)$/)
		or return undef;
	return $mimemap{$ext};
}
3650
# Guess the MIME type of $filename from its extension.
#
# $mimetypes_file, when set, is consulted first; a path not starting with
# '/' is taken relative to the current project's directory. If that gives
# nothing, /etc/mime.types is tried. Returns undef for a name without a
# '.', and whatever the last lookup returned otherwise.
sub mimetype_guess {
	my $filename = shift;
	$filename =~ /\./ or return undef;

	my $mime;
	if ($mimetypes_file) {
		# a relative path is relative to the project
		my $file = ($mimetypes_file =~ m!^/!)
			? $mimetypes_file
			: "$projectroot/$project/$mimetypes_file";
		$mime = mimetype_guess_file($filename, $file);
	}
	$mime ||= mimetype_guess_file($filename, '/etc/mime.types');
	return $mime;
}
3667
# Determine the MIME type of a blob read from the filehandle $fd.
#
# A type found by mimetype_guess() for $filename wins. Without a filehandle
# $default_blob_plain_mimetype is returned. Otherwise content that passes
# the -T (text) test is 'text/plain', and the remaining cases are decided
# by the .png, .gif and .jpg/.jpeg extensions, ending with
# 'application/octet-stream'.
sub blob_mimetype {
	my ($fd, $filename) = @_;

	if ($filename) {
		my $mime = mimetype_guess($filename);
		return $mime if $mime;
	}

	# just in case
	return $default_blob_plain_mimetype unless $fd;

	return 'text/plain'               if -T $fd;
	return 'application/octet-stream' unless $filename;
	return 'image/png'                if $filename =~ m/\.png$/i;
	return 'image/gif'                if $filename =~ m/\.gif$/i;
	return 'image/jpeg'               if $filename =~ m/\.jpe?g$/i;
	return 'application/octet-stream';
}
3694
# Return the Content-Type value for a blob.
#
# $type is used when true, otherwise blob_mimetype($fd, $file_name) decides.
# For 'text/plain' the charset from $default_text_plain_charset is
# appended, provided that variable is defined.
sub blob_contenttype {
	my ($fd, $file_name, $type) = @_;

	$type = blob_mimetype($fd, $file_name)
		unless $type;

	return $type
		unless $type eq 'text/plain' && defined $default_text_plain_charset;
	return $type . "; charset=$default_text_plain_charset";
}
3705
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# $highlight must be true and $file_name defined, else undef is returned.
# The base name (with a trailing '.in' removed) is looked up in
# %highlight_basename first, then the text after its last '.' in
# %highlight_ext. $mimetype is accepted but not used.
sub guess_file_syntax {
	my ($highlight, $mimetype, $file_name) = @_;
	return undef unless ($highlight && defined $file_name);
	my $basename = basename($file_name, '.in');
	return $highlight_basename{$basename}
		if exists $highlight_basename{$basename};

	# take the extension from this match only; a name without a dot
	# must not pick up $1 from an earlier, unrelated match
	my ($ext) = ($basename =~ /\.([^.]*)$/)
		or return undef;
	return $highlight_ext{$ext}
		if exists $highlight_ext{$ext};

	return undef;
}
3722
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# With a true $highlight and a defined $syntax the passed handle is closed
# and reopened on a shell pipeline that feeds 'git cat-file blob' of the
# global $hash into $highlight_bin. Calls die_error(500, ...) when that
# pipeline cannot be opened.
sub run_highlighter {
	my ($fd, $highlight, $syntax) = @_;
	return $fd unless ($highlight && defined $syntax);

	close $fd;
	my $cat_blob    = quote_command(git_cmd(), "cat-file", "blob", $hash);
	my $highlighter = quote_command($highlight_bin);
	# the trailing '|' makes this a read-from-command open
	open $fd, $cat_blob." | ".
	          $highlighter.
	          " --replace-tabs=8 --fragment --syntax $syntax |"
		or die_error(500, "Couldn't open file or run syntax highlighter");
	return $fd;
}
3736
3737## ======================================================================
3738## functions printing HTML: header, footer, error page
3739
# Build the page title from the request's global state.
#
# The title starts with $site_name. Without a project, $project_filter is
# appended when defined. With a project the title grows to
# "<site> - <project>", then "/<action>", then " - <file name>", each part
# only when the respective variable is defined; for the "tree" action a
# file name that lacks a trailing '/' gets one.
sub get_page_title {
	my $title = to_utf8($site_name);

	if (!defined $project) {
		$title .= " - " . to_utf8($project_filter)
			if defined $project_filter;
		return $title;
	}
	$title .= " - " . to_utf8($project);

	if (defined $action) {
		$title .= "/$action"; # $action is US-ASCII (7bit ASCII)

		if (defined $file_name) {
			$title .= " - " . esc_path($file_name);
			$title .= "/"
				if ($action eq "tree" && $file_name !~ m|/$|);
		}
	}

	return $title;
}
3762
# Choose the content type for HTML pages: 'application/xhtml+xml' when the
# client asks for it explicitly, 'text/html' otherwise.
sub get_content_type_html {
	# require explicit support from the UA if we are to send the page as
	# 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
	# we have to do this because MSIE sometimes globs '*/*', pretending to
	# support xhtml+xml but choking when it gets what it asked for.
	my $accept = $cgi->http('HTTP_ACCEPT');
	my $wants_xhtml =
		defined $accept &&
		$accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
		$cgi->Accept('application/xhtml+xml') != 0;

	return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3776
# Print the <link rel="alternate"> elements for the page header.
#
# With a project: for each of the RSS and Atom formats one link to the feed
# described by get_feed_info() and one to the same feed with
# extra_options=--no-merges. The feed title defaults to 'log'.
# Without a project: links to the "project_index" and "opml" actions.
# URLs produced by href() are escaped with esc_attr() before they are
# placed into the href attribute.
sub print_feed_meta {
	if (defined $project) {
		my %href_params = get_feed_info();
		if (!exists $href_params{'-title'}) {
			$href_params{'-title'} = 'log';
		}

		foreach my $format (qw(RSS Atom)) {
			my $type = lc($format);
			my $title = esc_attr("$project - $href_params{'-title'} - $format feed");

			# each link is built from its own copy of the parameters,
			# so the '--no-merges' option of one link cannot leak into
			# the plain link of the next format
			my %with_merges = (%href_params, 'action' => $type);
			my %no_merges   = (%with_merges, 'extra_options' => '--no-merges');

			foreach my $link ([ $title,                \%with_merges ],
			                  [ "$title (no merges)",  \%no_merges   ]) {
				my ($link_title, $params) = @$link;
				print "<link ".
				      "rel=\"alternate\" ".
				      "title=\"$link_title\" ".
				      "href=\"" . esc_attr(href(%$params)) . "\" ".
				      "type=\"application/$type+xml\" ".
				      "/>\n";
			}
		}

	} else {
		printf('<link rel="alternate" title="%s projects list" '.
		       'href="%s" type="text/plain; charset=utf-8" />'."\n",
		       esc_attr($site_name),
		       esc_attr(href(project=>undef, action=>"project_index")));
		printf('<link rel="alternate" title="%s projects feeds" '.
		       'href="%s" type="text/x-opml" />'."\n",
		       esc_attr($site_name),
		       esc_attr(href(project=>undef, action=>"opml")));
	}
}
3821
# Print the <link> elements of the page header: the stylesheets, the feed
# links (only when $status is '200 OK') and, if $favicon is defined, the
# shortcut icon.
sub print_header_links {
	my $status = shift;

	# print out each stylesheet that exist, providing backwards capability
	# for those people who defined $stylesheet in a config file
	my @sheets = defined $stylesheet
		? ($stylesheet)
		: grep { $_ } @stylesheets;
	foreach my $sheet (@sheets) {
		print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
	}

	print_feed_meta()
		if ($status eq '200 OK');

	if (defined $favicon) {
		print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
	}
}
3841
# Print the breadcrumb trail shown in the page header:
#   home / project / action / extra
# The project and later parts are printed only when $project is defined.
#
# Options:
#   -action_extra => HTML fragment appended as the last crumb; when given,
#                    the action crumb is turned into a link
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        return unless defined $project;

        print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
        if (defined $action) {
                my $action_print = defined $extra
                        ? $cgi->a({-href => href(action=>$action)}, $action)
                        : $action;
                print " / $action_print";
        }
        print " / $extra" if defined $extra;
        print "\n";
}
3862
# Print the per-project search form (search type selector, text field and
# "re" checkbox).
#
# Reads the globals $searchtext, $hash_base, $hash, $project, $my_uri and
# $search_use_regexp.  As a side effect an undefined $searchtext is set to
# the empty string.  With the 'pathinfo' feature enabled the project goes
# into the form's action URL, otherwise it is sent as the hidden "p" field.
sub print_search_form {
        if (!defined $searchtext) {
                $searchtext = "";
        }
        # search relative to the most specific revision we know about
        my $search_hash;
        if (defined $hash_base) {
                $search_hash = $hash_base;
        } elsif (defined $hash) {
                $search_hash = $hash;
        } else {
                $search_hash = "HEAD";
        }
        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if ($use_pathinfo) {
                $action .= "/".esc_url($project);
        }
        # start_form() is the supported name; the old startform() alias was
        # removed from CGI.pm in 4.04 and dies there with an undefined method.
        print $cgi->start_form(-method => "get", -action => $action) .
              "<div class=\"search\">\n" .
              (!$use_pathinfo &&
              $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
              " search:\n",
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
3898
# Emit the HTTP header (unless suppressed) and the opening part of a gitweb
# page: XML/DOCTYPE prologue, <head>, optional site header file, the page
# header with logo and breadcrumbs, and (for project pages with the
# 'search' feature on) the search form.
#
# Parameters:
#   $status  - HTTP status line, defaults to "200 OK"
#   $expires - passed to CGI's header() as -expires
#   %opts    - '-no_http_header' suppresses the HTTP header; the whole hash
#              is also forwarded to print_nav_breadcrumbs()
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type => $content_type, -charset => 'utf-8',
                                   -status => $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # Relative stylesheet/favicon/logo URLs only resolve correctly under
        # path_info when an explicit base URL is given.
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my $logo_img = $cgi->img({-src => esc_url($logo),
                                          -width => 72, -height => 27,
                                          -alt => "git",
                                          -class => "logo"});
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $logo_img);
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $have_search);
}
3957
# Emit the closing part of a gitweb page: the footer with project
# description and feed links (or OPML/TXT links when no project is
# selected), optional timing information, optional site footer file, the
# JavaScript includes and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                # no feed info for this view: mark the links as generic
                my %href_params = get_feed_info();
                $feed_class .= ' generic' unless %href_params;
                $href_params{'-title'} ||= 'log';

                for my $format ('RSS', 'Atom') {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                my $elapsed = tv_interval($t0, [ gettimeofday() ]);
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      $elapsed.
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        my $incremental_blame = (defined $action && $action eq 'blame_incremental');
        if ($incremental_blame) {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # collect the statements of the onload handler
                my $onload = '';
                $onload .= qq!       fixLinks();\n!
                        if gitweb_check_feature('javascript-actions');
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        # cookie lifetime ('expires') is in days
                        $onload .= qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!.
                                   qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }

                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!.
                      $onload.
                      qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4034
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
# Any other status code is reported as 500.
#
# Prints a complete error page (header, message, optional details, footer)
# and then jumps to DONE_GITWEB, unless the '-error_handler' option is set,
# in which case it returns to the caller.  <error_message> is HTML-escaped;
# <detailed_html_description> is printed as-is.  Remaining arguments are
# options, also passed on to git_header_html().
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # An unmapped code would reach git_header_html() as undef, which it
        # replaces with "200 OK" -- an error page must never be sent as 200.
        $status = 500 unless exists $http_responses{$status};
        git_header_html($http_responses{$status}, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4078
4079## ----------------------------------------------------------------------
4080## functions printing or outputting HTML: navigation
4081
# Print the navigation bar (<div class="page_nav">) with links to the
# standard views plus any views configured through the 'actions' feature.
#
# Parameters:
#   $current  - name of the current view; printed as plain text, not a link
#   $suppress - name of a standard view to leave out (optional)
#   $head     - hash used for the commit/commitdiff links and, for
#               revision-related current views, the shortlog/log links
#   $treehead - 'hash' parameter of the tree link
#   $treebase - 'hash_base' parameter of the tree link
#   $extra    - HTML printed on the second line (pager or formats)
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters for every standard view
        my %arg;
        $arg{$_} = { action => $_ } for @navs;
        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                push @with_head, qw(shortlog log)
                        if $current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x;
                $arg{$_}{'hash'} = $head for @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # configured actions come as (label, link template, position) triples
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # place the new label right after the view named by $pos
                my @with_label;
                for my $nav (@navs) {
                        push @with_label, $nav;
                        push @with_label, $label if $nav eq $pos;
                }
                @navs = @with_label;
                # expand the %-placeholders of the link template
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @items;
        for my $nav (@navs) {
                if ($nav eq $current) {
                        push @items, $nav;
                        next;
                }
                my $custom = $arg{$nav}{_href};
                my $url = $custom ? $custom : href(%{$arg{$nav}});
                push @items, $cgi->a({-href => $url}, "$nav");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @items);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4131
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes): the views are joined with " | ", the current view is plain
# text and the others are links; the remotes view is listed only if the
# 'remote_heads' feature is enabled
sub format_ref_views {
        my ($current) = @_;

        my @views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @views, 'remotes';
        }

        my @items;
        for my $view (@views) {
                if ($view eq $current) {
                        push @items, $view;
                } else {
                        push @items, $cgi->a({-href => href(action=>$view)}, $view);
                }
        }
        return join(" | ", @items);
}
4144
# Return the "first . prev . next" pager as an HTML fragment.
#
# Parameters:
#   $action        - accepted for the callers' sake, not used here
#   $page          - current page number (0 is the first page)
#   $has_next_link - true if there is a page after the current one
#
# Entries that make no sense on the current page are plain text, the
# others replay the current request with a different 'page' parameter.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my ($first, $prev) = ("first", "prev");
        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                  -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        my $next = "next";
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
4170
4171## ......................................................................
4172## functions printing or outputting HTML: div
4173
# Print a <div class="header"> containing a single link.
#
# Parameters:
#   $action    - action the link points to; also the link text if no
#                title is given
#   $title     - link text (printed as-is)
#   $hash      - 'hash' parameter of the link, used only if true
#   $hash_base - 'hash_base' parameter of the link, used only if true
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (action => $action);
        $args{'hash'} = $hash if $hash;
        $args{'hash_base'} = $hash_base if $hash_base;

        my $label = $title ? $title : $action;
        my $link = $cgi->a({-href => href(%args), -class => "title"}, $label);
        print "<div class=\"header\">\n" .
              $link .
              "\n</div>\n";
}
4187
# Return one table row of class "metadata_url" with $name in the first
# cell and $url in the second.  Both values are inserted as-is, without
# any escaping.
sub format_repo_url {
        my ($name, $url) = @_;
        return join('',
                '<tr class="metadata_url">',
                "<td>$name</td>",
                "<td>$url</td>",
                "</tr>\n");
}
4192
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed as *handle, \*handle,
# *handle{IO} or a handle object, or a function reference. In the latter
# case all following parameters will be taken as argument to the content
# function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        # Recognize every way a filehandle can arrive.  ref() alone is not
        # enough: a bare glob (*FH) is not a reference at all, and *FH{IO}
        # as well as handle objects are blessed (IO::File on perl >= 5.12),
        # so their ref() is a class name rather than 'GLOB'.
        require Scalar::Util;
        my $reftype = Scalar::Util::reftype($content) || '';
        my $is_handle = $reftype eq 'GLOB'
                     || $reftype eq 'IO'
                     || ref(\$content) eq 'GLOB';

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                # must be tested before the plain-scalar case, which a bare
                # glob would otherwise satisfy
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4230
# Return an HTML fragment for a date: the RFC 2822 timestamp followed by
# the local time in parentheses.
#
# $date is a hash reference with the keys 'rfc2822', 'hour_local',
# 'minute_local' and 'tz_local'.  If the 'javascript-timezone' feature
# supplies a CSS class, the timestamp is wrapped in a <span> of that class.
# Local times before 06:00 are marked with the "atnight" class.
sub format_timestamp_html {
        my ($date) = @_;

        # only the third value of the feature (the CSS class) matters here
        my $datetime_class = (gitweb_get_feature('javascript-timezone'))[2];

        my $stamp = $date->{'rfc2822'};
        $stamp = qq!<span class="$datetime_class">$stamp</span>!
                if $datetime_class;

        my $at_night = $date->{'hour_local'} < 6;
        my $local_fmt = $at_night
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';
        my $local = sprintf($local_fmt,
                            @{$date}{qw(hour_local minute_local tz_local)});

        return $stamp . ' ' . $local;
}
4251
# Outputs the author name and date in long form, followed by the author's
# avatar, wrapped in an element of class "author_date".
#
# Parameters:
#   $co   - commit hash reference (author_name, author_epoch, author_tz and
#           author_email are read)
#   -tag  => name of the wrapping element, 'div' by default
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
        my $who    = format_search_author($author, "author", esc_html($author));
        my $when   = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $who .
              " [" . $when . "]" .
              $avatar .
              "</$tag>\n";
}
4266
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
# Each person takes two rows: name, e-mail and avatar (spanning both rows)
# in the first one, the timestamp in the second.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') if !@people;

        for my $who (@people) {
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link  = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');
                my $when   = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>" .
                      $name_link . " " .
                      $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $when .
                      "</td>" .
                      "</tr>\n";
        }
}
4294
# Print the "page path" line: a link to the tree root followed by one link
# per directory component of $name, and finally the last path component.
#
# Parameters:
#   $name - path of the object, relative to the top tree (may be undef)
#   $type - 'blob' links the last component to its blob_plain view, 'tree'
#           to its tree view; anything else prints it as plain text
#   $hb   - hash base used for all generated links
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                # one link per leading directory, each to the path built so far
                foreach my $dir (@dirname) {
                        $fullname .= ($fullname ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # The last component links to the path passed in as $name,
                # like its title and the directory links above, rather than
                # to the global $file_name.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4332
# Print a commit message as HTML, one "<br/>"-terminated line per log line.
#
# Parameters:
#   $log  - array reference with the lines of the message; NOTE that the
#           title and leading empty lines are removed from this array
#   %opts - '-remove_title'     drop the first line
#           '-remove_signoff'   drop Signed-off-by/Acked-by/Cc lines
#           '-final_empty_line' make sure the output ends with an empty line
#
# Runs of empty lines are collapsed into one, and empty lines directly
# following a signoff line are dropped.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # true while only empty lines followed a signoff
        my $empty = 0;   # true if the last printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                        }
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                        # Only a non-empty line ends the "after signoff"
                        # state; clearing it on the empty line itself would
                        # make the check above a no-op.
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4381
# return link target (what link points to): the whole content of the blob
# $hash as printed by "git cat-file blob"; returns nothing if the command
# cannot be started or if closing the pipe fails
sub git_get_link_target {
        my ($hash) = @_;

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;
        # slurp the whole blob at once
        my $link_target = do { local $/; <$fd> };
        close $fd
                or return;

        return $link_target;
}
4399
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# Empty path components and '.' are dropped and '..' is resolved; a target
# that climbs above the top directory cannot be normalized.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir)
        my $path;
        if (defined $basedir && $basedir ne '') {
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and ''; compare as strings so that a
                # component named "0" is kept
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        if (@path_parts) {
                                pop @path_parts;
                        } else {
                                # link leads outside repository (outside top dir)
                                return;
                        }
                } else {
                        push @path_parts, $part;
                }
        }
        $path = join('/', @path_parts);

        return $path;
}
4439
# print tree entry (row of git_tree), but without encompassing <tr> element
#
# Parameters:
#   $t          - hash reference describing the entry (mode, type, hash,
#                 name and optionally size)
#   $basedir    - prefix prepended to the entry name to form its path
#   $hash_base  - hash base for the generated links (may be undef)
#   $have_blame - true if a "blame" link should be offered for blobs
#
# The cells of a row are: mode, optional size, list (the entry name as a
# link) and link (the action links for the entry).
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my $type = $t->{'type'};
        my $name = $t->{'name'};
        my $id   = $t->{'hash'};
        # hash_base goes into the blob/tree links only when it is known
        my @base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        if ($type eq "blob") {
                my $path = "$basedir$name";

                print "<td class=\"list\">" .
                        $cgi->a({-href => href(action=>"blob", hash=>$id,
                                               file_name=>$path, @base_key),
                                -class => "list"}, esc_path($name));
                if (S_ISLNK(oct $t->{'mode'})) {
                        # symbolic link: also show where it points to
                        my $link_target = git_get_link_target($id);
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                print " -> " .
                                      (defined $norm_target
                                       ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                file_name=>$norm_target),
                                                  -title => $norm_target}, esc_path($link_target))
                                       : esc_path($link_target));
                        }
                }
                print "</td>\n";

                my $links = $cgi->a({-href => href(action=>"blob", hash=>$id,
                                                   file_name=>$path, @base_key)},
                                    "blob");
                if ($have_blame) {
                        $links .= " | " .
                                  $cgi->a({-href => href(action=>"blame", hash=>$id,
                                                         file_name=>$path, @base_key)},
                                          "blame");
                }
                if (defined $hash_base) {
                        $links .= " | " .
                                  $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                         hash=>$id, file_name=>$path)},
                                          "history");
                }
                $links .= " | " .
                          $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                                 file_name=>$path)},
                                  "raw");
                print "<td class=\"link\">" . $links . "</td>\n";

        } elsif ($type eq "tree") {
                my $path = "$basedir$name";

                print "<td class=\"list\">" .
                      $cgi->a({-href => href(action=>"tree", hash=>$id,
                                             file_name=>$path,
                                             @base_key)},
                              esc_path($name)) .
                      "</td>\n";

                my $links = $cgi->a({-href => href(action=>"tree", hash=>$id,
                                                   file_name=>$path,
                                                   @base_key)},
                                    "tree");
                if (defined $hash_base) {
                        $links .= " | " .
                                  $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                         file_name=>$path)},
                                          "history");
                }
                print "<td class=\"link\">" . $links . "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($name) .
                      "</td>\n";

                my $links = '';
                if (defined $hash_base) {
                        $links = $cgi->a({-href => href(action=>"history",
                                                        hash_base=>$hash_base,
                                                        file_name=>"$basedir$name")},
                                         "history");
                }
                print "<td class=\"link\">" . $links . "</td>\n";
        }
}
4532
4533## ......................................................................
4534## functions printing large fragments of HTML
4535
# get pre-image filenames for merge (combined) diff
#
# Sets $diff->{'from_file'} to an array with one slot per parent.  A slot
# is filled in (by looking up the parent's 'from_id' with
# git_get_path_by_hash()) only where the status for that parent is 'R' or
# 'C'; all other slots stay undef.  Returns $diff itself.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $from_file = $diff->{'from_file'} = [ ];
        # make the array as long as the number of parents
        $from_file->[$diff->{'nparents'} - 1] = undef;

        my $i = 0;
        while ($i < $diff->{'nparents'}) {
                my $status = $diff->{'status'}[$i];
                if ($status eq 'R' || $status eq 'C') {
                        $from_file->[$i] =
                                git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
                }
                $i++;
        }

        return $diff;
}
4552
# is current raw difftree line of file deletion
#
# $diffinfo is a hash reference of a parsed raw diff line; a deletion is
# recognised by an all-zero 'to_id'.  Both the 40-digit (SHA-1) and the
# 64-digit (SHA-256) form of the null object id are accepted.
sub is_deleted {
        my $diffinfo = shift;
        my $to_id = $diffinfo->{'to_id'};

        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4559
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# True only if both are defined and name the same 'to_file'.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_known = defined $diffinfo && defined $patchinfo;
        return $both_known unless $both_known;

        return $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4570
4571
# Print the "difftree" table: one row per changed file with its status and
# links to the related blob / diff / blame / history views.
#
# $difftree - arrayref of raw difftree lines; each one is run through
#             parsed_difftree_line()
# $hash     - id of the commit being shown; used as hash_base for every
#             link that points at the post-image of a file
# @parents  - parent commit ids; the first one is used as hash_base for
#             pre-image links of an ordinary diff, and more than one parent
#             switches the table to the "combined" layout
#
# Reads the global $action: "patch" anchors are only generated in the
# 'commitdiff' view.  Output goes to the currently selected filehandle;
# nothing meaningful is returned.
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        # the summary line is only shown for larger changesets (over 11 files)
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1; # toggles between "dark" and "light" rows
        my $patchno = 0;   # number of the patch anchor the next row links to
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                # no post-image to link to, print the bare name
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent; while at it, find out whether the
                        # file has any history and whether it survives in the result
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        # added relative to this parent: nothing to link to
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        # mark cells where this parent already had the
                                        # same blob as the result
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # modes of all zeros mean "no such side"; the *_mode_str
                # variables are only set for regular files
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file only exists in the parent, so every link
                        # in this row is based on $parent
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # The post-image (to_id / to_file) lives in the commit
                        # being shown, so it has to be based on $hash, exactly
                        # like the filename link at the start of this row; the
                        # new name need not exist in $parent at all.
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4879
# Print one diff chunk in side-by-side layout.
#
# Takes a list of [ $class, $line ] pairs, where $line is the HTML already
# prepared for that diff line and $class is one of 'chunk_header', 'ctx',
# 'rem', 'add' or 'incomplete'.  Chunk headers are printed right away; the
# other lines are collected and emitted in blocks: context lines go to both
# the "old" and the "new" column, a run of removed and/or added lines
# becomes a "rem", "add" or "chg" block.
# An 'incomplete' entry is relabelled (in the passed pair itself) with the
# class of the entry before it.
sub print_sidebyside_diff_chunk {
        my @chunk = @_;
        my (@ctx, @rem, @add);

        return unless @chunk;

        # wraps lines into one column (side is "old" or "new")
        my $column = sub {
                my ($side, @lines) = @_;
                return join '', "<div class=\"$side\">", @lines, '</div>';
        };

        # an incomplete last line might belong to the removed or the added
        # lines, or to the context: it shares the class of its predecessor
        foreach my $idx (1 .. $#chunk) {
                $chunk[$idx][0] = $chunk[$idx-1][0]
                        if $chunk[$idx][0] eq 'incomplete';
        }

        # sentinel entry which forces the final flush of the accumulators
        push @chunk, ["", ""];

        foreach my $entry (@chunk) {
                my ($class, $line) = @$entry;

                # chunk headers are passed through unchanged
                if ($class && $class eq 'chunk_header') {
                        print $line;
                        next;
                }

                my $no_class = !$class;

                # context collected so far ends when a rem/add run starts,
                # or at the end of the chunk
                if (@ctx && ($no_class || $class eq 'rem' || $class eq 'add')) {
                        print join '',
                                '<div class="chunk_block ctx">',
                                $column->('old', @ctx),
                                $column->('new', @ctx),
                                '</div>';
                        @ctx = ();
                }

                # a rem/add run ends when context starts, or at the end of
                # the chunk
                if ((@rem || @add) && ($no_class || $class eq 'ctx')) {
                        my ($kind, @columns);
                        if (!@add) {
                                # only removed lines
                                $kind    = 'rem';
                                @columns = ($column->('old', @rem));
                        } elsif (!@rem) {
                                # only added lines
                                $kind    = 'add';
                                @columns = ($column->('new', @add));
                        } else {
                                # both present: treat it as a change
                                $kind    = 'chg';
                                @columns = ($column->('old', @rem),
                                            $column->('new', @add));
                        }
                        print join '',
                                "<div class=\"chunk_block $kind\">",
                                @columns,
                                '</div>';
                        @rem = @add = ();
                }

                # the sentinel (or any entry without text) ends the loop
                last unless $line;

                # file the line under its accumulator
                if ($class eq 'rem') {
                        push @rem, $line;
                } elsif ($class eq 'add') {
                        push @add, $line;
                } elsif ($class eq 'ctx') {
                        push @ctx, $line;
                }
        }
}
4968
# Print the "patchset" part of a diff view: every patch read from $fd,
# wrapped in HTML and tied to its raw difftree entry.
#
# $fd           - filehandle the patch output is read from
# $diff_style   - 'sidebyside' selects the two-column layout (ordinary
#                 diffs only); any other value gives the inline layout
# $difftree     - arrayref of raw difftree lines matching the patches
# $hash         - not used by this function
# @hash_parents - parent commit ids; more than one means combined diff
#
# Each patch is wrapped in <div class="patch" id="patchN">, N being the
# 1-based position of its raw difftree entry; further patches belonging to
# the same entry get <div class="patch cont"> instead.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $raw_idx = 0;      # index of the current entry of @$difftree
        my $patches_seen = 0; # how many patches were printed so far
        my ($cur_line, $raw_info, $post_name);
        my (%from, %to);
        my @pending;          # lines of the current chunk, side-by-side only

        print "<div class=\"patchset\">\n";

        # throw away everything in front of the first patch
        while ($cur_line = <$fd>) {
                chomp $cur_line;

                last if $cur_line =~ m/^diff /;
        }

 PATCH:
        while ($cur_line) {

                # extract the post-image name from the "git diff" header line
                if ($cur_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # the first capture is the pre-image name; not needed
                        $post_name = unquote($2);
                        $post_name =~ s!^b/!!;
                } elsif ($cur_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # the first capture just tells 'cc' from 'combined'
                        $post_name = unquote($2);
                } else {
                        $post_name = undef;
                }

                # does this patch still belong to the raw line handled last?
                if (is_patch_split($raw_info, { 'to_file' => $post_name })) {
                        # yes: it continues a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # no: move on to the next raw line, unless this is
                        # the very first patch
                        $raw_idx++ if defined $raw_info;

                        $raw_info = parsed_difftree_line($difftree->[$raw_idx]);

                        # compact combined diff may leave patches out; emit a
                        # simplified entry for each raw line that is skipped
                        # until the one for the current patch is reached
                        if ($is_combined) {
                                while ($post_name ne $raw_info->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($raw_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($raw_info, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $raw_idx++;
                                        $patches_seen++;

                                        last if $raw_idx > $#$difftree;
                                        $raw_info = parsed_difftree_line($difftree->[$raw_idx]);
                                }
                        }

                        # refreshes the %from and %to hashes
                        parse_from_to_diffinfo($raw_info, \%from, \%to, @hash_parents);

                        # first patch for this raw line; @$difftree is indexed
                        # from 0 while patches are numbered from 1
                        my $anchor_no = $raw_idx + 1;
                        print "<div class=\"patch\" id=\"patch$anchor_no\">\n";
                }

                # "git diff" header; $cur_line is chomp-ed and starts with "diff "
                $patches_seen++;
                print format_git_diff_header_line($cur_line, $raw_info,
                                                  \%from, \%to);

                # extended diff header: everything up to "--- " or next patch
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($cur_line = <$fd>) {
                        chomp $cur_line;

                        last EXTENDED_HEADER if $cur_line =~ m/^--- |^diff /;

                        print format_extended_diff_header_line($cur_line, $raw_info,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # input ended inside the header: close the patch and stop
                if (! $cur_line) {
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                # patch without a body: the next patch starts right here
                next PATCH if $cur_line =~ m/^diff /;

                # from-file/to-file header: $cur_line holds the "---" line,
                # the "+++" line is expected to follow directly
                my $from_header = $cur_line;
                $cur_line = <$fd>;
                chomp $cur_line;

                print format_diff_from_to_header($from_header, $cur_line,
                                                 $raw_info, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
                while ($cur_line = <$fd>) {
                        chomp $cur_line;

                        next PATCH if $cur_line =~ m/^diff /;

                        my ($class, $html) = process_diff_line($cur_line, \%from, \%to);
                        my $css = $class ? "diff $class" : "diff";
                        $html = "<div class=\"$css\">$html</div>\n";

                        # default 'inline' style, unknown styles, and every
                        # combined diff: print the line as it comes
                        if ($diff_style ne 'sidebyside' || $is_combined) {
                                print $html;
                                next;
                        }

                        # side-by-side: gather lines, flushing what was
                        # collected whenever a new chunk begins
                        if ($class eq 'chunk_header') {
                                print_sidebyside_diff_chunk(@pending);
                                @pending = ();
                        }
                        push @pending, [ $class, $html ];
                }

        } continue {
                # flush what is left of the last side-by-side chunk
                if (@pending) {
                        print_sidebyside_diff_chunk(@pending);
                        @pending = ();
                }
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch
        # simplification, the patchset might be empty while there still are
        # raw lines which were not handled
        ++$raw_idx if $patches_seen > 0;
        while ($raw_idx < @$difftree) {
                $raw_info = parsed_difftree_line($difftree->[$raw_idx]);

                # anchor for the "patch" links of the difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($raw_idx+1) ."\">\n" .
                      format_diff_cc_simplified($raw_info, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patches_seen++;
                ++$raw_idx;
        }

        if ($patches_seen == 0) {
                my $notice = @hash_parents > 1
                        ? "Trivial merge"
                        : "No differences found";
                print "<div class=\"diff nodifferences\">$notice</div>\n";
        }

        print "</div>\n"; # class="patchset"
}
5139
5140# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5141
# Complete the per-project info (age, description, owner, ctags, category)
# for every project of the given list and return the projects which could
# be filled in.
#
# $projlist - arrayref of project hashrefs; each needs a 'path' entry
#
# A project for which git_get_last_activity() returns nothing is left out
# of the result.  Values already present under 'descr', 'owner' and
# 'category' are kept as they are.
# NOTE: the hashes referenced from $projlist are modified in place, but no
# entry is removed from $projlist itself
sub fill_project_list_info {
        my ($projlist) = @_;
        my @filled;

        my $show_ctags = gitweb_check_feature('ctags');

        foreach my $project (@$projlist) {
                # no activity info: do not show the project
                my @activity = git_get_last_activity($project->{'path'});
                next unless @activity;
                @{$project}{'age', 'age_string'} = @activity;

                unless (defined $project->{'descr'}) {
                        my $full_descr = to_utf8(
                                git_get_project_description($project->{'path'}) || "");
                        $project->{'descr_long'} = $full_descr;
                        $project->{'descr'} =
                                chop_str($full_descr, $projects_list_description_width, 5);
                }

                unless (defined $project->{'owner'}) {
                        $project->{'owner'} =
                                git_get_project_owner("$project->{'path'}") || "";
                }

                $project->{'ctags'} = git_get_project_ctags($project->{'path'})
                        if $show_ctags;

                if ($projects_list_group_categories && !defined $project->{'category'}) {
                        my $category = git_get_project_category($project->{'path'})
                                || $project_list_default_category;
                        $project->{'category'} = to_utf8($category);
                }

                push @filled, $project;
        }

        return @filled;
}
5181
# Sort projects according to $order, which is one of 'project', 'descr',
# 'owner' (compared as strings) or 'age' (compared as a number).
# $projlist is a reference to array of project hashes; it is not modified.
# Returns the sorted list, or the projects in their original order when
# $order is not one of the known values.
sub sort_projects_list {
	my ($projlist, $order) = @_;

	# sort order => [ project hash key to compare, true if numeric ]
	my %sort_by = (
		project => ['path',       0],
		descr   => ['descr_long', 0],
		owner   => ['owner',      0],
		age     => ['age',        1],
	);
	my $spec = $sort_by{$order};
	return @$projlist unless defined $spec;

	my ($key, $numeric) = @$spec;
	my $compare = $numeric
		? sub { $_[0] <=> $_[1] }
		: sub { $_[0] cmp $_[1] };
	my @sorted = sort { $compare->($a->{$key}, $b->{$key}) } @$projlist;

	return @sorted;
}
5202
# Group projects by their 'category' field.
# Takes reference to array of project hashes and optional $from / $to
# indices (inclusive); $from defaults to 0, $to defaults (and is clamped)
# to the last index.  Returns hash mapping category name to reference to
# array of projects of that category, in list order; in scalar context
# returns reference to that hash instead.
sub build_projlist_by_category {
	my ($projlist, $from, $to) = @_;
	my $last = $#$projlist;

	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	my %by_category;
	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];
		push @{ $by_category{ $pr->{'category'} } }, $pr;
	}

	return \%by_category unless wantarray;
	return %by_category;
}
5219
# Print 'sort by' <th> element as generated by format_sort_th(); all
# arguments ($name, $order, $header) are handed over unchanged
sub print_sort_th {
	my @th_args = @_;
	print format_sort_th(@th_args);
}
5225
# Return 'sort by' <th> element for column $name.  $order is the sort
# order currently in effect and $header the column title (defaults to
# $name with first letter uppercased).  The title is plain text for the
# active order, otherwise a replay link that selects 'order' => $name.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header = ucfirst($name) unless $header;

	# currently selected order: nothing to link to
	return "<th>$header</th>\n" if ($order eq $name);

	my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
	                         -class => "header"}, $header);
	return "<th>" . $sort_link . "</th>\n";
}
5242
# Print rows of the projects list table for entries $from..$to (inclusive)
# of $projlist (reference to array of project hashes), alternating "dark"
# and "light" row classes.  $from defaults to 0, $to defaults (and is
# clamped) to the last index.  If $check_forks is true, each row starts
# with a cell holding a "+" marker for projects that have 'forks' set.
sub git_project_list_rows {
	my ($projlist, $from, $to, $check_forks) = @_;
	my $last = $#$projlist;

	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		if ($check_forks) {
			my $marker = "";
			if ($pr->{'forks'}) {
				my $nforks = scalar @{$pr->{'forks'}};
				# the marker is a link only if there are forks to list
				$marker = ($nforks > 0)
					? $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
					           -title => "$nforks forks"}, "+")
					: $cgi->span({-title => "$nforks forks"}, "+");
			}
			print "<td>" . $marker . "</td>\n";
		}

		# project name, description and owner cells
		print "<td>" .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		               -class => "list"}, esc_html($pr->{'path'})) .
		      "</td>\n";
		print "<td>" .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		               -class => "list", -title => $pr->{'descr_long'}},
		              esc_html($pr->{'descr'})) .
		      "</td>\n";
		print "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";

		# last change cell
		my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
		print "<td class=\"". age_class($pr->{'age'}) . "\">" . $age_text . "</td>\n";

		# per-project action links; 'forks' only for projects having them
		my @actions = qw(summary shortlog log tree);
		push @actions, "forks" if $pr->{'forks'};
		my @links;
		foreach my $action (@actions) {
			my $link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>$action)}, $action);
			push @links, $link;
		}
		print "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
}
5291
# Print the projects list: optional tag cloud, then a table with optional
# header row of 'sort by' links, project rows (grouped by category when
# $projects_list_group_categories is set) and optional $extra row.
#   $projlist  - reference to array of project hashes (the array is
#                copied, not modified)
#   $order     - sort order, defaults to $default_projects_order
#   $from, $to - inclusive window of the filtered list to display;
#                $from defaults to 0, $to defaults (and is clamped) to
#                the last index
#   $extra     - HTML for an additional last row, if defined
#   $no_header - if true, the header row is not printed
# The list is filtered by global $searchtext and, when ctags are enabled,
# by the 'by_tag' CGI parameter; fork detection is off while filtering.
sub git_project_list_body {
	# actually uses global variable $project
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
	my @projects = @$projlist;

	my $check_forks = gitweb_check_feature('forks');
	my $show_ctags  = gitweb_check_feature('ctags');
	my $tagfilter = $show_ctags ? $cgi->param('by_tag') : undef;
	$check_forks = undef
		if ($tagfilter || $searchtext);

	# filtering out forks before filling info allows to do less work
	@projects = filter_forks_from_projects_list(\@projects)
		if ($check_forks);
	@projects = fill_project_list_info(\@projects);
	# searching projects require filling to be run before it
	@projects = search_projects_list(\@projects,
	                                 'searchtext' => $searchtext,
	                                 'tagfilter'  => $tagfilter)
		if ($tagfilter || $searchtext);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects if (!defined $to || $#projects < $to);

	# short circuit
	if ($from > $to) {
		print "<center>\n".
		      "<b>No such projects found</b><br />\n".
		      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
		      "</center>\n<br />\n";
		return;
	}

	@projects = sort_projects_list(\@projects, $order);

	if ($show_ctags) {
		my $ctags = git_gather_all_ctags(\@projects);
		my $cloud = git_populate_project_tagcloud($ctags);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	unless ($no_header) {
		print "<tr>\n";
		if ($check_forks) {
			print "<th></th>\n";
		}
		print_sort_th('project', $order, 'Project');
		print_sort_th('descr', $order, 'Description');
		print_sort_th('owner', $order, 'Owner');
		print_sort_th('age', $order, 'Last Change');
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}

	if ($projects_list_group_categories) {
		# only display categories with projects in the $from-$to window
		@projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
		# @projects now holds just the window, indexed from 0, so it has
		# to be grouped as a whole; applying $from/$to a second time would
		# drop rows (all of them on later pages)
		my %categories = build_projlist_by_category(\@projects);
		foreach my $cat (sort keys %categories) {
			unless ($cat eq "") {
				print "<tr>\n";
				if ($check_forks) {
					print "<td></td>\n";
				}
				print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
				print "</tr>\n";
			}

			git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
		}
	} else {
		git_project_list_rows(\@projects, $from, $to, $check_forks);
	}

	if (defined $extra) {
		print "<tr>\n";
		if ($check_forks) {
			print "<td></td>\n";
		}
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5378
# Print body of 'log' view: for each commit in $commitlist (reference to
# array of parsed commit hashes) from index $from to $to (inclusive)
# prints header, navigation links, authorship and the commit message;
# empty entries are skipped.  $from defaults to 0, $to defaults (and is
# clamped) to the last index.  $refs is handed to format_ref_marker();
# $extra, if true, is printed in a "page_nav" div below the commits.
sub git_log_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# start at $from, like the other *_body subs, instead of always at 0
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
5417
# Print 'shortlog' table: one row (date, author, subject, links) for each
# commit in $commitlist (reference to array of parsed commit hashes) from
# index $from to $to (inclusive).  $from defaults to 0, $to defaults (and
# is clamped) to the last index.  $refs is handed to format_ref_marker();
# $extra, if defined, is printed in an additional last row.
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;
	my $last = $#{$commitlist};

	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	print "<table class=\"shortlog\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 10) . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		# links cell: fixed links, then snapshot links if there are any
		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
		my $commitdiff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
		my @links = ($commit_link, $commitdiff_link, $tree_link);
		my $snapshot_links = format_snapshot_links($commit);
		push @links, $snapshot_links if defined $snapshot_links;

		print "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5461
# Print 'history' table for $file_name: one row (date, author, subject,
# links) for each commit in $commitlist (reference to array of parsed
# commit hashes) from index $from to $to (inclusive); empty entries are
# skipped.  $from defaults to 0, $to defaults (and is clamped) to the
# last index.  $ftype ('blob' or 'tree') is used as action of the first
# link; for blobs whose hash in given commit differs from $file_hash
# a "diff to current" link is added.  $extra, if defined, is printed in
# an additional last row.
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;
	my $last = $#{$commitlist};

	$from = 0 unless defined $from;
	$to = $last if (!defined $to || $last < $to);

	print "<table class=\"history\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		# skipped entries do not take part in row colour alternation
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# shortlog uses format_author_html('td', \%co, 10)
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 15, 3) . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $type_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
		my $commitdiff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $type_link . " | " . $commitdiff_link;

		if ($ftype eq 'blob') {
			my $blob_current = $file_hash;
			my $blob_parent  = git_get_hash_by_path($commit, $file_name);
			# link to blobdiff only if file contents differ from current
			my $differs = defined $blob_current && defined $blob_parent &&
			              $blob_current ne $blob_parent;
			if ($differs) {
				my $diff_link =
					$cgi->a({-href => href(action=>"blobdiff",
					                       hash=>$blob_current, hash_parent=>$blob_parent,
					                       hash_base=>$hash_base, hash_parent_base=>$commit,
					                       file_name=>$file_name)},
					        "diff to current");
				print " | " . $diff_link;
			}
		}
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5521
# Print 'tags' table: one row (age, name, subject, "tag" self link, links
# depending on type of tagged object) for each entry of $taglist
# (reference to array of tag hashes) from index $from to $to (inclusive).
# $from defaults to 0, $to defaults (and is clamped) to the last index.
# $extra, if defined, is printed in an additional last row.
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;
	my $last = $#{$taglist};

	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	print "<table class=\"tags\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %tag = %{$taglist->[$idx]};
		my $comment = $tag{'subject'};
		my $comment_short;
		$comment_short = chop_str($comment, 30, 5)
			if defined $comment;

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# age cell stays empty for entries without 'age'
		if (defined $tag{'age'}) {
			print "<td><i>$tag{'age'}</i></td>\n";
		} else {
			print "<td></td>\n";
		}

		# name cell, followed by opening of subject cell
		print "<td>" .
		      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
		               -class => "list name"}, esc_html($tag{'name'})) .
		      "</td>\n" .
		      "<td>";
		print format_subject_html($comment, $comment_short,
		                          href(action=>"tag", hash=>$tag{'id'}))
			if defined $comment;

		# only entries of type "tag" get link to 'tag' view
		print "</td>\n" .
		      "<td class=\"selflink\">";
		print(($tag{'type'} eq "tag")
		      ? $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag")
		      : "&nbsp;");

		my $reftype = $tag{'reftype'};
		print "</td>\n" .
		      "<td class=\"link\">" . " | " .
		      $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'})}, $reftype);
		if ($reftype eq "commit") {
			print " | " . $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog") .
			      " | " . $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
		} elsif ($reftype eq "blob") {
			print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		print "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5584
# Print 'heads' table: one row (age, name, links) for each entry of
# $headlist (reference to array of ref hashes) from index $from to $to
# (inclusive).  $from defaults to 0, $to defaults (and is clamped) to the
# last index.  The row whose 'id' equals $head gets "current_head" class;
# $head may be undefined, in which case no row is marked.  $extra, if
# defined, is printed in an additional last row.
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

	print "<table class=\"heads\">\n";
	my $alternate = 1;
	for (my $i = $from; $i <= $to; $i++) {
		my $entry = $headlist->[$i];
		my %ref = %$entry;
		# guard against undefined $head to avoid 'uninitialized' warnings
		my $curr = defined $head && $ref{'id'} eq $head;
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td><i>$ref{'age'}</i></td>\n" .
		      ($curr ? "<td class=\"current_head\">" : "<td>") .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
		               -class => "list name"},esc_html($ref{'name'})) .
		      "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
		      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
		      "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5622
# Display a single remote block: table with URL(s) of the remote followed
# by the list of its heads.
#   $remote - name of the remote (used for the "..." link)
#   $rdata  - hash reference with 'heads' (array reference) and optional
#             'fetch' and 'push' URLs
#   $limit  - if defined, at most that many heads are requested from
#             git_heads_body(), with "..." link when there are more
#   $head   - passed to git_heads_body() to mark the current head
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# a single "URL" row only if both URLs are set and the same;
		# $push may be undefined here, so check before comparing
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	# link to the full list of heads when not all of them are shown
	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
5656
# Display a list of remote names with the respective fetch and push URLs.
#   $remotedata - hash reference: remote name => hash reference with
#                 optional 'fetch' and 'push' URLs
#   $limit      - if true and lower than the number of remotes, only the
#                 first $limit remotes (sorted by name) are shown,
#                 followed by a "..." link to the 'remotes' view
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	$#remotes = $limit - 1 if $limited;

	# iterate over the list itself: looping on the truth of a shifted
	# name would stop early at a remote called "0"
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# URL that is not configured is shown as plain text
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
5700
# Display remote heads grouped by remote; if $limit is set and there are
# more than $limit remotes, display only the list of remote names instead.
# $remotedata is hash reference keyed by remote name, $head is passed on
# to git_remote_block().
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;

	# too many remotes: names only
	return git_remotes_list($remotedata, $limit)
		if ($limit and $limit < keys %$remotedata);

	fill_remote_heads($remotedata);
	while (my ($remote, $rdata) = each %$remotedata) {
		# section body is generated on demand by git_print_section()
		my $print_block = sub {
			git_remote_block($remote, $rdata, $limit, $head);
		};
		git_print_section({-class=>"remote", -id=>$remote},
			["remotes", $remote, $remote], $print_block);
	}
}
5717
# Print page with results of searching commits by message, author or
# committer (selected by global $searchtype) for global $searchtext.
# %co, passed as a list, is the parsed commit the search starts from
# (its 'tree' and 'title' are used in the page header).  Results are
# paged by global $page, 100 per page; one entry more is requested so
# that its presence tells whether there is a next page.
sub git_search_message {
	my %co = @_;

	# option of git selecting what is matched against $searchtext
	my %grep_option = (
		commit    => "--grep=",
		author    => "--author=",
		committer => "--committer=",
	);
	my $greptype = $grep_option{$searchtype};
	$greptype .= $searchtext;
	my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
	my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
	                               $greptype, '--regexp-ignore-case',
	                               $match_mode);

	# navigation entries are plain text unless there is a page to go to
	my ($first, $prev, $next) = ("first", "prev", "next");
	if ($page > 0) {
		$first = $cgi->a({-href => href(-replay=>1, page=>undef)},
		                 "first");
		$prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
		                  -accesskey => "p", -title => "Alt-p"}, "prev");
	}
	my $next_link = '';
	if (@commitlist > 100) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
		$next = $next_link;
	}
	my $paging_nav = join(" &sdot; ", $first, $prev, $next);

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);
	if ($page == 0 && !@commitlist) {
		print "<p>No match.</p>\n";
	} else {
		git_search_grep_body(\@commitlist, 0, 99, $next_link);
	}

	git_footer_html();
}
5767
# Print page with results of searching for changes that add or remove
# global $searchtext: runs "git log --raw -S$searchtext" (with
# --pickaxe-regex if $search_use_regexp is set) and prints a table with
# one row per commit, listing links to the files reported for it.
# %co, passed as a list, is the parsed commit used for the page header.
sub git_search_changes {
	my %co = @_;

	local $/ = "\n";
	open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
		'--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
		($search_use_regexp ? '--pickaxe-regex' : ())
			or die_error(500, "Open git-log failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"pickaxe search\">\n";
	my $dark = 1;
	# from now on %co holds the commit whose row is being printed
	undef %co;

	# closes files cell of the current commit and prints its links cell
	my $end_commit_row = sub {
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
		              "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
		                             hash_base=>$co{'id'})},
		              "tree") .
		      "</td>\n" .
		      "</tr>\n";
	};

 LINE:
	while (my $line = <$fd>) {
		chomp $line;
		next LINE unless $line;

		my %set = parse_difftree_raw_line($line);
		if (defined $set{'commit'}) {
			# next commit starts: finish previous one, open new row
			$end_commit_row->() if %co;

			print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
			$dark = !$dark;

			%co = parse_commit($set{'commit'});
			my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
			print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
			      "<td><i>$author</i></td>\n" .
			      "<td>" .
			      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
			              -class => "list subject"},
			              chop_and_escape_str($co{'title'}, 50) . "<br/>");
			next LINE;
		}

		# raw diff line: entries with all-zero 'to_id' are not linked
		next LINE unless defined $set{'to_id'};
		next LINE if ($set{'to_id'} =~ m/^0{40}$/);

		print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
		                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
		              -class => "list"},
		              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
		      "<br/>\n";
	}
	close $fd;

	# finish last commit
	$end_commit_row->() if %co;

	print "</table>\n";

	git_footer_html();
}
5850
# Search the file contents of a commit's tree ("grep" search) and print the
# matching lines as an HTML page.
#
# Parameters: the parsed commit as a flat key/value list (%co); its 'tree',
# 'id' and 'title' entries are used here.
#
# Runs "git grep -n -z" for $searchtext on $co{'tree'}, as a fixed string or,
# when $search_use_regexp is set, as a case-insensitive extended regexp.
# Matches are grouped into one table row per file, each matching line linking
# to that line in the blob view.  The listing is trimmed once more than 1000
# lines of git-grep output have been read.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $lastfile = '';
        # Link to the blob view of the file currently being listed.  It has to
        # live outside the loop: it is only computed when a new file starts,
        # but every later match in the same file needs it for its line link.
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                last if ($matches++ > 1000);
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        # with -z the fields are separated by NUL characters
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                        $file =~ s/^$co{'tree'}://;
                }
                if ($file ne $lastfile) {
                        # close the row of the previous file, if there was one
                        # (compare against '' so that a file named "0" works)
                        print "</td></tr>\n" if ($lastfile ne '');
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # highlight the matched part of the line
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile ne '') {
                print "</td></tr>\n";
                if ($matches > 1000) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
5927
# Print the result table of a commit message search.
#
# $commitlist is a reference to an array of parsed commits (hash refs), of
# which entries $from..$to are shown; $from defaults to 0 and $to is clamped
# to the last index of the list.  For each commit, the lines of its
# 'comment' that match $search_regexp are listed with the match highlighted.
# If $extra is defined, it is printed in a final row spanning three columns.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        my $last_index = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last_index if (!defined $to || $last_index < $to);

        print "<table class=\"commit_search\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row ^= 1;
                print "<tr class=\"$row_class\">\n" .
                      "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                # one output line per matching line of the commit message
                foreach my $line (@{$co{'comment'}}) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($before, $hit, $after) = ($1, $2, $3);

                        # shorten the match, then share what is left of an
                        # 80-character budget between both sides (max 30 each)
                        $hit = chop_str($hit, 70, 5, 'center');
                        my $context = int((80 - length($hit))/2);
                        $context = 30 if ($context > 30);
                        $before = esc_html(chop_str($before, $context, 10, 'left'));
                        $after  = esc_html(chop_str($after,  $context, 10, 'right'));
                        $hit    = esc_html($hit);

                        print "$before<span class=\"match\">$hit</span>$after<br />";
                }

                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree") .
                      "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5987
5988## ======================================================================
5989## ======================================================================
5990## actions
5991
# "project_list" action: print the page listing the projects.
#
# The optional 'order' input parameter selects the sort order and must be
# exactly one of none, project, descr, owner or age; anything else is
# rejected with a 400 error.  The list is obtained from
# git_get_projects_list() for $project_filter; a 404 error is reported when
# it is empty.  If $home_text names an existing file, its contents are
# included above the project search form.
sub git_project_list {
        my $order = $input_params{'order'};
        # the pattern is anchored so that only the exact keywords are accepted,
        # not arbitrary strings that merely contain one of them
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        # start_form() is the documented name of this method; the older
        # startform() spelling is a legacy alias
        print $cgi->start_form(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6017
# "forks" action: print the list of forks of the current project.
#
# The optional 'order' input parameter selects the sort order and must be
# exactly one of none, project, descr, owner or age; anything else is
# rejected with a 400 error.  Forks are looked up by passing the project
# path, with a trailing ".git" removed, to git_get_projects_list() as the
# filter; a 404 error is reported when nothing is found.
sub git_forks {
        my $order = $input_params{'order'};
        # the pattern is anchored so that only the exact keywords are accepted,
        # not arbitrary strings that merely contain one of them
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6037
# "project_index" action: print the list of projects as plain text, one
# "<path> <owner>" line per project.
#
# Both fields are percent-encoded, except that '/' is kept as is and a
# space is written as '+'.  A 404 error is reported when there are no
# projects.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                # look up the owner only if the project list did not provide one
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                # work on copies, the project entries themselves stay unencoded
                my @fields = ($pr->{'path'}, $pr->{'owner'});
                foreach my $field (@fields) {
                        # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$fields[0] $fields[1]\n";
        }
}
6064
# "summary" action: print the overview page of the current project.
#
# The page consists of a metadata table (description, owner, time of the
# last change, repository URLs and, if the 'ctags' feature is on, the
# content tag cloud), the project's README.html (unless $prevent_xss is
# set), and then short lists of recent commits, tags, heads, remotes (if
# the 'remote_heads' feature is on) and forks (if the 'forks' feature is
# on).  The lists are cut short, with a "..." link to the full view.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata;
        %remotedata = git_get_remotes_list() if $remote_heads;

        my @forklist;
        if (gitweb_check_feature('forks')) {
                # find forks of a project
                (my $filter = $project) =~ s/\.git$//;
                @forklist = git_get_projects_list($filter);
                # filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        # metadata table
        print "<div class=\"title\">&nbsp;</div>\n" .
              "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        unless (@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        # only the first URL row gets the "URL" label
        my $url_tag = "URL";
        foreach my $git_url (grep { $_ } @url_list) {
                print format_repo_url($url_tag, $git_url);
                $url_tag = "";
        }

        # Tag cloud
        if (gitweb_check_feature('ctags')) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme) {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file($readme);
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $#commitlist > 15 ?
                                  $cgi->a({-href => href(action=>"shortlog")}, "...") :
                                  undef);
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $#taglist > 15 ?
                              $cgi->a({-href => href(action=>"tags")}, "...") :
                              undef);
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $#headlist > 15 ?
                               $cgi->a({-href => href(action=>"heads")}, "...") :
                               undef);
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $#forklist > 15 ?
                                      $cgi->a({-href => href(action=>"forks")}, "...") :
                                      undef,
                                      'no_header');
        }

        git_footer_html();
}
6180
# "tag" action: print the page for the tag object given by $hash.
#
# Shows the tagged object (linked to the view named after its type), the
# tagger information if the parsed tag has an 'author', and the lines of
# the tag message.  Reports a 404 error if parse_tag() returns nothing.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both cells of the "object" row link to the tagged object
        my $object_href = href(action=>$tag{'type'}, hash=>$tag{'object'});
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $cgi->a({-class => "list", -href => $object_href},
                               $tag{'object'}) . "</td>\n" .
              "<td class=\"link\">" . $cgi->a({-href => $object_href},
                                              $tag{'type'}) . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if (defined($tag{'author'}));
        print "</table>\n\n" .
              "</div>\n" .
              "<div class=\"page_body\">";

        # tag message, one line at a time
        foreach my $line (@{$tag{'comment'}}) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6215
# Common implementation of the blame views.
#
# The optional first argument selects the format:
#   'porcelain'   (default) page built here from "git blame -p" output
#   'incremental' page with the plain file contents and a progress bar;
#                 the page itself states that it requires JavaScript
#   'data'        "git blame --incremental" output sent as text/plain
# A 'porcelain' request with a true 'js' CGI parameter is handled as
# 'incremental'.
#
# Uses the globals $file_name, $hash_base and $hash, filling in $hash_base
# (from the project's HEAD) and $hash (from the path) when they are not set.
# Reports an error via die_error() if the 'blame' feature is disabled, no
# file name was given, the commit or file cannot be found, or the object is
# not a blob.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # NOTE: the string is used as a pattern here, so this is a
                # substring match on "blob", not an equality test
                if ($ftype !~ "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        # open the git command whose output this format is built from
        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                # a failure is reported in-band, the headers are already sent
                close $fd
                        or print "ERROR $!\n";

                # trailer line: 'END', plus the elapsed time and the number of
                # git commands run if the 'timed' feature is enabled
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        # navigation links: blob | blame (other variant) | history | HEAD
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        # row classes; the porcelain view moves to the next one at the start
        # of each group of lines
        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                # one row per line of the file, with empty commit and line
                # number links
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        # read the lines following the header from the same
                        # handle, up to and including the TAB-prefixed line
                        # that holds the contents; the first value seen for a
                        # key is kept in the commit's metainfo
                        my $data;
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # only the first line of a group has a group size
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        # the commit cell is printed once per group and spans
                        # all rows of the group
                        if ($group_size) {
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                # with two or more rows, also show the
                                # upper-case initials of the author name
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent
                        # commit if one is known, else of this commit
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6447
# "blame" action: blame view in the default format of git_blame_common().
sub git_blame {
        return git_blame_common();
}
6451
# "blame_incremental" action: git_blame_common() in 'incremental' format.
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6455
# "blame_data" action: git_blame_common() in 'data' format.
sub git_blame_data {
        return git_blame_common('data');
}
6459
# "tags" action: print the page navigation and header for the project,
# followed by the table of all its tags, if there are any.
sub git_tags {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head_hash,undef,$head_hash,
                           format_ref_views('tags'));
        git_print_header_div('summary', $project);

        my @all_tags = git_get_tags_list();
        git_tags_body(\@all_tags) if @all_tags;

        git_footer_html();
}
6472
# "heads" action: print the page navigation and header for the project,
# followed by the table of all its heads, if there are any.
sub git_heads {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head_hash,undef,$head_hash,
                           format_ref_views('heads'));
        git_print_header_div('summary', $project);

        my @all_heads = git_get_heads_list();
        git_heads_body(\@all_heads, $head_hash) if @all_heads;

        git_footer_html();
}
6485
# "remotes" action; serves both the view of a single remote (when the 'hash'
# input parameter names one) and the list of all the remotes.
#
# Reports a 403 error if the 'remote_heads' feature is disabled, a 500 error
# if the remote information cannot be read, and a 404 error if there is
# nothing to show.
sub git_remotes {
        if (!gitweb_check_feature('remote_heads')) {
                die_error(403, "Remote heads view is disabled");
        }

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        if (!defined $remotedata) {
                die_error(500, "Unable to get remote information");
        }

        if (!%$remotedata) {
                my $message = defined $remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $message);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        my $current_view = $remote ? '' : 'remotes';
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($current_view));

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                # list of all the remotes
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        } else {
                # single remote
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }

        git_footer_html();
}
6518
# "blob_plain" action: send the raw contents of a blob to the client.
#
# The optional argument is a content type; the type actually sent is what
# blob_contenttype() returns for the blob, the file name and that argument.
# The blob is given by $hash; if that is not defined it is looked up from
# $file_name in $hash_base (or in the project's HEAD).  Reports a 400 error
# if neither a hash nor a file name is available, a 404 error if the file
# cannot be found and a 500 error if git-cat-file cannot be started.
#
# With $prevent_xss set, text/* and textual */*+xml blobs are served as
# text/plain, and everything but text and a few image types is sent as an
# attachment.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # the name goes into a quoted-string header parameter, so a double
        # quote or backslash in it has to be backslash-escaped
        (my $quoted_save_as = $save_as) =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain
        # (and also textual <type>/<subtype>+xml, e.g. image/svg+xml; the
        # subtype before "+xml" may be more than one letter long)
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                # keep whatever followed the media type, e.g. the charset
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $quoted_save_as . '"');
        # send the blob unmodified: read it in one go, write it as raw bytes
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6580
# Show the 'blob' view: one file rendered as an HTML page.
#
# The blob is taken from the global $hash; when that is not set it is looked
# up by $file_name in $hash_base (or, failing that, in the project's HEAD).
# Content that is neither text/* nor a gif/png/jpeg image and that tests as
# binary is handed over to git_blob_plain() instead.  Images are shown with
# an <img> tag pointing at the 'blob_plain' view; everything else is printed
# line by line with line-number anchors.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        # $file_name may be missing when the blob was requested by hash only
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat " .
                                  (defined $file_name ? $file_name : '') .
                                  ", $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        # when a syntax is recognized, read the blob through the highlighter
        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable commit: print an empty navigation bar and the bare hash
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                # the URL is an attribute value, so escape it like the
                # line-number links below do
                print qq! src="! .
                      esc_attr(href(action=>"blob_plain", hash=>$hash,
                                    hash_base=>$hash_base, file_name=>$file_name)) .
                      qq!" />\n!;
        } else {
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # highlighter output is only sanitized; plain text is HTML-escaped
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
6673
# Show the 'tree' view: the listing of one directory.
#
# The tree comes from the global $hash.  Without it, the tree is found via
# $file_name inside $hash_base ("HEAD" when unset), or $hash_base itself is
# used when there is no file name either.
sub git_tree {
        $hash_base = "HEAD" unless defined $hash_base;
        unless (defined $hash) {
                $hash = defined $file_name
                        ? git_get_hash_by_path($hash_base, $file_name, "tree")
                        : $hash_base;
        }
        defined($hash)
                or die_error(404, "No such tree");

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        # "ls-tree -z" terminates every record with NUL, so read NUL-delimited
        my @entries = ();
        {
                local $/ = "\0";
                my @size_opt = $show_sizes ? ('-l') : ();
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        @size_opt, @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                while (my $entry = <$fd>) {
                        chomp $entry;
                        push @entries, $entry;
                }
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history");
                        push @views_nav,
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                # FIXME: Should be available when we have no hash base as well.
                push @views_nav, $snapshot_links
                        if defined $snapshot_links;
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base is not a commit we can parse: forget it and
                # print an empty navigation bar with the bare tree hash
                undef $hash_base;
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                # make sure a non-empty base directory ends with a slash
                $basedir .= '/'
                        if $basedir ne '' && $basedir !~ m!/\z!;
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n" .
              "<table class=\"tree\">\n";

        # rows alternate between the "dark" and "light" classes
        my $alternate = 1;

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                my $row_class = $alternate ? 'dark' : 'light';
                print "<tr class=\"$row_class\">\n";
                $alternate ^= 1;

                # strip the last path component; the top level has no name
                (my $up = $file_name) =~ s!/?[^/]+$!!;
                undef $up unless $up;

                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">' .
                      $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..") .
                      "</td>\n" .
                      "<td class=\"link\"></td>\n" .
                      "\n" .
                      "</tr>\n" if 0;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n" .
                      "<td class=\"link\"></td>\n" .
                      "</tr>\n";
        }

        foreach my $entry (@entries) {
                my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

                my $row_class = $alternate ? 'dark' : 'light';
                print "<tr class=\"$row_class\">\n";
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
6783
# Build the base name used for a snapshot of $hash in $project.
#
# The result is "<project>-<version>".  In list context the same string is
# returned twice (the caller in git_snapshot() takes them as name and
# prefix); in scalar context it is returned once.
sub snapshot_name {
        my ($project, $hash) = @_;

        # project part:
        #   path/to/project.git  -> project
        #   path/to/project/.git -> project
        my $proj_part = to_utf8($project);
        $proj_part =~ s,([^/])/*\.git$,$1,;
        $proj_part = basename($proj_part);
        # sanitize name
        $proj_part =~ s/[[:cntrl:]]/?/g;

        # version part
        my $ver_part = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                my $full_hash = git_get_full_hash($project, $hash);
                if ($full_hash =~ /^$hash/ && length($hash) > 7) {
                        $ver_part = git_get_short_hash($project, $hash);
                }
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $ver_part = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                $ver_part = $1
                        if $hash =~ m!^refs/(?:heads|remotes)/(.*)$!;
                $ver_part = join '-', $ver_part, git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $ver_part =~ tr{/}{.};

        # name = project-version_string
        my $snapshot = join '-', $proj_part, $ver_part;

        return $snapshot unless wantarray;
        return ($snapshot, $snapshot);
}
6820
# Send an archive of the tree-ish in the global $hash ('snapshot' action).
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  The request is rejected
# when snapshots are off, the format is malformed, unknown, disabled or not
# listed in @snapshot_fmts, or when the object is missing or is a blob.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # peel tags so that the type of the underlying object is checked
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the archiver before any output is produced, so that a
        # failure here is reported by die_error() instead of being appended
        # to an already sent "200 OK" header.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # the name goes into a quoted string: backslash-escape '"' and '\'
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # copy the archive in fixed-size chunks rather than loading all of
        # it (split at newline bytes) into memory first
        while (read($fd, my $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6868
# Common implementation of the log-like views.
#
# Parameters:
#   $fmt_name   - name of the view, passed to format_paging_nav() and
#                 git_print_page_nav()
#   $body_subr  - code reference that prints the list of commits
#   $base       - revision to start from (defaults to the project's HEAD)
#   $parent     - optional; when given, "$parent..$base" is listed
#   $file_name  - optional; limits the log to this path
#   $file_hash  - optional; object id of that path (looked up in the listed
#                 commits when not given)
#
# Up to 101 commits are requested per page (offset 100 * $page); rows 0..99
# are handed to $body_subr, and a 101st commit means there is a next page.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                for (my $i = 0; $i < @commitlist; $i++) {
                        $file_hash = git_get_hash_by_path($commitlist[$i]{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # Take the feature value in list context, the way git_commitdiff()
        # does; a scalar-context call is not guaranteed to yield the
        # configured limit.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # a negative limit means "no limit"
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project);
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6942
# 'log' view: git_log_generic() with git_log_body() as the printer, starting
# at the global $hash and optionally limited by the global $hash_parent.
sub git_log {
        my @log_args = ('log', \&git_log_body, $hash, $hash_parent);
        git_log_generic(@log_args);
}
6947
# Show the 'commit' view for the global $hash (falling back to $hash_base,
# then to "HEAD"): navigation, a header table with authorship, commit, tree
# and parent rows, the commit message, and the list of changed files.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav .= '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav .=
                        '(parent: ' .
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$parent)},
                                esc_html(substr($parent, 0, 7))) .
                        ')';
        } else {
                # merge commit
                $formats_nav .=
                        '(merge: ' .
                        join(' ', map {
                                $cgi->a({-href => href(action=>"commit",
                                                       hash=>$_)},
                                        esc_html(substr($_, 0, 7)));
                        } @$parents ) .
                        ')';
        }
        # the "patch" link is offered only for commits with at most one parent
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # a commit without a parent is compared using diff-tree's --root
        if (!defined $parent) {
                $parent = "--root";
        }
        my @difftree;
        # for merges, '-c' is passed in place of a single parent
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        @difftree = map { chomp; $_ } <$fd>;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        # the title links to 'commitdiff' when there is a parent, and to the
        # commit's 'tree' otherwise
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
        } else {
                git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
        }
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";
        # tree row: the tree id and a "tree" link, plus snapshot links if any
        print "<tr>" .
              "<td>tree</td>" .
              "<td class=\"sha1\">" .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                       class => "list"}, $co{'tree'}) .
              "</td>" .
              "<td class=\"link\">" .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        if (defined $snapshot_links) {
                print " | " . $snapshot_links;
        }
        print "</td>" .
              "</tr>\n";

        # one row per parent, with links to that commit and to the diff
        # between it and this commit
        foreach my $par (@$parents) {
                print "<tr>" .
                      "<td>parent</td>" .
                      "<td class=\"sha1\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$par),
                               class => "list"}, $par) .
                      "</td>" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
                      "</td>" .
                      "</tr>\n";
        }
        print "</table>".
              "</div>\n";

        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7061
# 'object' action: find out what kind of object the request names and
# redirect (302) to the view named after that type.
sub git_object {
        # object is defined by:
        # - hash or hash_base alone
        # - hash_base and file_name
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # the read yields undef when the command printed nothing
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");
                # never redirect to an undefined action
                defined $type
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7108
# Show the diff of a single file between $hash_parent_base and $hash_base.
#
# The optional argument selects the output format: 'html' (default) or
# 'plain'.  The file is identified by $file_name or, when that is missing,
# by a 40-digit blob id in $hash that is searched for among the changes.
# Requests that do not provide both $hash_base and $hash_parent_base are
# rejected.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status, like every other die_error() call here
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # The name is placed inside a quoted string in the header, so
                # backslash-escape '"' and '\' the same way git_snapshot() does.
                (my $patch_name = "$file_name") =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # up to and including the "+++" line, replace object ids used
                # as a/ and b/ names with the real file names; the rest of
                # the patch is copied verbatim
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7243
# 'blobdiff_plain' action: git_blobdiff() with the 'plain' output format.
sub git_blobdiff_plain {
        my $format = 'plain';
        git_blobdiff($format);
}
7247
# Navigation fragment for switching between diff styles.
#
# It is meant to be appended to navigation that already exists, which is why
# every item is prefixed with a separator: the result reads "| foo | bar"
# rather than just "foo | bar".  The current style ($diff_style, 'inline' by
# default) is shown as plain text, the other ones as links.  Nothing is
# returned for combined diffs ($is_combined true).
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # style keys in display order, and the label shown for each
        my @style_order = ('inline', 'sidebyside');
        my %label_of = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my @items;
        foreach my $style (@style_order) {
                push @items,
                        ($style eq $diff_style
                                ? $label_of{$style}
                                : $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                          $label_of{$style}));
        }

        return join '', map { " | ".$_ } @items;
}
7268
# Show the changes introduced by a commit, or the difference between
# two commits, in one of three output formats.
#
# Named parameters (flat key/value list):
#   -format => 'html' (default), 'plain' or 'patch'; anything else is
#              rejected with a 400 error
#   -single => for 'patch' without a usable $hash_parent: true limits
#              the output to a single patch ('-1')
#
# Works on the request globals $hash, $hash_base, $hash_parent and
# %input_params; $hash and $hash_parent may be assigned here.  The page
# (or plain text) is printed directly, errors go through die_error().
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                # the "patch" link is offered only for non-merge commits
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is a parent at all
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                # '-c' and '--cc' are diff-tree options (one of them is chosen
                # above for merges), not revisions, so they must never be used
                # as the start of a "<from>..<to>" range for git-format-patch
                my $have_range_start = $hash_parent &&
                        $hash_parent ne '-c' && $hash_parent ne '--cc';
                if ($have_range_start) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                # mail-like pseudo-header in front of the diff
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit second commit, diff against the commit's parents
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # slurp the rest of the command output in one go
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7496
# Commitdiff as plain text: git_commitdiff() with its -format
# parameter set to 'plain'.
sub git_commitdiff_plain {
        return git_commitdiff(-format => 'plain');
}
7500
# format-patch-style patches
#
# Single patch: git_commitdiff() in 'patch' format with -single set.
sub git_patch {
        return git_commitdiff(
                -format => 'patch',
                -single => 1,
        );
}
7505
# Patch series: git_commitdiff() in 'patch' format, without -single.
sub git_patches {
        return git_commitdiff(-format => 'patch');
}
7509
# History view: hands the 'history' name, the git_history_body()
# renderer and the request globals $hash_base, $hash_parent_base,
# $file_name and $hash over to git_log_generic().
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
}
7515
# Entry point of the search action.
#
# Fills in defaults for the request globals $searchtype ('commit'),
# $hash (head of $project) and $page (0), checks that the requested
# kind of search is enabled, and then passes the parsed commit on to
# the routine implementing that kind of search.  Every failed check is
# reported through die_error().
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');
        if ($searchtype eq 'pickaxe') {
                # pickaxe may take all resources of your box and run for several minutes
                # with every query - so decide by yourself how public you make this feature
                die_error(403, "Pickaxe search is disabled")
                        unless gitweb_check_feature('pickaxe');
        }
        if ($searchtype eq 'grep') {
                # grep search might be potentially CPU-intensive, too
                die_error(403, "Grep search is disabled")
                        unless gitweb_check_feature('grep');
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => routine that performs it
        my %search_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );

        my $do_search = $search_for{$searchtype};
        if (defined $do_search) {
                $do_search->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
7560
# Print the help page describing the available search types.
#
# The 'commit', 'author' and 'committer' entries are always printed;
# the 'grep' and 'pickaxe' entries only when gitweb_check_feature()
# reports the corresponding feature as enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general introduction and the always available 'commit' search
        print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        if (gitweb_check_feature('grep')) {
                print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        if (gitweb_check_feature('pickaxe')) {
                print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7604
# Shortlog view: hands the 'shortlog' name, the git_shortlog_body()
# renderer and the request globals $hash and $hash_parent over to
# git_log_generic().
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
7609
7610## ......................................................................
7611## feeds (RSS, Atom; OPML)
7612
# Print a web feed (RSS 2.0 or Atom) with recent commits.
#
# Parameter:
#   format - 'rss' or 'atom'; a false value means 'atom', any other
#            value is rejected with a 400 error
#
# Uses the request globals $hash (falls back to 'HEAD') and $file_name
# to select the commits.  Sends the HTTP header itself, answers
# If-Modified-Since with "304 Not Modified" when one of the optional
# date parsing modules is available and nothing is newer, and skips the
# body for HEAD requests.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                %latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # both date parsers are optional; without either of them
                        # $since stays undefined and the full feed is sent
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title is assembled from configuration and request data and
        # ends up as XML element content, so it has to be escaped
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (!defined $descr) {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        $descr = esc_html($descr);
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for (my $i = 0; $i <= $#commitlist; $i++) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                # commit message; printed without modifying the stored lines
                print "<pre>\n";
                foreach my $line (@{$co{'comment'}}) {
                        print esc_html($line) . "\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
7868
# RSS feed: git_feed() with 'rss' as the feed format.
sub git_rss {
        return git_feed('rss');
}
7872
# Atom feed: git_feed() with 'atom' as the feed format.
sub git_atom {
        return git_feed('atom');
}
7876
# Print an OPML document with one RSS feed outline per project.
#
# The project list comes from git_get_projects_list(), limited by
# $project_filter; an empty list is reported as a 404 error.  Projects
# without a head commit, or whose head commit cannot be parsed, are
# left out.  Note that the global $git_dir is reassigned for every
# project that has a head.
sub git_opml {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found")
                unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # mention the subdirectory in the title only when a filter is in effect
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";

        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $proj (@projects) {
                my $proj_path = $proj->{'path'};

                my $head = git_get_head_hash($proj_path);
                next unless defined $head;

                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next unless %co;

                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }

        print <<XML;
</outline>
</body>
</opml>
XML
}