gitweb / gitweb.perlon commit gitweb: Use descriptive names in esc_html_hl_regions() (ce61fb9)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
  23our $t0 = [ gettimeofday() ];
  24our $number_of_git_cmds = 0;
  25
  26BEGIN {
  27        CGI->compile() if $ENV{'MOD_PERL'};
  28}
  29
  30our $version = "++GIT_VERSION++";
  31
  our ($my_url, $my_uri, $base_url, $path_info, $home_link);

  # Compute the URL-related package globals for the current request:
  # $my_url, $my_uri, $base_url, $path_info and $home_link.
  # The request is read through the package global $cgi and through the
  # PATH_INFO and SCRIPT_NAME environment variables.
  sub evaluate_uri {
          our $cgi; # package global used as the CGI request object

          $my_url = $cgi->url();
          $my_uri = $cgi->url(-absolute => 1);

          # Base URL for relative URLs in gitweb ($logo, $favicon, ...); it is
          # needed and used only for URLs with nonempty PATH_INFO.
          $base_url = $my_url;

          # When the script is used as DirectoryIndex, the URL does not name
          # the script file and $cgi->url() fails to strip PATH_INFO, so it
          # is stripped here.  $path_info is global because it is also used
          # later on.
          #
          # In that setup $my_url is not the full script URL.  That is wanted,
          # because generated links should keep implying the script name when
          # the request did not spell it out, but it also means that $my_url
          # cannot serve as the base URL.  So whenever PATH_INFO had to be
          # stripped, the base URL is rebuilt from the server base URL and
          # SCRIPT_NAME.
          $path_info = decode_utf8($ENV{"PATH_INFO"});
          if ($path_info) {
                  my $trailing_path_info = qr/\Q$path_info\E$/;
                  # $my_uri is only touched when $my_url actually ended in
                  # PATH_INFO (short-circuit).
                  my $stripped_both = $my_url =~ s/$trailing_path_info//
                                   && $my_uri =~ s/$trailing_path_info//;
                  if ($stripped_both && defined $ENV{'SCRIPT_NAME'}) {
                          $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                  }
          }

          # target of the home link on top of all pages
          $home_link = $my_uri || "/";
  }
  67
  68# core git executable to use
  69# this can just be "git" if your webserver has a sensible PATH
  70our $GIT = "++GIT_BINDIR++/git";
  71
  72# absolute fs-path which will be prepended to the project path
  73#our $projectroot = "/pub/scm";
  74our $projectroot = "++GITWEB_PROJECTROOT++";
  75
  76# fs traversing limit for getting project list
  77# the number is relative to the projectroot
  78our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  79
  80# string of the home link on top of all pages
  81our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  82
  83# name of your site or organization to appear in page titles
  84# replace this with something more descriptive for clearer bookmarks
  85our $site_name = "++GITWEB_SITENAME++"
  86                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  87
  88# html snippet to include in the <head> section of each page
  89our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
  90# filename of html text to include at top of each page
  91our $site_header = "++GITWEB_SITE_HEADER++";
  92# html text to include at home page
  93our $home_text = "++GITWEB_HOMETEXT++";
  94# filename of html text to include at bottom of each page
  95our $site_footer = "++GITWEB_SITE_FOOTER++";
  96
  97# URI of stylesheets
  98our @stylesheets = ("++GITWEB_CSS++");
  99# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 100our $stylesheet = undef;
 101# URI of GIT logo (72x27 size)
 102our $logo = "++GITWEB_LOGO++";
 103# URI of GIT favicon, assumed to be image/png type
 104our $favicon = "++GITWEB_FAVICON++";
 105# URI of gitweb.js (JavaScript code for gitweb)
 106our $javascript = "++GITWEB_JS++";
 107
 108# URI and label (title) of GIT logo link
 109#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 110#our $logo_label = "git documentation";
 111our $logo_url = "http://git-scm.com/";
 112our $logo_label = "git homepage";
 113
 114# source of projects list
 115our $projects_list = "++GITWEB_LIST++";
 116
 117# the width (in characters) of the projects list "Description" column
 118our $projects_list_description_width = 25;
 119
 120# group projects by category on the projects list
 121# (enabled if this variable evaluates to true)
 122our $projects_list_group_categories = 0;
 123
 124# default category if none specified
 125# (leave the empty string for no category)
 126our $project_list_default_category = "";
 127
 128# default order of projects list
 129# valid values are none, project, descr, owner, and age
 130our $default_projects_order = "project";
 131
 132# show repository only if this file exists
 133# (only effective if this variable evaluates to true)
 134our $export_ok = "++GITWEB_EXPORT_OK++";
 135
 136# show repository only if this subroutine returns true
 137# when given the path to the project, for example:
 138#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 139our $export_auth_hook = undef;
 140
 141# only allow viewing of repositories also shown on the overview page
 142our $strict_export = "++GITWEB_STRICT_EXPORT++";
 143
 144# list of git base URLs used for URL to where fetch project from,
 145# i.e. full URL is "$git_base_url/$project"
 146our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 147
 148# default blob_plain mimetype and default charset for text/plain blob
 149our $default_blob_plain_mimetype = 'text/plain';
 150our $default_text_plain_charset  = undef;
 151
 152# file to use for guessing MIME types before trying /etc/mime.types
 153# (relative to the current git repository)
 154our $mimetypes_file = undef;
 155
 156# assume this charset if line contains non-UTF-8 characters;
 157# it should be a valid encoding (see Encode::Supported(3pm) for the list),
 158# for which encoding all byte sequences are valid, for example
 159# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 160# could be even 'utf-8' for the old behavior)
 161our $fallback_encoding = 'latin1';
 162
 163# rename detection options for git-diff and git-diff-tree
 164# - default is '-M', with the cost proportional to
 165#   (number of removed files) * (number of new files).
 166# - more costly is '-C' (which implies '-M'), with the cost proportional to
 167#   (number of changed files + number of removed files) * (number of new files)
 168# - even more costly is '-C', '--find-copies-harder' with cost
 169#   (number of files in the original tree) * (number of new files)
 170# - one might want to include '-B' option, e.g. '-B', '-M'
 171our @diff_opts = ('-M'); # taken from git_commit
 172
 173# Disables features that would allow repository owners to inject script into
 174# the gitweb domain.
 175our $prevent_xss = 0;
 176
 177# Path to the highlight executable to use (must be the one from
 178# http://www.andre-simon.de due to assumptions about parameters and output).
 179# Useful if highlight is not installed on your webserver's PATH.
 180# [Default: highlight]
 181our $highlight_bin = "++HIGHLIGHT_BIN++";
 182
 183# information about snapshot formats that gitweb is capable of serving
 184our %known_snapshot_formats = (
 185        # name => {
 186        #       'display' => display name,
 187        #       'type' => mime type,
 188        #       'suffix' => filename suffix,
 189        #       'format' => --format for git-archive,
 190        #       'compressor' => [compressor command and arguments]
 191        #                       (array reference, optional)
 192        #       'disabled' => boolean (optional)}
 193        #
 194        'tgz' => {
 195                'display' => 'tar.gz',
 196                'type' => 'application/x-gzip',
 197                'suffix' => '.tar.gz',
 198                'format' => 'tar',
 199                'compressor' => ['gzip', '-n']},
 200
 201        'tbz2' => {
 202                'display' => 'tar.bz2',
 203                'type' => 'application/x-bzip2',
 204                'suffix' => '.tar.bz2',
 205                'format' => 'tar',
 206                'compressor' => ['bzip2']},
 207
 208        'txz' => {
 209                'display' => 'tar.xz',
 210                'type' => 'application/x-xz',
 211                'suffix' => '.tar.xz',
 212                'format' => 'tar',
 213                'compressor' => ['xz'],
 214                'disabled' => 1},
 215
 216        'zip' => {
 217                'display' => 'zip',
 218                'type' => 'application/x-zip',
 219                'suffix' => '.zip',
 220                'format' => 'zip'},
 221);
 222
 223# Aliases so we understand old gitweb.snapshot values in repository
 224# configuration.
 225our %known_snapshot_format_aliases = (
 226        'gzip'  => 'tgz',
 227        'bzip2' => 'tbz2',
 228        'xz'    => 'txz',
 229
 230        # backward compatibility: legacy gitweb config support
 231        'x-gzip' => undef, 'gz' => undef,
 232        'x-bzip2' => undef, 'bz2' => undef,
 233        'x-zip' => undef, '' => undef,
 234);
 235
 236# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 237# are changed, it may be appropriate to change these values too via
 238# $GITWEB_CONFIG.
 239our %avatar_size = (
 240        'default' => 16,
 241        'double'  => 32
 242);
 243
 244# Used to set the maximum load that we will still respond to gitweb queries.
 245# If the server load exceeds this value then return a "503 server busy" error.
 246# If gitweb cannot determine the server load, it is taken to be 0.
 247# Leave it undefined (or set to 'undef') to turn off load checking.
 248our $maxload = 300;
 249
 250# configuration for 'highlight' (http://www.andre-simon.de/)
 251# match by basename
 252our %highlight_basename = (
 253        #'Program' => 'py',
 254        #'Library' => 'py',
 255        'SConstruct' => 'py', # SCons equivalent of Makefile
 256        'Makefile' => 'make',
 257);
 258# match by extension
 259our %highlight_ext = (
 260        # main extensions, defining name of syntax;
 261        # see files in /usr/share/highlight/langDefs/ directory
 262        map { $_ => $_ }
 263                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
 264        # alternate extensions, see /etc/highlight/filetypes.conf
 265        'h' => 'c',
 266        map { $_ => 'sh'  } qw(bash zsh ksh),
 267        map { $_ => 'cpp' } qw(cxx c++ cc),
 268        map { $_ => 'php' } qw(php3 php4 php5 phps),
 269        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
 270        map { $_ => 'make'} qw(mak mk),
 271        map { $_ => 'xml' } qw(xhtml html htm),
 272);
 273
 274# You define site-wide feature defaults here; override them with
 275# $GITWEB_CONFIG as necessary.
 276our %feature = (
 277        # feature => {
 278        #       'sub' => feature-sub (subroutine),
 279        #       'override' => allow-override (boolean),
 280        #       'default' => [ default options...] (array reference)}
 281        #
 282        # if feature is overridable (it means that allow-override has true value),
 283        # then feature-sub will be called with default options as parameters;
 284        # return value of feature-sub indicates if to enable specified feature
 285        #
 286        # if there is no 'sub' key (no feature-sub), then feature cannot be
 287        # overridden
 288        #
 289        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 290        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 291        # is enabled
 292
 293        # Enable the 'blame' blob view, showing the last commit that modified
 294        # each line in the file. This can be very CPU-intensive.
 295
 296        # To enable system wide have in $GITWEB_CONFIG
 297        # $feature{'blame'}{'default'} = [1];
 298        # To have project specific config enable override in $GITWEB_CONFIG
 299        # $feature{'blame'}{'override'} = 1;
 300        # and in project config gitweb.blame = 0|1;
 301        'blame' => {
 302                'sub' => sub { feature_bool('blame', @_) },
 303                'override' => 0,
 304                'default' => [0]},
 305
 306        # Enable the 'snapshot' link, providing a compressed archive of any
 307        # tree. This can potentially generate high traffic if you have a large
 308        # project.
 309
 310        # Value is a list of formats defined in %known_snapshot_formats that
 311        # you wish to offer.
 312        # To disable system wide have in $GITWEB_CONFIG
 313        # $feature{'snapshot'}{'default'} = [];
 314        # To have project specific config enable override in $GITWEB_CONFIG
 315        # $feature{'snapshot'}{'override'} = 1;
 316        # and in project config, a comma-separated list of formats or "none"
 317        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 318        'snapshot' => {
 319                'sub' => \&feature_snapshot,
 320                'override' => 0,
 321                'default' => ['tgz']},
 322
 323        # Enable text search, which will list the commits which match author,
 324        # committer or commit text to a given string.  Enabled by default.
 325        # Project specific override is not supported.
 326        #
 327        # Note that this controls all search features, which means that if
 328        # it is disabled, then 'grep' and 'pickaxe' search would also be
 329        # disabled.
 330        'search' => {
 331                'override' => 0,
 332                'default' => [1]},
 333
 334        # Enable grep search, which will list the files in currently selected
 335        # tree containing the given string. Enabled by default. This can be
 336        # potentially CPU-intensive, of course.
 337        # Note that you need to have 'search' feature enabled too.
 338
 339        # To enable system wide have in $GITWEB_CONFIG
 340        # $feature{'grep'}{'default'} = [1];
 341        # To have project specific config enable override in $GITWEB_CONFIG
 342        # $feature{'grep'}{'override'} = 1;
 343        # and in project config gitweb.grep = 0|1;
 344        'grep' => {
 345                'sub' => sub { feature_bool('grep', @_) },
 346                'override' => 0,
 347                'default' => [1]},
 348
 349        # Enable the pickaxe search, which will list the commits that modified
 350        # a given string in a file. This can be a practical and much faster
 351        # alternative to 'blame', but it is still potentially CPU-intensive.
 352        # Note that you need to have 'search' feature enabled too.
 353
 354        # To enable system wide have in $GITWEB_CONFIG
 355        # $feature{'pickaxe'}{'default'} = [1];
 356        # To have project specific config enable override in $GITWEB_CONFIG
 357        # $feature{'pickaxe'}{'override'} = 1;
 358        # and in project config gitweb.pickaxe = 0|1;
 359        'pickaxe' => {
 360                'sub' => sub { feature_bool('pickaxe', @_) },
 361                'override' => 0,
 362                'default' => [1]},
 363
 364        # Enable showing the size of blobs in a 'tree' view, in a separate
 365        # column, similar to what 'ls -l' does.  This costs a bit of I/O.
 366
 367        # To disable system wide have in $GITWEB_CONFIG
 368        # $feature{'show-sizes'}{'default'} = [0];
 369        # To have project specific config enable override in $GITWEB_CONFIG
 370        # $feature{'show-sizes'}{'override'} = 1;
 371        # and in project config gitweb.showsizes = 0|1;
 372        'show-sizes' => {
 373                'sub' => sub { feature_bool('showsizes', @_) },
 374                'override' => 0,
 375                'default' => [1]},
 376
 377        # Make gitweb use an alternative format of the URLs which can be
 378        # more readable and natural-looking: project name is embedded
 379        # directly in the path and the query string contains other
 380        # auxiliary information. All gitweb installations recognize
 381        # URL in either format; this configures in which formats gitweb
 382        # generates links.
 383
 384        # To enable system wide have in $GITWEB_CONFIG
 385        # $feature{'pathinfo'}{'default'} = [1];
 386        # Project specific override is not supported.
 387
 388        # Note that you will need to change the default location of CSS,
 389        # favicon, logo and possibly other files to an absolute URL. Also,
 390        # if gitweb.cgi serves as your indexfile, you will need to force
 391        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 392        'pathinfo' => {
 393                'override' => 0,
 394                'default' => [0]},
 395
 396        # Make gitweb consider projects in project root subdirectories
 397        # to be forks of existing projects. Given project $projname.git,
 398        # projects matching $projname/*.git will not be shown in the main
 399        # projects list, instead a '+' mark will be added to $projname
 400        # there and a 'forks' view will be enabled for the project, listing
 401        # all the forks. If project list is taken from a file, forks have
 402        # to be listed after the main project.
 403
 404        # To enable system wide have in $GITWEB_CONFIG
 405        # $feature{'forks'}{'default'} = [1];
 406        # Project specific override is not supported.
 407        'forks' => {
 408                'override' => 0,
 409                'default' => [0]},
 410
 411        # Insert custom links to the action bar of all project pages.
 412        # This enables you mainly to link to third-party scripts integrating
 413        # into gitweb; e.g. git-browser for graphical history representation
 414        # or custom web-based repository administration interface.
 415
 416        # The 'default' value consists of a list of triplets in the form
 417        # (label, link, position) where position is the label after which
 418        # to insert the link and link is a format string where %n expands
 419        # to the project name, %f to the project path within the filesystem,
 420        # %h to the current hash (h gitweb parameter) and %b to the current
 421        # hash base (hb gitweb parameter); %% expands to %.
 422
 423        # To enable system wide have in $GITWEB_CONFIG e.g.
 424        # $feature{'actions'}{'default'} = [('graphiclog',
 425        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 426        # Project specific override is not supported.
 427        'actions' => {
 428                'override' => 0,
 429                'default' => []},
 430
 431        # Allow gitweb to scan the project content tags of a project repository,
 432        # and display the popular Web 2.0-ish "tag cloud" near the projects
 433        # list.  Note that this is something COMPLETELY different from the
 434        # normal Git tags.
 435
 436        # gitweb by itself can show existing tags, but it does not handle
 437        # tagging itself; you need to do it externally, outside gitweb.
 438        # The format is described in git_get_project_ctags() subroutine.
 439        # You may want to install the HTML::TagCloud Perl module to get
 440        # a pretty tag cloud instead of just a list of tags.
 441
 442        # To enable system wide have in $GITWEB_CONFIG
 443        # $feature{'ctags'}{'default'} = [1];
 444        # Project specific override is not supported.
 445
 446        # In the future whether ctags editing is enabled might depend
 447        # on the value, but using 1 should always mean no editing of ctags.
 448        'ctags' => {
 449                'override' => 0,
 450                'default' => [0]},
 451
 452        # The maximum number of patches in a patchset generated in patch
 453        # view. Set this to 0 or undef to disable patch view, or to a
 454        # negative number to remove any limit.
 455
 456        # To disable system wide have in $GITWEB_CONFIG
 457        # $feature{'patches'}{'default'} = [0];
 458        # To have project specific config enable override in $GITWEB_CONFIG
 459        # $feature{'patches'}{'override'} = 1;
 460        # and in project config gitweb.patches = 0|n;
 461        # where n is the maximum number of patches allowed in a patchset.
 462        'patches' => {
 463                'sub' => \&feature_patches,
 464                'override' => 0,
 465                'default' => [16]},
 466
 467        # Avatar support. When this feature is enabled, views such as
 468        # shortlog or commit will display an avatar associated with
 469        # the email of the committer(s) and/or author(s).
 470
 471        # Currently available providers are gravatar and picon.
 472        # If an unknown provider is specified, the feature is disabled.
 473
 474        # Gravatar depends on Digest::MD5.
 475        # Picon currently relies on the indiana.edu database.
 476
 477        # To enable system wide have in $GITWEB_CONFIG
 478        # $feature{'avatar'}{'default'} = ['<provider>'];
 479        # where <provider> is either gravatar or picon.
 480        # To have project specific config enable override in $GITWEB_CONFIG
 481        # $feature{'avatar'}{'override'} = 1;
 482        # and in project config gitweb.avatar = <provider>;
 483        'avatar' => {
 484                'sub' => \&feature_avatar,
 485                'override' => 0,
 486                'default' => ['']},
 487
 488        # Enable displaying how much time and how many git commands
 489        # it took to generate and display each page.  Disabled by default.
 490        # Project specific override is not supported.
 491        'timed' => {
 492                'override' => 0,
 493                'default' => [0]},
 494
 495        # Enable turning some links into links to actions which require
 496        # JavaScript to run (like 'blame_incremental').  Not enabled by
 497        # default.  Project specific override is currently not supported.
 498        'javascript-actions' => {
 499                'override' => 0,
 500                'default' => [0]},
 501
 502        # Enable and configure ability to change common timezone for dates
 503        # in gitweb output via JavaScript.  Enabled by default.
 504        # Project specific override is not supported.
 505        'javascript-timezone' => {
 506                'override' => 0,
 507                'default' => [
 508                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 509                                     # or undef to turn off this feature
 510                        'gitweb_tz', # name of cookie where to store selected timezone
 511                        'datetime',  # CSS class used to mark up dates for manipulation
 512                ]},
 513
 514        # Syntax highlighting support. This is based on Daniel Svensson's
 515        # and Sham Chukoury's work in gitweb-xmms2.git.
 516        # It requires the 'highlight' program present in $PATH,
 517        # and therefore is disabled by default.
 518
 519        # To enable system wide have in $GITWEB_CONFIG
 520        # $feature{'highlight'}{'default'} = [1];
 521
 522        'highlight' => {
 523                'sub' => sub { feature_bool('highlight', @_) },
 524                'override' => 0,
 525                'default' => [0]},
 526
 527        # Enable displaying of remote heads in the heads list
 528
 529        # To enable system wide have in $GITWEB_CONFIG
 530        # $feature{'remote_heads'}{'default'} = [1];
 531        # To have project specific config enable override in $GITWEB_CONFIG
 532        # $feature{'remote_heads'}{'override'} = 1;
 533        # and in project config gitweb.remote_heads = 0|1;
 534        'remote_heads' => {
 535                'sub' => sub { feature_bool('remote_heads', @_) },
 536                'override' => 0,
 537                'default' => [0]},
 538);
 539
 # Return the list of values configured for feature $name.
 #
 # - unknown feature: returns nothing (empty list / undef)
 # - 'override' is false, or no project is selected ($git_dir undefined):
 #   returns the site-wide 'default' list
 # - 'override' is true but the feature has no 'sub': warns and returns
 #   the 'default' list
 # - otherwise: returns whatever the feature's 'sub' returns when called
 #   with the 'default' list as its arguments
 sub gitweb_get_feature {
         my ($name) = @_;
         return unless exists $feature{$name};

         my $settings = $feature{$name};
         my $handler  = $settings->{'sub'};
         my @defaults = @{ $settings->{'default'} };

         # project specific override is possible only if we have project
         our $git_dir; # global variable, declared later
         return @defaults
                 unless $settings->{'override'} && defined $git_dir;

         unless (defined $handler) {
                 warn "feature $name is not overridable";
                 return @defaults;
         }
         return $handler->(@defaults);
 }
 558
 # Convenience wrapper around gitweb_get_feature() that yields only the
 # first value of the feature, which is handy for on/off features:
 #
 #   my $bool_feat = gitweb_check_feature('bool_feat');
 #   gitweb_check_feature('bool_feat') or somecode;
 #
 # is shorthand for
 #
 #   my ($bool_feat) = gitweb_get_feature('bool_feat');
 #   (gitweb_get_feature('bool_feat'))[0] or somecode;
 #
 sub gitweb_check_feature {
         my @values = gitweb_get_feature(@_);
         # a list slice keeps "no values" as an empty list in list context
         return (@values)[0];
 }
 573
 574
 # Feature-sub for on/off features that a project may override.
 #
 # Parameters:
 #   $key     - name of the project configuration key to look up
 #   $default - site-wide default, used when the project has no setting
 #
 # Asks git_get_project_config() for $key with the '--bool' type and
 # returns a one-element list:
 #   ($default) when no value is reported (undef),
 #   (1)        when the value is 'true',
 #   (0)        for 'false' and for any other string.
 #
 # The last case used to fall off the end of an if/elsif chain, leaving
 # the return value implicit; it evaluated as false, so returning an
 # explicit (0) keeps the effective result while making it well defined.
 sub feature_bool {
         my ($key, $default) = @_;
         my ($val) = git_get_project_config($key, '--bool');

         return ($default) unless defined $val;
         return (1) if $val eq 'true';
         return (0);
 }
 587
 # Feature-sub for 'snapshot'.
 #
 # Takes the site-wide default format list as arguments.  If the project
 # configuration has a true 'snapshot' value it replaces the defaults:
 # the literal 'none' means no formats at all, anything else is split on
 # commas and/or whitespace.  Otherwise the defaults are returned as is.
 sub feature_snapshot {
         my @defaults = @_;

         my ($configured) = git_get_project_config('snapshot');
         return @defaults unless $configured;

         my @chosen;
         @chosen = split(/\s*[,\s]\s*/, $configured)
                 if $configured ne 'none';
         return @chosen;
 }
 599
 # Feature-sub for 'patches'.
 #
 # Returns whatever git_get_project_config('patches', '--int') yields
 # when that is a non-empty list; otherwise returns the first argument
 # (the site-wide default) as a one-element list.
 sub feature_patches {
         my ($default_limit) = @_;

         my @configured = git_get_project_config('patches', '--int');
         return @configured ? @configured : ($default_limit);
 }
 609
 # Feature-sub for 'avatar'.
 #
 # Returns the project's 'avatar' configuration if
 # git_get_project_config() reports anything, and the arguments
 # (the site-wide defaults) otherwise.
 sub feature_avatar {
         my @defaults = @_;

         my @configured = git_get_project_config('avatar');
         return @defaults unless @configured;
         return @configured;
 }
 615
 # Tell whether directory $dir has a usable HEAD.
 #
 # Testing HEAD with -e alone is fragile: in a repository that was
 # initialized a long time ago HEAD can be a symlink, and after
 # pack-refs and pruning its target may no longer exist.  A HEAD symlink
 # pointing below refs/heads/ is therefore accepted even when dangling.
 sub check_head_link {
         my ($dir) = @_;
         my $head = "$dir/HEAD";

         return 1 if -e $head;
         return -l $head && readlink($head) =~ m{^refs/heads/};
 }
 625
 # Decide whether the repository in $dir may be shown.  All of these
 # must hold, checked in this order (later checks are skipped once one
 # fails):
 #   - check_head_link($dir) is true
 #   - if $export_ok is set, the file "$dir/$export_ok" exists
 #   - if $export_auth_hook is set, calling it with $dir returns true
 sub check_export_ok {
         my ($dir) = @_;
         return check_head_link($dir)
             && ($export_ok        ? -e "$dir/$export_ok"      : 1)
             && ($export_auth_hook ? $export_auth_hook->($dir) : 1);
 }
 632
 # Normalize a list of requested snapshot formats.
 #
 # Each name found in %known_snapshot_format_aliases is replaced by its
 # canonical name (alternate names kept for backward compatibility).
 # Formats are then dropped when they are unknown to
 # %known_snapshot_formats or marked 'disabled' there.  Returns the
 # surviving canonical names in their original order.
 #
 # Legacy aliases map to undef.  They, and any undefined input, are
 # discarded before being used as a hash key, which would otherwise
 # raise an "uninitialized value" warning.
 sub filter_snapshot_fmts {
         my @supported;

         for my $requested (@_) {
                 next unless defined $requested;

                 my $fmt = exists $known_snapshot_format_aliases{$requested}
                         ? $known_snapshot_format_aliases{$requested}
                         : $requested;

                 next unless defined $fmt
                          && exists $known_snapshot_formats{$fmt};
                 next if $known_snapshot_formats{$fmt}{'disabled'};

                 push @supported, $fmt;
         }

         return @supported;
 }
 645
 646# If it is set to a code reference, that code is run once per request,
 647# which allows updating configuration that changes with each request
 648# while the rest of the config file is run only once.
 649#
 650# Otherwise, if it is false then gitweb would process config file only once;
 651# if it is true then gitweb config would be run for each request.
 652our $per_request_config = 1;
 653
 # Run the gitweb config file named by the first argument.
 #
 # Returns 1 when the file exists and was executed, and nothing (false)
 # when the name is undefined or the file does not exist; that is a
 # recoverable situation, so calls can be chained to use the first file
 # that exists.  Dies with the parser's message when executing the file
 # leaves an error in $@, since that cannot be recovered from.
 sub read_config_file {
         my ($filename) = @_;
         return if !defined $filename || !-e $filename;

         do $filename;
         # die if there are errors parsing config file
         die $@ if $@;
         return 1;
 }
 669
 our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);

 # Work out the three config file names and run the config files.
 # Each name comes from the environment variable of the same name,
 # falling back to the built-in value.
 sub evaluate_gitweb_config {
         $GITWEB_CONFIG        = $ENV{'GITWEB_CONFIG'}        || "++GITWEB_CONFIG++";
         $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
         $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

         # Protect against duplicated file names, so that no config file is
         # read twice.  Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM
         # is ever used, so a duplicate between those two does not matter.
         for my $specific ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                 # the loop variable aliases the global, so this blanks it
                 $specific = "" if $specific eq $GITWEB_CONFIG_COMMON;
         }

         # Common system-wide settings for convenience.  They can be
         # overridden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
         read_config_file($GITWEB_CONFIG_COMMON);

         # Use the first config file that exists: the per-instance
         # GITWEB_CONFIG if present, otherwise GITWEB_CONFIG_SYSTEM.
         return if read_config_file($GITWEB_CONFIG);
         return read_config_file($GITWEB_CONFIG_SYSTEM);
 }
 691
 # Get the load average of the system, to compare against $maxload.
 #
 # Currently this needs '/proc/loadavg'.  Returns the first field of
 # that file, or 0 when the file is absent, cannot be opened, yields no
 # data, or its first field is empty or zero; 0 means no load checking.
 sub get_loadavg {
         # additional checks for load average should go here for things
         # that don't export /proc/loadavg
         return 0 unless -e '/proc/loadavg';

         open my $fd, '<', '/proc/loadavg'
                 or return 0;
         my $line = <$fd>;
         close $fd;

         # An empty read would hand undef to split and trigger a warning.
         return 0 unless defined $line;

         # The first three columns are the load averages over the last one,
         # five and 15 minutes.  The fourth column shows the number of
         # currently running processes and the total number of processes in
         # the m/n format.  The last column is the last process ID used.
         my ($one_minute_load) = split(/\s+/, $line);
         return $one_minute_load || 0;
 }
 713
 # version of the core git binary
 our $git_version;

 # Run "$GIT --version" and store the text following "git version " in
 # $git_version, or "unknown" when the output does not have that form.
 # The run is counted in $number_of_git_cmds.
 sub evaluate_git_version {
         my $version_output = qx("$GIT" --version);
         if ($version_output =~ m/git version (.*)$/) {
                 $git_version = $1;
         } else {
                 $git_version = "unknown";
         }
         $number_of_git_cmds++;
 }
 720
 # Report a 503 error through die_error() when load checking is enabled
 # ($maxload is defined) and get_loadavg() is above $maxload.
 sub check_loadavg {
         my $overloaded = defined $maxload && get_loadavg() > $maxload;
         die_error(503, "The load average on the server is too high")
                 if $overloaded;
 }
 726
 727# ======================================================================
 728# input validation and dispatch
 729
# input parameters can be collected from a variety of sources (presently, CGI
# and PATH_INFO), so we define an %input_params hash that collects them all
# together during validation: this allows subsequent uses (e.g. href()) to be
# agnostic of the parameter origin
#
# The keys of %input_params are the long parameter names that appear on the
# left-hand side of @cgi_param_mapping below.

our %input_params = ();

# input parameters are stored with the long parameter name as key. This will
# also be used in the href subroutine to convert parameters to their CGI
# equivalent, and since the href() usage is the most frequent one, we store
# the name -> CGI key mapping here, instead of the reverse.
#
# The mapping is kept both as an ordered list (@cgi_param_mapping, which
# href() walks pairwise so that query parameters are emitted in this order)
# and as a hash (%cgi_param_mapping) for lookup by long name.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
        project => "p",
        action => "a",
        file_name => "f",
        file_parent => "fp",
        hash => "h",
        hash_parent => "hp",
        hash_base => "hb",
        hash_parent_base => "hpb",
        page => "pg",
        order => "o",
        searchtext => "s",
        searchtype => "st",
        snapshot_format => "sf",
        extra_options => "opt",
        search_use_regexp => "sr",
        ctag => "by_tag",
        diff_style => "ds",
        project_filter => "pf",
        # this must be last entry (for manipulation from JavaScript)
        javascript => "js"
);
our %cgi_param_mapping = @cgi_param_mapping;
 768
# we will also need to know the possible actions, for validation
#
# Maps each action name (the value of the 'action' input parameter) to the
# subroutine that implements it.  validate_action() and evaluate_path_info()
# test membership with exists(), and dispatch() calls the stored code
# reference.
our %actions = (
        "blame" => \&git_blame,
        "blame_incremental" => \&git_blame_incremental,
        "blame_data" => \&git_blame_data,
        "blobdiff" => \&git_blobdiff,
        "blobdiff_plain" => \&git_blobdiff_plain,
        "blob" => \&git_blob,
        "blob_plain" => \&git_blob_plain,
        "commitdiff" => \&git_commitdiff,
        "commitdiff_plain" => \&git_commitdiff_plain,
        "commit" => \&git_commit,
        "forks" => \&git_forks,
        "heads" => \&git_heads,
        "history" => \&git_history,
        "log" => \&git_log,
        "patch" => \&git_patch,
        "patches" => \&git_patches,
        "remotes" => \&git_remotes,
        "rss" => \&git_rss,
        "atom" => \&git_atom,
        "search" => \&git_search,
        "search_help" => \&git_search_help,
        "shortlog" => \&git_shortlog,
        "summary" => \&git_summary,
        "tag" => \&git_tag,
        "tags" => \&git_tags,
        "tree" => \&git_tree,
        "snapshot" => \&git_snapshot,
        "object" => \&git_object,
        # those below don't need $project
        # (dispatch() exempts exactly these three from its "Project needed" check)
        "opml" => \&git_opml,
        "project_list" => \&git_project_list,
        "project_index" => \&git_project_index,
);
 804
# finally, we have the hash of allowed extra_options for the commands that
# allow them
#
# Each key is an option string accepted through the 'opt' CGI parameter;
# its value is the list of actions that the option may be combined with.
# evaluate_and_validate_params() rejects any other option or combination.
our %allowed_options = (
        "--no-merges" => [ qw(rss atom log shortlog history) ],
);
 810
 811# fill %input_params with the CGI parameters. All values except for 'opt'
 812# should be single values, but opt can be an array. We should probably
 813# build an array of parameters that can be multi-valued, but since for the time
 814# being it's only this one, we just single it out
 815sub evaluate_query_params {
 816        our $cgi;
 817
 818        while (my ($name, $symbol) = each %cgi_param_mapping) {
 819                if ($symbol eq 'opt') {
 820                        $input_params{$name} = [ map { decode_utf8($_) } $cgi->param($symbol) ];
 821                } else {
 822                        $input_params{$name} = decode_utf8($cgi->param($symbol));
 823                }
 824        }
 825}
 826
 827# now read PATH_INFO and update the parameter list for missing parameters
 828sub evaluate_path_info {
 829        return if defined $input_params{'project'};
 830        return if !$path_info;
 831        $path_info =~ s,^/+,,;
 832        return if !$path_info;
 833
 834        # find which part of PATH_INFO is project
 835        my $project = $path_info;
 836        $project =~ s,/+$,,;
 837        while ($project && !check_head_link("$projectroot/$project")) {
 838                $project =~ s,/*[^/]*$,,;
 839        }
 840        return unless $project;
 841        $input_params{'project'} = $project;
 842
 843        # do not change any parameters if an action is given using the query string
 844        return if $input_params{'action'};
 845        $path_info =~ s,^\Q$project\E/*,,;
 846
 847        # next, check if we have an action
 848        my $action = $path_info;
 849        $action =~ s,/.*$,,;
 850        if (exists $actions{$action}) {
 851                $path_info =~ s,^$action/*,,;
 852                $input_params{'action'} = $action;
 853        }
 854
 855        # list of actions that want hash_base instead of hash, but can have no
 856        # pathname (f) parameter
 857        my @wants_base = (
 858                'tree',
 859                'history',
 860        );
 861
 862        # we want to catch, among others
 863        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 864        my ($parentrefname, $parentpathname, $refname, $pathname) =
 865                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 866
 867        # first, analyze the 'current' part
 868        if (defined $pathname) {
 869                # we got "branch:filename" or "branch:dir/"
 870                # we could use git_get_type(branch:pathname), but:
 871                # - it needs $git_dir
 872                # - it does a git() call
 873                # - the convention of terminating directories with a slash
 874                #   makes it superfluous
 875                # - embedding the action in the PATH_INFO would make it even
 876                #   more superfluous
 877                $pathname =~ s,^/+,,;
 878                if (!$pathname || substr($pathname, -1) eq "/") {
 879                        $input_params{'action'} ||= "tree";
 880                        $pathname =~ s,/$,,;
 881                } else {
 882                        # the default action depends on whether we had parent info
 883                        # or not
 884                        if ($parentrefname) {
 885                                $input_params{'action'} ||= "blobdiff_plain";
 886                        } else {
 887                                $input_params{'action'} ||= "blob_plain";
 888                        }
 889                }
 890                $input_params{'hash_base'} ||= $refname;
 891                $input_params{'file_name'} ||= $pathname;
 892        } elsif (defined $refname) {
 893                # we got "branch". In this case we have to choose if we have to
 894                # set hash or hash_base.
 895                #
 896                # Most of the actions without a pathname only want hash to be
 897                # set, except for the ones specified in @wants_base that want
 898                # hash_base instead. It should also be noted that hand-crafted
 899                # links having 'history' as an action and no pathname or hash
 900                # set will fail, but that happens regardless of PATH_INFO.
 901                if (defined $parentrefname) {
 902                        # if there is parent let the default be 'shortlog' action
 903                        # (for http://git.example.com/repo.git/A..B links); if there
 904                        # is no parent, dispatch will detect type of object and set
 905                        # action appropriately if required (if action is not set)
 906                        $input_params{'action'} ||= "shortlog";
 907                }
 908                if ($input_params{'action'} &&
 909                    grep { $_ eq $input_params{'action'} } @wants_base) {
 910                        $input_params{'hash_base'} ||= $refname;
 911                } else {
 912                        $input_params{'hash'} ||= $refname;
 913                }
 914        }
 915
 916        # next, handle the 'parent' part, if present
 917        if (defined $parentrefname) {
 918                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 919                # someproject/blobdiff/oldrev..newrev:/filename
 920                if ($parentpathname) {
 921                        $parentpathname =~ s,^/+,,;
 922                        $parentpathname =~ s,/$,,;
 923                        $input_params{'file_parent'} ||= $parentpathname;
 924                } else {
 925                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 926                }
 927                # we assume that hash_parent_base is wanted if a path was specified,
 928                # or if the action wants hash_base instead of hash
 929                if (defined $input_params{'file_parent'} ||
 930                        grep { $_ eq $input_params{'action'} } @wants_base) {
 931                        $input_params{'hash_parent_base'} ||= $parentrefname;
 932                } else {
 933                        $input_params{'hash_parent'} ||= $parentrefname;
 934                }
 935        }
 936
 937        # for the snapshot action, we allow URLs in the form
 938        # $project/snapshot/$hash.ext
 939        # where .ext determines the snapshot and gets removed from the
 940        # passed $refname to provide the $hash.
 941        #
 942        # To be able to tell that $refname includes the format extension, we
 943        # require the following two conditions to be satisfied:
 944        # - the hash input parameter MUST have been set from the $refname part
 945        #   of the URL (i.e. they must be equal)
 946        # - the snapshot format MUST NOT have been defined already (e.g. from
 947        #   CGI parameter sf)
 948        # It's also useless to try any matching unless $refname has a dot,
 949        # so we check for that too
 950        if (defined $input_params{'action'} &&
 951                $input_params{'action'} eq 'snapshot' &&
 952                defined $refname && index($refname, '.') != -1 &&
 953                $refname eq $input_params{'hash'} &&
 954                !defined $input_params{'snapshot_format'}) {
 955                # We loop over the known snapshot formats, checking for
 956                # extensions. Allowed extensions are both the defined suffix
 957                # (which includes the initial dot already) and the snapshot
 958                # format key itself, with a prepended dot
 959                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 960                        my $hash = $refname;
 961                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 962                                next;
 963                        }
 964                        my $sfx = $1;
 965                        # a valid suffix was found, so set the snapshot format
 966                        # and reset the hash parameter
 967                        $input_params{'snapshot_format'} = $fmt;
 968                        $input_params{'hash'} = $hash;
 969                        # we also set the format suffix to the one requested
 970                        # in the URL: this way a request for e.g. .tgz returns
 971                        # a .tgz instead of a .tar.gz
 972                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 973                        last;
 974                }
 975        }
 976}
 977
 978our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 979     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 980     $searchtext, $search_regexp, $project_filter);
 981sub evaluate_and_validate_params {
 982        our $action = $input_params{'action'};
 983        if (defined $action) {
 984                if (!validate_action($action)) {
 985                        die_error(400, "Invalid action parameter");
 986                }
 987        }
 988
 989        # parameters which are pathnames
 990        our $project = $input_params{'project'};
 991        if (defined $project) {
 992                if (!validate_project($project)) {
 993                        undef $project;
 994                        die_error(404, "No such project");
 995                }
 996        }
 997
 998        our $project_filter = $input_params{'project_filter'};
 999        if (defined $project_filter) {
1000                if (!validate_pathname($project_filter)) {
1001                        die_error(404, "Invalid project_filter parameter");
1002                }
1003        }
1004
1005        our $file_name = $input_params{'file_name'};
1006        if (defined $file_name) {
1007                if (!validate_pathname($file_name)) {
1008                        die_error(400, "Invalid file parameter");
1009                }
1010        }
1011
1012        our $file_parent = $input_params{'file_parent'};
1013        if (defined $file_parent) {
1014                if (!validate_pathname($file_parent)) {
1015                        die_error(400, "Invalid file parent parameter");
1016                }
1017        }
1018
1019        # parameters which are refnames
1020        our $hash = $input_params{'hash'};
1021        if (defined $hash) {
1022                if (!validate_refname($hash)) {
1023                        die_error(400, "Invalid hash parameter");
1024                }
1025        }
1026
1027        our $hash_parent = $input_params{'hash_parent'};
1028        if (defined $hash_parent) {
1029                if (!validate_refname($hash_parent)) {
1030                        die_error(400, "Invalid hash parent parameter");
1031                }
1032        }
1033
1034        our $hash_base = $input_params{'hash_base'};
1035        if (defined $hash_base) {
1036                if (!validate_refname($hash_base)) {
1037                        die_error(400, "Invalid hash base parameter");
1038                }
1039        }
1040
1041        our @extra_options = @{$input_params{'extra_options'}};
1042        # @extra_options is always defined, since it can only be (currently) set from
1043        # CGI, and $cgi->param() returns the empty array in array context if the param
1044        # is not set
1045        foreach my $opt (@extra_options) {
1046                if (not exists $allowed_options{$opt}) {
1047                        die_error(400, "Invalid option parameter");
1048                }
1049                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1050                        die_error(400, "Invalid option parameter for this action");
1051                }
1052        }
1053
1054        our $hash_parent_base = $input_params{'hash_parent_base'};
1055        if (defined $hash_parent_base) {
1056                if (!validate_refname($hash_parent_base)) {
1057                        die_error(400, "Invalid hash parent base parameter");
1058                }
1059        }
1060
1061        # other parameters
1062        our $page = $input_params{'page'};
1063        if (defined $page) {
1064                if ($page =~ m/[^0-9]/) {
1065                        die_error(400, "Invalid page parameter");
1066                }
1067        }
1068
1069        our $searchtype = $input_params{'searchtype'};
1070        if (defined $searchtype) {
1071                if ($searchtype =~ m/[^a-z]/) {
1072                        die_error(400, "Invalid searchtype parameter");
1073                }
1074        }
1075
1076        our $search_use_regexp = $input_params{'search_use_regexp'};
1077
1078        our $searchtext = $input_params{'searchtext'};
1079        our $search_regexp;
1080        if (defined $searchtext) {
1081                if (length($searchtext) < 2) {
1082                        die_error(403, "At least two characters are required for search parameter");
1083                }
1084                if ($search_use_regexp) {
1085                        $search_regexp = $searchtext;
1086                        if (!eval { qr/$search_regexp/; 1; }) {
1087                                (my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
1088                                die_error(400, "Invalid search regexp '$search_regexp'",
1089                                          esc_html($error));
1090                        }
1091                } else {
1092                        $search_regexp = quotemeta $searchtext;
1093                }
1094        }
1095}
1096
# path to the current git repository; only (re)computed when a project
# has been selected for the request
our $git_dir;
sub evaluate_git_dir {
        our $git_dir;
        if ($project) {
                $git_dir = "$projectroot/$project";
        }
}
1102
our (@snapshot_fmts, $git_avatar);

# Work out the per-request values of @snapshot_fmts and $git_avatar from
# the 'snapshot' and 'avatar' features.
sub configure_gitweb_features {
        our (@snapshot_fmts, $git_avatar);

        # list of supported snapshot formats
        @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # are available; in every other case $git_avatar is reset to the
        # empty string.
        ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'picon') {
                # no dependencies
        } elsif ($git_avatar eq 'gravatar') {
                # gravatar needs Digest::MD5
                my $have_md5 = eval { require Digest::MD5; 1; };
                $git_avatar = '' unless $have_md5;
        } else {
                $git_avatar = '';
        }
}
1122
# custom error handler: 'die <message>' is Internal Server Error
#
# Registered through CGI::Carp's set_message() below; it receives the
# (already HTML escaped) message and hands it over to die_error().
sub handle_errors_html {
        my ($msg) = @_;

        # Should an error occur inside die_error itself we would loop forever,
        # so switch back to a plain message first; this disables
        # handle_errors_html as the handler.
        set_message("Error occured when inside die_error:\n$msg");

        # you cannot jump out of die_error when called as error handler;
        # the subroutine set via CGI::Carp::set_message is called _after_
        # HTTP headers are already written, so it cannot write them itself
        my @handler_opts = (-error_handler => 1, -no_http_header => 1);
        die_error(undef, undef, $msg, @handler_opts);
}
set_message(\&handle_errors_html);
1137
# dispatch: pick a default action when none was requested, check that the
# action is known and has the project it needs, then run its handler
sub dispatch {
        unless (defined $action) {
                if (defined $hash) {
                        # the action is the type of the requested object
                        $action = git_get_type($hash);
                        die_error(404, "Object does not exist")
                                unless $action;
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name");
                        die_error(404, "File or directory does not exist")
                                unless $action;
                } elsif (defined $project) {
                        $action = 'summary';
                } else {
                        $action = 'project_list';
                }
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # every action except these three works on a project
        my $needs_project = $action !~ m/^(?:opml|project_list|project_index)$/;
        die_error(400, "Project needed")
                if $needs_project && !$project;

        $actions{$action}->();
}
1162
# Restart the per-request timing information: the start time (only when
# timing is in use, i.e. $t0 is defined) and the git command counter.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1168
our $first_request = 1;

# Serve one request: (re)load configuration as needed, check the load,
# collect and validate the parameters, and dispatch to the action.
sub run_request {
        reset_timer();

        evaluate_uri();

        # configuration and git version are always evaluated for the first
        # request
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }

        # $per_request_config is either a code reference to call for every
        # request, or a true value asking for the config to be re-read on
        # every request after the first one
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }
        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list = $projectroot
                unless $projects_list;

        # the remaining steps run strictly in this order
        for my $stage (\&evaluate_query_params,
                       \&evaluate_path_info,
                       \&evaluate_and_validate_params,
                       \&evaluate_git_dir,
                       \&configure_gitweb_features) {
                $stage->();
        }

        dispatch();
}
1199
# By default a process serves a single request, has no hooks, and creates
# its request object from the plain 'CGI' class.
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: request objects come from CGI::Fast and
# the request loop is kept running for a limited number of requests.
sub configure_as_fcgi {
        our ($CGI, $is_last_request);

        require CGI::Fast;
        $CGI = 'CGI::Fast';

        # let each child service 100 requests
        my $served = 0;
        $is_last_request = sub {
                $served++;
                return $served > 100;
        };
}
# Decide how to run from the script name and the command line:
# a name ending in ".fcgi" or the --fastcgi option selects FastCGI mode,
# --nproc=N additionally sets up FCGI::ProcManager hooks.
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        # nothing more to do without command line arguments
        @ARGV or return;

        # handler for --nproc: silently ignored when FCGI::ProcManager
        # cannot be loaded
        my $use_proc_manager = sub {
                my ($opt_name, $n_processes) = @_;
                eval { require FCGI::ProcManager; 1; }
                        or return;
                my $manager = FCGI::ProcManager->new({
                        n_processes => $n_processes,
                });
                our $pre_listen_hook    = sub { $manager->pm_manage()        };
                our $pre_dispatch_hook  = sub { $manager->pm_pre_dispatch()  };
                our $post_dispatch_hook = sub { $manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1234
# Main loop: set up the run mode, then create a request object and serve
# it, again and again until no new request arrives or $is_last_request
# says the process has done enough.  The optional hooks are called around
# listening and around each request.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                if ($is_last_request->()) {
                        last REQUEST;
                }
        }

        # this label must stay inside run(); the sub ends by returning 1
 DONE_GITWEB:
        1;
}
1259
run();

if (!defined caller) {
        # pure CGI script, serving single request
        exit;
} else {
        # wrapped in a subroutine processing requests,
        # e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
        return;
}
1270
1271## ======================================================================
1272## action links
1273
# Build a gitweb URL from named parameters.
#
# Parameters are given as a hash keyed by the long parameter names of
# @cgi_param_mapping (project, action, hash, ...); 'project' defaults to
# the current $project.  A value may be an array reference, in which case
# the query parameter is repeated for each element.  Returns the URL as a
# string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over every input parameter that was not given explicitly
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot
                #
                # The action is optional (see the check just below), so make
                # sure it is defined before comparing it.
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing ".." cannot go into the
                                                # path, where ".." separates parent and
                                                # current part; it stays a query parameter
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly
        # (whatever was not absorbed into the path above, in the order of
        # @cgi_param_mapping)
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1403
1404
1405## ======================================================================
1406## validation, quoting/unquoting and escaping
1407
# Returns the given action name if it is a key of %actions, and undef
# otherwise (also for a missing or false argument).
sub validate_action {
        my ($input) = @_;

        return undef unless $input;
        return exists $actions{$input} ? $input : undef;
}
1413
# Returns the given project name if it may be shown, and undef otherwise.
# A project passes when its name is a valid pathname, it is a directory
# below $projectroot, check_export_ok() accepts it and, with
# $strict_export set, it is also found by project_in_list().
sub validate_project {
        my ($input) = @_;

        return undef unless $input;

        # the checks run in this order and stop at the first failure
        return undef unless validate_pathname($input);

        my $project_dir = "$projectroot/$input";
        return undef unless -d $project_dir;
        return undef unless check_export_ok($project_dir);
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1425
# Returns the given pathname if it is acceptable, and undef otherwise.
# A missing or false argument (including "" and "0") is rejected.
sub validate_pathname {
        my ($input) = @_;

        return undef unless $input;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # also this catches doubled slashes, as well as a leading or a
        # trailing slash (an empty path element)
        return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

        # no null characters
        return undef if $input =~ m!\0!;

        return $input;
}
1441
# Returns the given ref name (or object id) if it is acceptable, and undef
# otherwise.  A missing or false argument is rejected.
sub validate_refname {
        my ($input) = @_;

        return undef unless $input;

        # textual hashes are O.K.
        return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

        # it must be correct pathname
        $input = validate_pathname($input);
        return undef unless $input;

        # restrictions on ref name according to git-check-ref-format
        return undef
                if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

        return $input;
}
1458
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Input that is not valid utf8 is decoded using $fallback_encoding
# instead; undef is passed through.
sub to_utf8 {
        my ($str) = @_;

        return undef unless defined $str;

        # already in internal form
        return $str if utf8::is_utf8($str);
        # utf8::decode() works on $str itself and tells us whether it succeeded
        return $str if utf8::decode($str);

        return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1472
# Quote unsafe characters for use as a query parameter value.  The slash
# is kept even though that is not strictly correct, because quoted
# slashes look too horrible in bookmarks.  Spaces become '+'.
# Returns undef for undefined input.
sub esc_param {
	my ($param) = @_;
	defined $param or return undef;

	$param =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$param =~ tr/ /+/;
	return $param;
}
1482
# Quote unsafe characters for the path_info fragment of a URL; the rules
# are slightly different from those for query parameters.
# Returns undef for undefined input.
sub esc_path_info {
	my ($fragment) = @_;
	defined $fragment or return undef;

	# path_info doesn't treat '+' as space (specially), so both stay as
	# they are, but '?' must be escaped
	$fragment =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

	return $fragment;
}
1493
# Quote unsafe characters in a whole URL.  Characters that have a meaning
# in URL syntax (such as '?', '&', '=' and ';') cannot be quoted here.
# Spaces become '+'.  Returns undef for undefined input.
sub esc_url {
	my ($url) = @_;
	defined $url or return undef;

	$url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$url =~ tr/ /+/;
	return $url;
}
1502
# Quote unsafe characters in HTML attributes.  Takes the same arguments
# as esc_html() and returns what esc_html() returns.
sub esc_attr {
	my @args = @_;

	# escaping '"' to '&quot;' alone is not enough for XHTML conformance,
	# so attribute values get the full esc_html() treatment
	return esc_html(@args);
}
1509
# Escape a string for inclusion in HTML.  The string is first converted
# with to_utf8(), then HTML-escaped; control characters other than tab
# are shown via quot_cec().  With the option -nbsp => 1 every space is
# turned into '&nbsp;'.  Returns undef for undefined input.
sub esc_html {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	my $html = $cgi->escapeHTML(to_utf8($str));
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	# tabs are the only control characters left untouched
	$html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
	return $html;
}
1525
# Escape a filename for inclusion in HTML.  Works like esc_html(), except
# that every control character (tab included) is shown via quot_cec().
# With the option -nbsp => 1 every space is turned into '&nbsp;'.
# Returns undef for undefined input.
sub esc_path {
	my ($path, %opts) = @_;

	return undef unless defined $path;

	my $html = $cgi->escapeHTML(to_utf8($path));
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$html =~ s|([[:cntrl:]])|quot_cec($1)|eg;
	return $html;
}
1541
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0).
# The string is converted with to_utf8(); tab, line feed and carriage
# return are kept as they are, every other control character is shown
# via quot_cec().  Returns undef for undefined input.
sub sanitize {
	my $str = shift;

	return undef unless defined $str;

	$str = to_utf8($str);
	# Use index() rather than a nested regexp match to test for the
	# characters to keep: a successful match without capture groups
	# would reset $1, and the character would be replaced by nothing.
	$str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
	return $str;
}
1552
# Make control characters "printable", using character escape codes (CEC).
#
# $cntrl is the single character to represent.  Characters with a
# well-known escape are shown as that escape ('\n', '\t', ...); any other
# character is shown as a backslash followed by its code in hexadecimal,
# zero-padded to two digits (e.g. '\01').
# Unless the option -nohtml is true, the result is wrapped in
# <span class="cntrl">...</span>.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# '%02x', not '%2x': the latter pads with a space and would turn
	# e.g. 0x01 into '\ 1'
	my $chr = ( (exists $es{$cntrl})
		    ? $es{$cntrl}
		    : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1577
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR).
#
# $cntrl is the single character to represent; the result is a decimal
# numeric character reference.  Unless the option -nohtml is true, it is
# wrapped in <span class="cntrl">...</span>.
sub quot_upr {
	my $cntrl = shift;
	my %opts = @_;

	my $code = ord($cntrl);
	# The Control Pictures block lines up with the code only for
	# U+0000..U+0020; DEL has its picture at U+2421, and other characters
	# have none, so those get U+FFFD (REPLACEMENT CHARACTER).
	my $picture = $code <= 0x20 ? 0x2400 + $code
	            : $code == 0x7f ? 0x2421
	            :                 0xFFFD;

	my $chr = sprintf('&#%04d;', $picture);
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1591
# Helper for unquote(): given the text that followed a backslash, return
# the character it stands for.
sub unq {
	my $seq = shift;
	my %es = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# octal char sequence
	return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

	# C escape sequence (aka character escape code), or else
	# a quoted ordinary character
	return exists $es{$seq} ? $es{$seq} : $seq;
}

# git may return quoted and escaped filenames: undo that.  A name that is
# not wrapped in double quotes is returned as is.
sub unquote {
	my $str = shift;

	# only names in double quotes need unquoting
	my ($quoted) = ($str =~ m/^"(.*)"$/)
		or return $str;

	$quoted =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $quoted;
}
1627
# Escape tabs: replace every tab with the number of spaces needed to
# reach the next multiple of 8 columns.  Returns the converted line.
sub untabify {
	my ($line) = @_;

	my $pos;
	while (($pos = index($line, "\t")) != -1) {
		# always between 1 and 8 spaces
		substr($line, $pos, 1, ' ' x (8 - $pos % 8));
	}

	return $line;
}
1641
# Count the entries returned by git_get_projects_list() whose 'path' is
# $project; the result is false (0) when there is no such entry.
sub project_in_list {
	my ($project) = @_;

	my @projects = git_get_projects_list();
	# grep in scalar context gives the number of matching entries,
	# which is 0 for an empty list as well
	my $hits = grep { $_->{'path'} eq $project } @projects;
	return $hits;
}
1647
1648## ----------------------------------------------------------------------
1649## HTML aware string manipulation
1650
# Shorten a string to about $len characters, preferably at a word
# boundary: a word part of up to $add_len (default 10) further characters
# is kept rather than cut.  $where ('left', 'center' or 'right', default
# 'right') says which part of the string is dropped; the dropped part is
# marked with an ellipsis.  The string is returned whole when the chopped
# part plus the ellipsis would not make it shorter.
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right'; # 'left' | 'center' | 'right'

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# return early if chopping wouldn't make the string shorter;
	# the filler is 5 characters long in the middle and 4 at either end
	my $centered = ($where eq 'center');
	my $filler_len = $centered ? 5 : 4;
	return $str if $len + $filler_len >= length($str);

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if $centered;

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	# NOTE: the captures are read right after each match without testing
	# whether it succeeded, so a failed match leaves earlier values in
	# $1 and $2.

	if ($where eq 'left') {
		$str =~ m/^(.*?)($begre)$/;
		my ($lead, $body) = ($1, $2);
		$lead = " ..." if length($lead) > 4;
		return "$lead$body";
	}

	if ($centered) {
		$str =~ m/^($endre)(.*)$/;
		my ($left, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($mid, $right) = ($1, $2);
		$mid = " ... " if length($mid) > 5;
		return "$left$mid$right";
	}

	$str =~ m/^($endre)(.*)$/;
	my ($body, $tail) = ($1, $2);
	$tail = "... " if length($tail) > 4;
	return "$body$tail";
}
1710
# Takes the same arguments as chop_str, and returns the chopped string
# HTML-escaped.  If the string did get chopped, the result is also wrapped
# in a <span> whose title attribute holds the full string.
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);
	$str = to_utf8($str);

	# nothing was cut off, so no tooltip is needed
	return esc_html($chopped) if $chopped eq $str;

	# control characters are replaced by '?' in the title
	(my $title = $str) =~ s/[[:cntrl:]]/?/g;
	return $cgi->span({-title=>$title}, esc_html($chopped));
}
1726
# Highlight selected fragments of string, using given CSS class,
# and escape HTML.  It is assumed that fragments do not overlap.
# Regions are passed as list of pairs (array references), each pair
# being [ begin, end ] with 'end' pointing just past the fragment.
# Empty regions (end <= begin) are ignored.
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
	my ($str, $css_class, @sel) = @_;
	return esc_html($str) unless @sel;

	my $out = '';
	my $pos = 0; # start of the part of $str not yet written to $out

	for my $s (@sel) {
		my ($begin, $end) = @$s;

		# Don't create empty <span> elements.
		next if $end <= $begin;

		my $escaped = esc_html(substr($str, $begin, $end - $begin));

		# plain text between the previous region and this one
		$out .= esc_html(substr($str, $pos, $begin - $pos))
			if ($begin - $pos > 0);
		$out .= $cgi->span({-class => $css_class}, $escaped);

		$pos = $end;
	}
	# plain text after the last region
	$out .= esc_html(substr($str, $pos))
		if ($pos < length($str));

	return $out;
}
1756
# Return the positions of the beginning and the end of each match of
# $regexp in $str, as a list of [ begin, end ] pairs.  Returns nothing
# when either argument is undefined.
sub matchpos_list {
	my ($text, $regexp) = @_;
	return unless (defined $text && defined $regexp);

	my @spans;
	# @- and @+ hold the offsets of the start and end of the last match
	push @spans, [ $-[0], $+[0] ]
		while $text =~ /$regexp/g;

	return @spans;
}
1768
# Escape HTML in $str, marking every match of $regexp (if there is any)
# with the 'match' CSS class.
sub esc_html_match_hl {
	my ($str, $regexp) = @_;

	my @matches = defined $regexp ? matchpos_list($str, $regexp) : ();

	return @matches
		? esc_html_hl_regions($str, 'match', @matches)
		: esc_html($str);
}
1779
1780
# Highlight matches of $regexp (if any) in the shortened form $chopped of
# $str, and escape HTML.  A match that lies at least partly in the part
# that was cut off is shown by marking the trailing "... " filler.
# Without $chopped this is the same as esc_html_match_hl($str, $regexp).
sub esc_html_match_hl_chopped {
	my ($str, $chopped, $regexp) = @_;
	return esc_html_match_hl($str, $regexp) unless defined $chopped;

	my @matches = matchpos_list($str, $regexp);
	return esc_html($chopped) unless @matches;

	# split the filler off the chopped string, if it has one
	my $tail = "... "; # see chop_str
	$tail = '' unless $chopped =~ s/\Q$tail\E$//;
	my $chop_len = length($chopped);
	my $tail_len = length($tail);

	# filter matches so that we mark chopped string
	my @filtered;
	for my $m (@matches) {
		my ($begin, $end) = @$m;

		# match lies entirely within the part that was kept
		if ($begin <= $chop_len && $end <= $chop_len) {
			push @filtered, $m;
			next;
		}

		if ($begin > $chop_len) {
			# match lies in the removed part: mark only the filler
			push @filtered, [ $chop_len, $chop_len + $tail_len ] if ($tail_len > 0);
		} else {
			# match runs into the removed part: extend it over the filler
			push @filtered, [ $begin, $chop_len + $tail_len ];
		}
		last;
	}

	return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
}
1811
1812## ----------------------------------------------------------------------
1813## functions returning short strings
1814
# CSS class for given age value (in seconds): "noage" when the age is
# undefined, "age0" below two hours, "age1" below two days, and "age2"
# for anything older.
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0" if $age < 60*60*2;
	return "age1" if $age < 60*60*24*2;
	return "age2";
}
1829
# Convert age in seconds to "nn units ago" string.  The largest unit of
# which the age holds more than two is used; an age of at most two
# seconds gives " right now" (with the leading space).
sub age_string {
	my $age = shift;

	return int($age/60/60/24/365) . " years ago"
		if $age > 60*60*24*365*2;
	return int($age/60/60/24/(365/12)) . " months ago"
		if $age > 60*60*24*(365/12)*2;
	return int($age/60/60/24/7) . " weeks ago"
		if $age > 60*60*24*7*2;
	return int($age/60/60/24) . " days ago"
		if $age > 60*60*24*2;
	return int($age/60/60) . " hours ago"
		if $age > 60*60*2;
	return int($age/60) . " min ago"
		if $age > 60*2;
	return int($age) . " sec ago"
		if $age > 2;

	return " right now";
}
1861
# File type bits (octal), for use next to the S_IF* constants of Fcntl;
# S_IFGITLINK is what S_ISGITLINK() compares a file mode against.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1866
# Tell whether a (numeric) file mode is that of a submodule/subproject,
# i.e. a commit object reference.
sub S_ISGITLINK {
	my ($mode) = @_;

	# S_IFMT($mode) is the file type part of $mode
	return S_IFMT($mode) == S_IFGITLINK;
}
1873
# Convert file mode in octal to symbolic file mode string, in the manner
# of "ls -l".  Unrecognized file types give '----------'.
sub mode_str {
	my $mode = oct(shift);

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# regular file: git cares only about the executable bit
	return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1895
# Convert file mode in octal to file type string: "submodule",
# "directory", "symlink", "file" or "unknown".  An argument that is not
# an octal number is returned unchanged.
sub file_type {
	my $mode = shift;

	return $mode unless $mode =~ m/^[0-7]+$/;
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT());
	return "symlink"   if S_ISLNK($mode);
	return "file"      if S_ISREG($mode);
	return "unknown";
}
1918
# Convert file mode in octal to file type description string.  Same as
# file_type(), except that a regular file with the owner's executable
# bit set is described as "executable".  An argument that is not an
# octal number is returned unchanged.
sub file_type_long {
	my $mode = shift;

	return $mode unless $mode =~ m/^[0-7]+$/;
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT());
	return "symlink"   if S_ISLNK($mode);
	return "unknown"   unless S_ISREG($mode);

	return ($mode & S_IXUSR) ? "executable" : "file";
}
1945
1946
1947## ----------------------------------------------------------------------
1948## functions returning short HTML fragments, or transforming HTML fragments
1949## which don't belong to other sections
1950
# Format a line of commit message: escape it for HTML (with spaces as
# '&nbsp;') and turn everything that looks like an object name, i.e. a
# word of 8 to 40 hexadecimal digits, into a link to that object.
sub format_log_line_html {
	my ($line) = @_;

	my $html = esc_html($line, -nbsp=>1);
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{
		my $id = $1;
		$cgi->a({-href => href(action=>"object", hash=>$id),
					-class => "text"}, $id);
	}eg;

	return $html;
}
1963
# Format markers of the refs pointing to given object.  $refs maps object
# ids to lists of ref names; the result is a ' <span class="refs">'
# element holding one linked marker per ref of $id, or the empty string
# when there are none.
#
# The action each marker links to depends on object type and context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	return "" unless defined $refs->{$id};

	# NOTE: $ref is an alias for the list element, so removing "^{}"
	# below also changes the name stored in $refs.
	foreach my $ref (@{$refs->{$id}}) {
		# this code exploits the fact that non-lightweight tags are the
		# only indirect objects, and that they are the only objects for which
		# we want to use tag instead of shortlog as action
		my $indirect = ($ref =~ s/\^\{\}$//);

		# e.g. tags/v2.6.11 or heads/next
		my ($type, $name) = ($ref =~ m!^(.*?)s?/(.*)$!)
			? ($1, $2)
			: ("ref", $ref);

		my $class = $indirect ? "$type indirect" : $type;

		my $dest_action;
		if ($indirect) {
			$dest_action = ($action eq "tag") ? "shortlog" : "tag";
		} elsif ($action =~ /^(history|(short)?log)$/) {
			$dest_action = $action;
		} else {
			$dest_action = "shortlog";
		}

		my $dest = ($ref =~ m!^refs/! ? "" : "refs/") . $ref;

		my $link = $cgi->a({
			-href => href(
				action=>$dest_action,
				hash=>$dest
			)}, $name);

		$markers .= " <span class=\"" . esc_attr($class) . "\"" .
			" title=\"" . esc_attr($ref) . "\">" .
			$link . "</span>";
	}

	return $markers ? ' <span class="refs">'. $markers . '</span>' : "";
}
2023
# Format a title line as a link to $href, followed by $extra (e.g. ref
# markers) if that is given.  When $short is shorter than $long, the link
# text is $short and the full title goes into the title attribute;
# otherwise the link text is $long.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	# the title was not shortened: plain link
	return $cgi->a({-href => $href, -class => "list subject"},
	       esc_html($long)) . $extra
		unless length($short) < length($long);

	# control characters are replaced by '?' in the title attribute
	(my $title = $long) =~ s/[[:cntrl:]]/?/g;
	return $cgi->a({-href => $href, -class => "list subject",
			-title => to_utf8($title)},
	       esc_html($short)) . $extra;
}
2039
# Cache of avatar URLs, keyed by email address.  Computing the URL for an
# email only once gives a visible benefit in views where the avatar for
# the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines (gravatar and picon), which
# are free to use it as they prefer.  Since only one avatar engine is used
# for any given page, there's no risk of cache conflicts.
our %avatar_cache = ();
2047
# Return the picon url for a given email, using the picon search service
# over at http://www.cs.indiana.edu/picons/search.html
# The url is computed only if it's not in %avatar_cache already.
sub picon_url {
	my $email = lc shift;

	$avatar_cache{$email} ||= do {
		my ($user, $domain) = split('@', $email);
		"http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
		"$domain/$user/" .
		"users+domains+unknown/up/single";
	};

	return $avatar_cache{$email};
}
2061
# Return the gravatar url for a given email and size.
# Only the part of the URL before the size is kept in %avatar_cache,
# since that's the one computationally more expensive.  This also allows
# reuse of the cache for different sizes (for this particular engine).
sub gravatar_url {
	my ($email, $size) = @_;
	$email = lc $email;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
			Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
2074
# Return the <img> element of the avatar for the given $email, or the
# empty string when no avatar engine provides a URL.
# Options: -size names an entry of %avatar_size ('default' is used when
# it is missing or unknown); -pad_before / -pad_after add a '&nbsp;'
# before / after the image.
sub git_get_avatar {
	my ($email, %opts) = @_;

	my $size_name = $opts{-size} || 'default';
	my $size = $avatar_size{$size_name} || $avatar_size{'default'};

	# Other providers can be added by extending this chain.  If no
	# variant yields a URL, we assume avatars are completely
	# disabled/unavailable.
	my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
	        : $git_avatar eq 'picon'    ? picon_url($email)
	        :                             "";
	return "" unless $url;

	my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
	my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

	return $pre_white .
	       qq{<img width="$size" class="avatar" src="} .
	       esc_url($url) .
	       qq{" alt="" />} .
	       $post_white;
}
2103
# Wrap $displaytext in a link that searches for the commits of $author.
# $searchtype ('author' or 'committer') selects the kind of search.
# When the 'search' feature is off, $displaytext is returned as it is.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	return $displaytext unless gitweb_check_feature('search');

	# verb used in the tooltip; empty for other search types
	my $performed = $searchtype eq 'author'    ? "authored"
	              : $searchtype eq 'committer' ? "committed"
	              :                              "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype), class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
2126
# Format the author name of the given commit $co inside an element of
# the given $tag.  The name is chopped and escaped according to the
# remaining, optional parameters (see chop_str); it is preceded by the
# author's avatar and goes through format_search_author().
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name   = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $link   = format_search_author($co->{'author_name'}, "author",
	                                  $avatar . $name);

	return "<$tag class=\"author\">" . $link . "</$tag>";
}
2140
# Format git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names at the end of $line are replaced by the escaped names
# from $from and $to, each one being a link when the respective 'href'
# is set.  Returns the line wrapped in a <div class="diff header">.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# $text itself, or a link around it if this side of the diff has
	# an href (it has none when the file was added or deleted)
	my $link_or_text = sub {
		my ($side, $text) = @_;
		return $side->{'href'}
			? $cgi->a({-href => $side->{'href'}, -class => "path"}, $text)
			: $text;
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $link_or_text->($to, esc_path($to->{'file'}));
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $link_or_text->($from, 'a/' . esc_path($from->{'file'}));
		$line .= ' ';
		$line .= $link_or_text->($to, 'b/' . esc_path($to->{'file'}));
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2176
# Format extended diff header line, before patch itself.
# Paths in "copy/rename from/to" lines and hashes in "index" lines are
# turned into links (using the hrefs in $from and $to), and a file type
# description is added after a file mode at the end of the line.
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
		                 esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                 esc_path($to->{'file'}));
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		my $nparents = $diffinfo->{'nparents'};
		$line = 'index ';
		for my $i (0 .. $nparents - 1) {
			if ($from->{'href'}[$i]) {
				$line .= $cgi->a({-href=>$from->{'href'}[$i],
				                  -class=>"hash"},
				                 substr($diffinfo->{'from_id'}[$i],0,7));
			} else {
				$line .= '0' x 7;
			}
			# separator
			$line .= ',' if ($i < $nparents - 1);
		}
		$line .= '..';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                 substr($diffinfo->{'to_id'},0,7));
		} else {
			$line .= '0' x 7;
		}

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff; the dots are escaped so that
		# only a literal ".." separates the two hashes
		my ($from_link, $to_link);
		if ($from->{'href'}) {
			$from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			                     substr($diffinfo->{'from_id'},0,7));
		} else {
			$from_link = '0' x 7;
		}
		if ($to->{'href'}) {
			$to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                   substr($diffinfo->{'to_id'},0,7));
		} else {
			$to_link = '0' x 7;
		}
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		# \Q..\E: the ids are matched literally, not as regexps
		$line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2242
# Format from-file/to-file diff header: the "--- ..." and "+++ ..." lines.
# For an ordinary diff there is one from-file line; for a combined diff
# (merge commit) there is one per parent, each with a numbered link to
# the blobdiff against that parent (@parents being the parent commits).
# Returns the lines wrapped in <div> elements.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my @from_lines;

	#assert($from_line =~ m/^---/) if DEBUG;
	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit)
		for my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $n = $i + 1;
			if ($from->{'href'}[$i]) {
				push @from_lines, '--- ' .
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$i],
					                     hash_parent_base=>$parents[$i],
					                     file_parent=>$from->{'file'}[$i],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . $n},
					        $n) .
					'/' .
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
					        esc_path($from->{'file'}[$i]));
			} else {
				push @from_lines, '--- /dev/null';
			}
		}
	} else {
		# ordinary (single parent) diff
		my $line = $from_line;
		# no extra formatting for "^--- /dev/null"
		if ($line =~ m!^--- "?a/!) {
			my $path = esc_path($from->{'file'});
			$line = '--- a/' .
				($from->{'href'}
					? $cgi->a({-href=>$from->{'href'}, -class=>"path"}, $path)
					: $path);
		}
		push @from_lines, $line;
	}

	my $result = join('',
		map { qq!<div class="diff from_file">$_</div>\n! } @from_lines);

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	my $line = $to_line;
	# no extra formatting for "^+++ /dev/null"
	if ($line =~ m!^\+\+\+ "?b/!) {
		my $path = esc_path($to->{'file'});
		$line = '+++ b/' .
			($to->{'href'}
				? $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $path)
				: $path);
	}
	$result .= qq!<div class="diff to_file">$line</div>\n!;

	return $result;
}
2308
# Create the HTML note shown for a patch that the combined diff simplified
# away: a "diff --cc <file>" header line followed by a "Simple merge" remark.
# The file name links to its blob view, unless is_deleted() says that the
# file was deleted, in which case it is shown as plain (escaped) text.
# @parents is accepted for symmetry with other formatters but is not used.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $file_html;
        if (is_deleted($diffinfo)) {
                $file_html = esc_path($diffinfo->{'to_file'});
        } else {
                $file_html = $cgi->a({-href => href(action=>"blob",
                                                    hash_base=>$hash,
                                                    hash=>$diffinfo->{'to_id'},
                                                    file_name=>$diffinfo->{'to_file'}),
                                      -class => "path"},
                                     esc_path($diffinfo->{'to_file'}));
        }

        return join('',
                "<div class=\"diff header\">",
                "diff --cc ",
                $file_html,
                "</div>\n", # class="diff header"
                "<div class=\"diff nodifferences\">",
                "Simple merge",
                "</div>\n"); # class="diff nodifferences"
}
2333
# Classify a line of patch body and return the name of its CSS class:
# "chunk_header", "incomplete", "ctx", "add" or "rem"; an empty string
# is returned when the line matches none of them.
# A combined diff is recognized by $from->{'href'} being an array
# reference; the number of its elements is then used as the number of
# leading sign columns.  Otherwise one sign column is assumed.
sub diff_line_class {
        my ($line, $from, $to) = @_;

        # 1 for ordinary diff, number of 'from' links for combined diff
        my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
                ? scalar @{$from->{'href'}}
                : 1;

        # [ class, pattern ] pairs, tried in order; the first match wins.
        # The pattern for context must come before those for add/rem,
        # or we would have to use a more complicated regexp, for example
        # qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
        my @rules = (
                [ "chunk_header", qr/^\@\@{$num_sign} / ],
                [ "incomplete",   qr/^\\/               ],
                [ "ctx",          qr/^ {$num_sign}/     ],
                [ "add",          qr/^[+ ]{$num_sign}/  ],
                [ "rem",          qr/^[- ]{$num_sign}/  ],
        );
        foreach my $rule (@rules) {
                my ($class, $regexp) = @$rule;
                return $class
                        if ($line =~ $regexp);
        }

        # fallback
        return "";
}
2362
# Format a chunk header of an unified diff ("@@ -a,b +c,d @@ section")
# as HTML.  Assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for unified diff.
# The "-a,b" and "+c,d" parts are turned into links to line "a" / "c"
# (anchor "#l<number>") when $from->{'href'} / $to->{'href'} are set;
# the text after the closing "@@" is escaped and put into its own span.
sub format_unidiff_chunk_header {
        my ($line, $from, $to) = @_;

        # the line counts (3rd and 6th capture) are not needed for formatting
        my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
                $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

        $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
                             -class=>"list"}, $from_text)
                if ($from->{'href'});
        $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                             -class=>"list"}, $to_text)
                if ($to->{'href'});

        return "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2386
# Format a chunk header of a combined diff
# ("@@@ -a,b -c,d +e,f @@@ section") as HTML.
# Assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for combined diff.
# The last range belongs to the result ('to'), all ranges before it to
# the parents ('from'); each range is linked to its starting line when
# the corresponding href is available.
sub format_cc_diff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

        my @range_text  = split(' ', $ranges);
        # starting line of each range: what follows the sign, up to
        # an optional ",<count>"; 0 if there is nothing after the sign
        my @range_start = map {
                my @parts = (split(',', substr($_, 1)), 0);
                $parts[0];
        } @range_text;

        # the last range describes the result, the rest describe the parents
        my $to_text  = pop @range_text;
        my $to_start = pop @range_start;

        my @pieces;
        foreach my $i (0 .. $#range_text) {
                my $href = $from->{'href'}[$i];
                if ($href) {
                        push @pieces, $cgi->a({-href=>"$href#l$range_start[$i]",
                                               -class=>"list"}, $range_text[$i]);
                } else {
                        push @pieces, $range_text[$i];
                }
        }
        if ($to->{'href'}) {
                push @pieces, $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                       -class=>"list"}, $to_text);
        } else {
                push @pieces, $to_text;
        }

        return "<span class=\"chunk_info\">" .
               join(' ', $prefix, @pieces, $prefix) .
               "</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2425
# Process a line of patch body (not to be used for diff headers).
# Returns a two-element list: the CSS class of the line, as given by
# diff_line_class(), and the HTML-formatted (but not wrapped) line.
# Chunk headers get links when both $from and $to are given; any other
# line is chomped, untabified and HTML-escaped.
sub process_diff_line {
        my ($line, $from, $to) = @_;

        # the class is determined from the line as it was passed in
        my $diff_class = diff_line_class($line, $from, $to);

        chomp $line;
        $line = untabify($line);

        if ($from && $to) {
                # "@@ " starts chunk header of unified diff ...
                return $diff_class, scalar(format_unidiff_chunk_header($line, $from, $to))
                        if ($line =~ m/^\@{2} /);
                # ... while "@@@" starts chunk header of combined diff
                return $diff_class, scalar(format_cc_diff_chunk_header($line, $from, $to))
                        if ($line =~ m/^\@{3}/);
        }

        return $diff_class, esc_html($line, -nbsp=>1);
}
2448
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# Which of the three forms is produced depends on the number of entries
# in @snapshot_fmts: none, exactly one, or more than one.
sub format_snapshot_links {
        my ($hash) = @_;

        # no snapshot formats available
        return undef unless (@snapshot_fmts);

        if (scalar(@snapshot_fmts) == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                # i.e. "_snapshot_"
                my $fmt = $snapshot_fmts[0];
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links;
        foreach my $fmt (@snapshot_fmts) {
                push @links,
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                )
                        }, $known_snapshot_formats{$fmt}{'display'});
        }
        return "snapshot (" . join(' ', @links) . ")";
}
2483
2484## ......................................................................
2485## functions returning values to be passed, perhaps after some
2486## transformation, to other functions; e.g. returning arguments to href()
2487
# Returns a hash (as a list of key/value pairs) to be passed to href()
# to generate the gitweb URL of a feed; the -title key holds a
# description of the link.
# The optional argument is the feed format name, 'Atom' by default; its
# lower-cased form becomes the 'action'.
# Returns nothing when no project is selected, or when the current
# action is unset or is one of tags, heads, forks, tag, search.
sub get_feed_info {
        my $format = shift || 'Atom';

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use the 'refs/heads/' prefix (full name) to
        # differentiate them from tag links; this also makes it possible
        # to detect branch links.  $hash_base takes precedence over $hash.
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                next unless (defined $ref);
                if ($ref =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type  = "history of $file_name";
                $type .= "/" if ($action eq 'tree');
                $type .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $type = "log of $branch";
        } else {
                $type = 'log';
        }

        my %res = (
                'action'    => lc($format),
                -title      => $type,
                'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
                'file_name' => $file_name,
        );

        return %res;
}
2523
2524## ----------------------------------------------------------------------
2525## git utility subroutines, invoking git commands
2526
# Returns, as a list, the path to the core git executable ($GIT) and the
# --git-dir parameter built from the current $git_dir.
# Each call also increments the $number_of_git_cmds counter.
sub git_cmd {
        ++$number_of_git_cmds;
        return ($GIT, "--git-dir=$git_dir");
}
2532
# Quote the given arguments for passing them to the shell:
# each argument is wrapped in single quotes, with every ' and ! inside it
# closed out of the quotes and backslash-escaped; the results are joined
# with single spaces.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $arg (@_) {
                # work on a copy, so that caller's values are left alone
                (my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }
        return join(' ', @quoted);
}
2541
# Get the full hash that HEAD of the given project resolves to
# (thin wrapper around git_get_full_hash()).
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2546
# Resolve a revision in a project via git_get_hash(); all arguments
# (project, revision, any extra options) are passed through unchanged.
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2550
# Like git_get_full_hash(), but appends the '--short=7' option to the
# arguments handed to git_get_hash().
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2554
# Run "git rev-parse --verify -q <options> <hash>" in the given project
# and return the first line of its output, chomped; returns undef when
# the command could not be started or printed nothing.
# $git_dir is pointed at "$projectroot/$project" for the duration of the
# call; the previous value is put back afterwards only if it was defined.
sub git_get_hash {
        my ($project, $hash, @options) = @_;
        my $saved_git_dir = $git_dir;
        my $retval;

        # git_cmd() reads $git_dir, so it has to be set before building the command
        $git_dir = "$projectroot/$project";
        my @cmd = (git_cmd(), 'rev-parse',
                   '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @cmd) {
                $retval = <$fd>;
                chomp $retval if defined $retval;
                close $fd;
        }

        $git_dir = $saved_git_dir
                if (defined $saved_git_dir);

        return $retval;
}
2571
# Get the type of the given object, as printed by "git cat-file -t".
# Returns nothing if the command cannot be started or if closing
# the pipe reports a failure.
sub git_get_type {
        my ($hash) = @_;

        my @cmd = (git_cmd(), "cat-file", '-t', $hash);
        open my $fd, "-|", @cmd
                or return;
        my $type = <$fd>;
        close $fd
                or return;

        chomp $type;
        return $type;
}
2582
# repository configuration cache, maintained by git_get_project_config():
# %config holds the parsed configuration, and $config_file names the
# config file ("$git_dir/config") those values were read for
our %config;
our $config_file = '';
2586
# Add $value under $key in the hash referenced by $hash.
# Multiple values for a single key are stored as an anonymous array
# reference; a single value is stored directly in the hash,
# not as [ <value> ].
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                if (ref $hash->{$key}) {
                        # third and later values: extend the existing array
                        push @{$hash->{$key}}, $value;
                } else {
                        # second value: convert the plain value into an array
                        $hash->{$key} = [ $hash->{$key}, $value ];
                }
        } else {
                # first value: store it as is
                $hash->{$key} = $value;
        }
}
2600
# Return hash of git project configuration, read from the output of
# "git config -z -l" for the repository git_cmd() points at.
# Optionally limited to some section, e.g. 'gitweb': $section_regexp is
# a regular expression that the part of the key before the first matched
# "." has to match.  Keys appearing more than once get an array
# reference as value (see hash_set_multi()).
# Returns nothing if the git command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %parsed;

        # entries are read as NUL-terminated records (config is run with -z)
        local $/ = "\0";

        # Compile the section filter once per call.  The /o modifier must
        # not be used for that: it would freeze the pattern built during
        # the first call, and silently ignore a different $section_regexp
        # passed later in the same (possibly persistent) process.
        my $key_filter = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline; for an
                # entry without a newline $value is left undefined
                my ($key, $value) = split(/\n/, $keyval, 2);

                hash_set_multi(\%parsed, $key, $value)
                        if (!defined $key_filter || $key =~ $key_filter);
        }
        close $fh;

        return %parsed;
}
2623
# Convert config value to a boolean (a true or a false value).
# - no value (undefined, i.e. bare "section.key") is true
# - a string of decimal digits is true if its numeric value is > 0
# - 'true' and 'yes', in any letter case, are true
# Rest of values are treated as false (never as error).
# Leading and trailing whitespace is ignored.
# NOTE(review): other spellings that git itself may accept as boolean
# are deliberately not handled here -- confirm if that is wanted.
sub config_to_bool {
        my $val = shift;

        return 1 if !defined $val;             # section.key

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        # The number has to be compared numerically: a string such as "00"
        # is true as far as Perl is concerned, yet it means zero.
        return (($val =~ /^\d+$/ && $val != 0) ||   # section.key = 1
                ($val =~ /^(?:true|yes)$/i));       # section.key = true
}
2639
# Convert config value to simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (in any letter case) will
# cause the value to be multiplied by 1024, 1048576, or 1073741824.
# Leading and trailing whitespace is ignored.  A value that does not
# look like "<digits><suffix>" is returned as it is (after stripping
# whitespace); an undefined value is returned as undef.
sub config_to_int {
        my $val = shift;

        # key without a value: there is nothing to strip or to scale,
        # and touching undef below would only produce warnings
        return $val unless defined $val;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier_for = (
                'k' => 1024,
                'm' => 1048576,
                'g' => 1073741824,
        );
        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
                return $num * $multiplier_for{lc($unit)};
        }
        return $val;
}
2659
# Convert config value to array reference, if needed:
# a reference is returned as it is, a defined plain value is wrapped
# in a one-element array, and an undefined value gives an empty array.
sub config_to_multi {
        my $val = shift;

        return $val     if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2666
# Get the value of the "gitweb.<key>" configuration variable of the
# current repository ($git_dir).  $key may be given with or without the
# "gitweb." prefix.  The optional $type is 'bool' or 'int' (a leading
# "--" is allowed); any other type is ignored.
# Returns nothing if $git_dir is not set, the key is empty or contains
# characters other than word characters, or the variable does not exist.
# With 'bool' the string 'true' or 'false' is returned, with 'int' the
# result of config_to_int(), otherwise the stored value as it is.
# The parsed 'gitweb' section is cached in %config and re-read only when
# $git_dir differs from the one the cache was filled for.
sub git_get_project_config {
        my ($key, $type) = @_;

        # nothing to look up without a repository, or without a key
        return unless (defined $git_dir && $key);

        # only subsection, if exists, is case sensitive,
        # and not lowercased by 'git config -z -l'
        if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
                $key = lc($1) . ".$2." . lc($3);
        } else {
                $key = lc($key);
        }
        $key =~ s/^gitweb\.//;
        # key sanity check
        return if ($key =~ m/\W/);

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # get config, unless it is already cached for this repository
        unless (defined $config_file &&
                $config_file eq "$git_dir/config") {
                %config = git_parse_project_config('gitweb');
                $config_file = "$git_dir/config";
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        return unless exists $config{$full_key};

        # ensure given type
        my $value = $config{$full_key};
        return $value
                unless (defined $type);
        # backward compatibility: 'git config --bool' returns true/false
        return (config_to_bool($value) ? 'true' : 'false')
                if ($type eq 'bool');
        return config_to_int($value)
                if ($type eq 'int');
        return $value;
}
2712
# Get hash of given path at given ref, using "git ls-tree".
# $base is the tree-ish to look in, $path the path within it, and the
# optional $type ('blob', 'tree', ...) requires the entry found to be of
# that type.
# Returns undef if $path is missing or empty, if there is no entry for
# $path at $base, if the entry is of a different type than requested, or
# if the output of ls-tree cannot be read or parsed.
# Calls die_error() if the git command cannot be started.
sub git_get_hash_by_path {
        my ($base, $path, $type) = @_;

        # test for definedness and length rather than for truth,
        # so that a file named "0" can be looked up as well
        return undef unless (defined $path && length $path);

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        my ($entry_type, $entry_hash) =
                ($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/);
        # a line in unexpected format is treated like a missing entry,
        # instead of reading capture variables of a failed match
        return undef unless (defined $entry_hash);

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2739
# Get path of entry with given hash at given tree-ish (ref), by searching
# the output of "git ls-tree -r -t -z"; the first matching entry wins.
# Used to get 'from' filename for combined diff (merge commit) for renames.
# Returns nothing if $base or $hash is missing (or false), and undef if
# the git command cannot be started or no entry has the given hash.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # entries are read as NUL-terminated records (ls-tree is run with -z)
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # $hash is matched literally (\Q..\E); /s and \z make the
                # path capture run to the end of the record, so that a
                # path with a newline in it is returned whole
                if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
                        close $fd;
                        return $1;
                }
        }
        close $fd;
        return undef;
}
2763
2764## ......................................................................
2765## git utility functions, directly accessing git repository
2766
# Get the value of a config variable either from the file named as the
# variable itself in the repository ($GIT_DIR/$name file), or, when that
# file cannot be opened, from the gitweb.$name configuration variable in
# the repository config file.
# Only the first line of the file is used, without its line ending.
# Note that this sets the global $git_dir to "$projectroot/$path".
sub git_get_file_or_project_config {
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/$name") {
                # no such file (or it is unreadable): fall back to config
                return git_get_project_config($name);
        }
        my $conf = <$fd>;
        close $fd;

        chomp $conf
                if (defined $conf);
        return $conf;
}
2783
# Get the description of the project at $path: from its 'description'
# file or, failing that, from the gitweb.description config variable.
sub git_get_project_description {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'description');
}
2788
# Get the category of the project at $path: from its 'category'
# file or, failing that, from the gitweb.category config variable.
sub git_get_project_category {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'category');
}
2793
2794
# Get content tags ('ctags') of a project, as a hash reference
# mapping tag name to its weight.
# Supported formats, tried in this order:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
# Note that this sets the global $git_dir to "$projectroot/$project".
sub git_get_project_ctags {
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        # only the first line of the file is looked at;
                        # it is undefined for an empty file
                        my $val = <$ct>;
                        chomp $val if defined $val;
                        close $ct;

                        (my $ctag = $tagfile) =~ s#.*/##;
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2841
# Return a hash reference, where keys are content tags ('ctags'),
# and values are the sum of weights of the given tag over every project
# in the list referenced by $projects (each project keeps its own tags
# under the 'ctags' key).
sub git_gather_all_ctags {
        my $projects = shift;
        my %weight_of;

        for my $proj (@$projects) {
                $weight_of{$_} += $proj->{'ctags'}->{$_}
                        for keys %{$proj->{'ctags'}};
        }

        return \%weight_of;
}
2856
# Build a tag cloud out of a hash reference of content tags
# (tag name => weight).
# Tags that differ only in letter case are merged: their weights are
# added up, and the spelling with the largest weight is displayed.
# The tag equal to the 'ctag' input parameter is marked with
# <span class="match">.
# Returns an HTML::TagCloud object if that module can be loaded;
# otherwise a hash reference keyed by lower-cased tag, whose values
# hold the 'count' and the 'ctag' (HTML link) of the tag.
sub git_populate_project_tagcloud {
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $merged = ($ctags_lc{lc $tag} ||= {});

                $merged->{count} += $weight;
                if (!$merged->{topcount} || $merged->{topcount} < $weight) {
                        $merged->{topcount} = $weight;
                        $merged->{topname}  = $tag;
                }
        }

        my $matched = $input_params{'ctag'};
        # wrap title of the currently selected tag, leave others alone
        my $mark_match = sub {
                my ($ctag, $title) = @_;
                return (defined $matched && $matched eq $ctag)
                        ? qq(<span class="match">$title</span>)
                        : $title;
        };

        unless (eval { require HTML::TagCloud; 1; }) {
                # no HTML::TagCloud: describe the cloud with a plain hash
                my %cloud;
                foreach my $ctag (keys %ctags_lc) {
                        my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
                        $title = $mark_match->($ctag, $title);

                        $cloud{$ctag}{count} = $ctags_lc{$ctag}->{count};
                        $cloud{$ctag}{ctag} =
                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                }
                return \%cloud;
        }

        my $cloud = HTML::TagCloud->new;
        foreach my $ctag (sort keys %ctags_lc) {
                # Pad the title with spaces so that the cloud looks
                # less crammed.
                my $title = esc_html($ctags_lc{$ctag}->{topname});
                $title =~ s/ /&nbsp;/g;
                $title =~ s/^/&nbsp;/g;
                $title =~ s/$/&nbsp;/g;
                $title = $mark_match->($ctag, $title);

                $cloud->add($title, href(project=>undef, ctag=>$ctag),
                            $ctags_lc{$ctag}->{count});
        }
        return $cloud;
}
2902
# Return HTML of a tag cloud made by git_populate_project_tagcloud(),
# limited to at most $count tags.
# An HTML::TagCloud object renders itself, with $count passed to it as
# the limit.  The fallback (plain hash) representation is shown as a
# comma separated list of tag links, ordered by increasing weight;
# if there are more than $count tags, the $count heaviest are shown.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
                # The list is sorted with the lightest tags first, so the
                # limit has to cut them off from the front; taking the
                # first $count elements would show the least used tags
                # and hide the most used ones.
                splice(@tags, 0, @tags - $count)
                        if (@tags > $count);
                return
                        '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
                        join (', ', map {
                                $cloud->{$_}->{'ctag'}
                        } @tags) .
                        '</div>';
        }
}
2917
# Get the list of URLs of the project at $path: the lines of its
# 'cloneurl' file or, when that file cannot be opened, the values of
# the multi-valued gitweb.url config variable.
# Returns a list in list context, and an array reference otherwise.
# Note that this sets the global $git_dir to "$projectroot/$path".
sub git_get_project_url_list {
        my $path = shift;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/cloneurl") {
                # no 'cloneurl' file: fall back to repository config
                my $config_urls = config_to_multi(git_get_project_config('url'));
                return wantarray ? @$config_urls : $config_urls;
        }
        my @git_project_url_list = <$fd>;
        close $fd;
        chomp @git_project_url_list;

        return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2931
# Get the list of projects, as a list of hash references with the 'path'
# key (and also 'owner', if the list is read from a file).
# The source depends on $projects_list:
# * a directory is searched for repositories accepted by check_export_ok(),
#   descending at most $project_maxdepth levels,
# * a file is read as an url-encoded list of "<path> <owner>" lines.
# If $filter is given, only projects whose path begins with "$filter/"
# are returned.  For the directory case a true $paranoid makes the whole
# $projects_list be scanned, with the filter applied to paths found;
# otherwise only the "$filter" subdirectory is searched.
sub git_get_projects_list {
        my $filter = shift || '';
        my $paranoid = shift;
        my @list;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter && !$paranoid) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # paranoidly only filter here
                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
                                        # this is a subroutine, not a loop body:
                                        # leave it with 'return', not with 'next'
                                        return;
                                }
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next PROJECT;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next PROJECT;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
3013
# Return the projects from the list referenced by $projects that are not
# forks of another project on the list.  Forks of 'repo.git' are the
# projects found below the 'repo/' directory.
# As a side effect it sets the 'forks' field to the list of forks
# for forked projects.
# Written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
sub filter_forks_from_projects_list {
        my $projects = shift;

        my %trie; # prefix tree of directories (path components)
        # generate trie out of those directories that might contain forks
        foreach my $proj (@$projects) {
                # forks of 'repo.git' are in 'repo/' directory
                (my $fork_dir = $proj->{'path'}) =~ s/\.git$//;
                next if ($fork_dir =~ m!/$! ||           # skip non-bare repositories, e.g. 'repo/.git'
                         !$fork_dir ||                   # skip '.git' repository: tests, git-instaweb
                         !-d "$projectroot/$fork_dir");  # containing directory must exist
                $proj->{'forks'} = [];                   # there can be 0 or more forks of project

                # add to trie: walk down one path component at a time,
                # creating those nodes that are not there yet
                my $node = \%trie;
                foreach my $dir (split('/', $fork_dir)) {
                        $node->{$dir} = {}
                                unless (exists $node->{$dir});
                        $node = $node->{$dir};
                }
                # create end marker, store $proj as a data
                $node->{''} = $proj
                        unless (exists $node->{''});
        }

        # filter out forks, by finding shortest prefix match for paths
        my @filtered;
        foreach my $proj (@$projects) {
                # trie lookup
                my $node = \%trie;
                my $forked_from; # project that $proj is a fork of, if any
                foreach my $dir (split('/', $proj->{'path'})) {
                        if (exists $node->{''}) {
                                # found [shortest] prefix, is a fork
                                $forked_from = $node->{''};
                                last;
                        }
                        # not in trie, cannot have prefix, not a fork
                        last unless (exists $node->{$dir});
                        # If the dir is there, we just walk one step down the trie.
                        $node = $node->{$dir};
                }

                if ($forked_from) {
                        # a fork is recorded with its parent, and skipped
                        push @{$forked_from->{'forks'}}, $proj;
                } else {
                        # either no match, or we ran out of path components
                        push @filtered, $proj;
                }
        }

        return @filtered;
}
3073
# Filter a list of projects by content tag and/or by search regexp.
#
# Parameters:
#   $projlist - reference to an array of project hashes
#   %opts     - 'tagfilter'     => content tag to look for (case-insensitive)
#               'search_regexp' => regexp matched against the project's
#                                  'path' and 'descr_long'
# Returns the project hashes that pass every requested filter; when no
# filter is requested the whole list is returned as-is.
#
# note: fill_project_list_info is run from here so that the 'ctags' and
# 'path' / 'descr' information the filters rely on is filled
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my $wanted_tag = $opts{'tagfilter'};
        my $pattern    = $opts{'search_regexp'};

        # nothing to filter on: hand the list back untouched
        if (!$wanted_tag && !$pattern) {
                return @$projlist;
        }

        # searching projects requires filling to be run before it
        my @needed;
        push @needed, 'ctags'         if $wanted_tag;
        push @needed, 'path', 'descr' if $pattern;
        fill_project_list_info($projlist, @needed);

        my @matching;
 PROJECT:
        foreach my $proj (@$projlist) {
                if ($wanted_tag) {
                        my $ctags = $proj->{'ctags'};
                        next PROJECT unless ref($ctags) eq 'HASH';
                        next PROJECT unless
                                grep { lc($_) eq lc($wanted_tag) } keys %$ctags;
                }

                if ($pattern) {
                        next PROJECT unless
                                $proj->{'path'} =~ /$pattern/ ||
                                $proj->{'descr_long'} =~ /$pattern/;
                }

                push @matching, $proj;
        }

        return @matching;
}
3109
# Cache of project owners read from the $projects_list file: a hash
# reference mapping project path to owner, or undef while the file has
# not been read yet.
our $gitweb_project_owner = undef;

# Fill the $gitweb_project_owner cache from the $projects_list file.
#
# Does nothing if the cache has been filled already.  If $projects_list
# is not a plain file, or cannot be opened, the cache is left as an empty
# hash.  Blank lines are skipped; a line without an owner field records
# the project with whatever to_utf8() gives for an undefined owner.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        return unless (-f $projects_list);

        # the -f test does not guarantee that the file is readable
        open(my $fd, '<', $projects_list)
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($pr, $ow) = split ' ', $line;
                next unless defined $pr; # blank line: no project name
                $pr = unescape($pr);
                # the owner field is optional; do not unescape undef
                $ow = unescape($ow) if defined $ow;
                $gitweb_project_owner->{$pr} = to_utf8($ow);
        }
        close $fd;
        return;
}
3132
# Find the owner of a project.
#
# Sources are tried in order until one gives a defined value: the
# $gitweb_project_owner cache (filled from the projects list file on first
# use), the project's 'owner' config, and finally the owner of the
# repository directory.
#
# Side effect: sets the global $git_dir to "$projectroot/$project".
# Returns the owner, or undef if $project is false or no owner is found.
sub git_get_project_owner {
        my $project = shift;
        return undef unless $project;

        $git_dir = "$projectroot/$project";

        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner = exists $gitweb_project_owner->{$project}
                ? $gitweb_project_owner->{$project}
                : undef;
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
3156
# Find out how long ago the most recently committed branch head of the
# repository at "$projectroot/$path" was committed.
#
# Side effect: sets the global $git_dir to that repository.
# Returns ($age_in_seconds, $age_as_string); (undef, undef) when no
# committer timestamp could be read; nothing at all if the git command
# could not be started or exited with an error.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        # only the first line is of interest: refs are sorted newest first
        my $newest = <$fd>;
        close $fd or return;

        if (defined $newest &&
            $newest =~ / (\d+) [-+][01]\d\d\d$/) {
                my $age = time - $1;
                return ($age, age_string($age));
        }
        return (undef, undef);
}
3177
# Return the remotes of the current repository as listed by 'git remote -v'.
#
# Parameters:
#   $wanted - optional remote name; when given, only that remote is returned
# Returns a hash (list context) or hash reference (scalar context) mapping
# remote name to a hash with a 'heads' entry (left undefined here) plus one
# entry per URL kind printed by git (the word in parentheses), whose value
# is the URL.  Returns nothing if the command cannot be run or fails.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find if that
# particular remote is defined is to walk the list provided by 'git remote -v'
# and pick out what we want.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # check open() itself: its return value is what reports failure
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # strip "\t<url> (<key>)", leaving the remote name; skip
                # lines of unexpected shape instead of reusing stale captures
                next unless $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # 'heads' is present but undefined until it gets filled in
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3202
# Takes a reference to a hash of remotes as first parameter and fills it by
# adding the available remote heads for each of the indicated remotes.
#
# For every remote, its 'heads' entry is set to a reference to the list of
# those heads (as returned by git_get_heads_list) whose name starts with
# "<remote>/"; that prefix is stripped from the head's 'name' in place.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # the substitution both selects the heads of this remote and
                # shortens their names; \Q...\E makes the remote name match
                # literally even if it contains regexp metacharacters
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3215
# Collect the refs of the current repository, grouped by object id.
#
# Parameters:
#   $type - optional kind of refs to list (passed to git as "refs/$type",
#           e.g. "tags"); all refs are listed when it is empty
# Returns a reference to a hash mapping object id to a reference to the
# list of ref names (without the leading "refs/") that point at it, or
# nothing if 'git show-ref' cannot be run or fails.
sub git_get_references {
        my $type = shift || "";
        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        my %refs;
        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                # the list for an id seen for the first time is autovivified
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
3238
# Describe a revision relative to tags, using 'git name-rev --tags'.
#
# Parameters:
#   $hash - revision to name
# Returns the part of the name-rev output following "tags/", or undef if
# $hash is false, the command printed nothing, or the revision cannot be
# named after a tag.  Returns nothing if the command cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all: nothing to match against
        return undef unless defined $name_rev;

        # \Q...\E: $hash is literal text here, not a pattern
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        }
        # catches also '$hash undefined' output
        return undef;
}
3254
3255## ----------------------------------------------------------------------
3256## parse to hash functions
3257
# Break an epoch timestamp down into the date strings used by the views.
#
# Parameters:
#   $epoch - seconds since the epoch
#   $tz    - timezone as "+hhmm" / "-hhmm"; defaults to "-0000"
# Returns a hash with:
#   'hour', 'minute', 'mday', 'day', 'month'  - UTC components
#   'rfc2822', 'mday-time', 'iso-8601'        - UTC formatted strings
#   'hour_local', 'minute_local'              - components in timezone $tz
#   'tz_local'                                - $tz as given
#   'iso-tz'                                  - local time followed by $tz
# A $tz which is not of the "+hhmm" form is treated as a zero offset.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # offset of the timezone in seconds; only computed from a well-formed
        # $tz, so that a malformed one does not lead to arithmetic on undef
        my $tz_offset = 0;
        if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
                my ($tz_sign, $tz_hour, $tz_min) = ($1, $2, $3);
                $tz_offset = ($tz_sign eq '-' ? -1 : +1) *
                             ((($tz_hour*60) + $tz_min)*60);
        }
        # shifting the epoch and using gmtime() gives the local wall clock
        my $local = $epoch + $tz_offset;
        ($sec, $min, $hour, $mday, $mon, $year) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3291
# Parse a tag object, as printed by 'git cat-file tag'.
#
# Parameters:
#   $tag_id - id of the tag object
# Returns a hash with 'id', 'object', 'type', 'name', the tagger info
# ('author', 'author_epoch', 'author_tz', 'author_name' and, when present,
# 'author_email') and 'comment' (reference to the list of message lines,
# newlines kept).  Returns nothing if the command cannot be run or fails,
# or if the output has no "tag <name>" line.
sub parse_tag {
        my $tag_id = shift;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

        my %tag = ('id' => $tag_id);
        my @comment;
 HEADER:
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                } elsif ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                } elsif ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                } elsif ($line =~ m/--BEGIN/) {
                        # such a line already belongs to the message
                        push @comment, $line;
                        last HEADER;
                } elsif ($line eq "") {
                        # empty line separates the headers from the message
                        last HEADER;
                }
        }
        # whatever is left is the message
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
3332
# Parse one record of 'git rev-list --header' output into a commit hash.
#
# Parameters:
#   $commit_text - text of one record: a line with the commit id (optionally
#                  followed by parent ids), header lines, an empty line and
#                  the message indented by four spaces, ended by "\0"
#   $withparents - if defined, parents are taken only from the first line;
#                  otherwise "parent" header lines are collected as well
# Returns a hash with 'id', 'tree', 'parents' (list reference), 'parent'
# (first parent), author and committer info, 'title', 'title_short',
# 'comment' (reference to the list of message lines, indentation removed),
# 'age', 'age_string', 'age_string_date' and 'age_string_age'.
# Returns nothing if the text is empty, does not begin with a 40-digit hex
# id, or has no "tree" header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # header lines; the loop ends at the empty line before the message
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # the title is the first non-empty line of the message
        foreach my $title (@commit_lines) {
                $title =~ s/^    //;
                if ($title ne "") {
                        $co{'title'} = chop_str($title, 80, 5);
                        # $title aliases an element of @commit_lines, which
                        # becomes $co{'comment'}: shorten a copy, so that the
                        # message itself is left intact
                        my $short = $title;
                        # remove leading stuff of merges to make the interesting part visible
                        if (length($short) > 50) {
                                $short =~ s/^Automatic //;
                                $short =~ s/^merge (of|with) /Merge ... /i;
                                if (length($short) > 50) {
                                        $short =~ s/(http|rsync):\/\///;
                                }
                                if (length($short) > 50) {
                                        $short =~ s/(master|www|rsync)\.//;
                                }
                                if (length($short) > 50) {
                                        $short =~ s/kernel.org:?//;
                                }
                                if (length($short) > 50) {
                                        $short =~ s/\/pub\/scm//;
                                }
                        }
                        $co{'title_short'} = chop_str($short, 50, 5);
                        last;
                }
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # commits older than two weeks get the date as the primary string
        # and the relative age as the secondary one; newer ones the reverse
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3430
# Read and parse a single commit.
#
# Parameters:
#   $commit_id - revision to parse
# Runs 'git rev-list --parents --header --max-count=1' and hands its output
# to parse_commit_text() (with parents taken from the first line).  Calls
# die_error() if the command cannot be started.
# Returns the commit hash produced by parse_commit_text().
sub parse_commit {
        my ($commit_id) = @_;

        # records in rev-list --header output are terminated by NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--parents",
                   "--header",
                   "--max-count=1",
                   $commit_id,
                   "--");
        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");
        my %co = parse_commit_text(<$fd>, 1);
        close $fd;

        return %co;
}
3449
# Read and parse a series of commits.
#
# Parameters:
#   $commit_id - revision to start listing from
#   $maxcount  - maximum number of commits (1 if false)
#   $skip      - number of commits to skip first (0 if false)
#   $filename  - optional path to limit the listing to
#   @args      - additional arguments for 'git rev-list'
# The file-level @extra_options are passed to the command as well.  Calls
# die_error() if the command cannot be started.
# Returns the list of commit hash references (list context) or a reference
# to that list (scalar context).
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount = 1 unless $maxcount;
        $skip     = 0 unless $skip;

        # records in rev-list --header output are terminated by NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--header",
                   @args,
                   "--max-count=$maxcount",
                   "--skip=$skip",
                   @extra_options,
                   $commit_id,
                   "--");
        push @cmd, $filename if $filename;

        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");
        my @cos;
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3477
# parse line of git-diff-tree "raw" output
#
# Three kinds of lines are recognized:
#  * ordinary diff: gives 'from_mode', 'to_mode', 'from_id', 'to_id',
#    'status', 'similarity', 'from_file', 'to_file', and 'file' unless the
#    status is rename or copy
#  * combined diff (for merge commit): gives 'nparents', 'from_mode' and
#    'from_id' (list references, one entry per parent), 'to_mode', 'to_id',
#    'status' (reference to list of status letters) and 'to_file'
#  * a line with just a commit id: gives 'commit'
# Anything else gives an empty result.
# Returns a hash (list context) or a reference to it (scalar context).
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{qw(from_mode to_mode from_id to_id status similarity)} =
                        ($1, $2, $3, $4, $5, $6);
                my $names = $7;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        # two tab-separated names: source and destination
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $names);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
                my ($colons, $modes, $ids, $status, $name) = ($1, $2, $3, $4, $5);
                # the last mode and the last id describe the result,
                # the ones before them the parents
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $status) ];
                $res{'to_file'}   = unquote($name);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3516
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
#
# A hash reference is handed back unchanged; anything else is passed to
# parse_difftree_raw_line() and its result is returned.
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # pre-parsed (or generated by hand)
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3529
# parse line of git-ls-tree output
#
# Parameters:
#   $line - one entry of git-ls-tree output
#   %opts - '-l' => true if the line includes the object size
#           '-z' => true if the name is to be taken verbatim; otherwise
#                   it is passed through unquote()
# Returns a hash (list context) or a reference to it (scalar context) with
# 'mode', 'type', 'hash', 'name' and, with '-l', 'size'.  The result is
# empty if the line is not of the expected form.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        # capture through list assignment, so that a failed match gives an
        # empty list rather than captures left over from an earlier match
        my @fields = $opts{'-l'}
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                ? ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s)
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                : ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);

        # unparsable line: %res is still empty here
        return wantarray ? %res : \%res
                unless @fields;

        # the name is always the last captured field
        my $name = pop @fields;
        @res{'mode', 'type', 'hash'} = @fields[0 .. 2];
        $res{'size'} = $fields[3] if $opts{'-l'};
        $res{'name'} = $opts{'-z'} ? $name : unquote($name);

        return wantarray ? %res : \%res;
}
3565
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# Parameters:
#   $diffinfo - parsed line of raw diff output (hash reference)
#   $from     - hash reference, filled with info about the preimage(s)
#   $to       - hash reference, filled with info about the postimage
#   @parents  - parent commits, used for combined diff
# For a combined diff $from->{'file'} and $from->{'href'} are list
# references with one entry per parent; otherwise they are plain values.
# An 'href' is a "blob" view link; there is none for an added file on the
# 'from' side, nor for a deleted file on the 'to' side.  The file-level
# $hash_parent and $hash are used as the bases of links for an ordinary
# diff and for the 'to' side.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the name in the result where the
                        # name in the parent is not known
                        my $name_in_parent = $diffinfo->{'from_file'}[$i];
                        $from->{'file'}[$i] = defined $name_in_parent
                                ? $name_in_parent
                                : $diffinfo->{'to_file'};
                        $from->{'href'}[$i] = $diffinfo->{'status'}[$i] ne "A" # not new (added) file
                                ? href(action=>"blob",
                                       hash_base=>$parents[$i],
                                       hash=>$diffinfo->{'from_id'}[$i],
                                       file_name=>$from->{'file'}[$i])
                                : undef;
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) { # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3611
3612## ......................................................................
3613## parse to array of hashes functions
3614
# List heads (branches), most recently committed first.
#
# Parameters:
#   $limit   - if true, 'git for-each-ref' is asked for at most $limit + 1
#              refs
#   @classes - kinds of refs to list, as subdirectories of "refs/";
#              defaults to ('heads')
# Returns a list (list context) or a reference to a list (scalar context)
# of hash references with 'fullname', 'name' (without the "refs/heads/" or
# "refs/remotes/" prefix), 'id', 'title', 'epoch' and 'age'.  Returns
# nothing if the command cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;

        my @headslist;
        while (my $line = <$fd>) {
                chomp $line;
                # NUL separates the ref info from the committer info
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $fullname, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my $name = $fullname;
                $name =~ s!^refs/(?:head|remote)s/!!;

                my $age = "unknown";
                if ($epoch) {
                        $age = age_string(time - $epoch);
                }

                my %ref_item;
                $ref_item{'fullname'} = $fullname;
                $ref_item{'name'}     = $name;
                $ref_item{'id'}       = $hash;
                $ref_item{'title'}    = $title || '(no commit message)';
                $ref_item{'epoch'}    = $epoch;
                $ref_item{'age'}      = $age;

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3653
# List tags, most recently created first.
#
# Parameters:
#   $limit - if true, 'git for-each-ref' is asked for at most $limit + 1 refs
# Returns a list (list context) or a reference to a list (scalar context)
# of hash references with 'fullname', 'name' (without "refs/tags/"), 'type',
# 'id', 'reftype' and 'refid'; a tag object additionally has 'subject', and
# tag and commit objects have 'epoch' and 'age'.  Returns nothing if the
# command cannot be started.
sub git_get_tags_list {
        my $limit = shift;

        my $format = '%(objectname) %(objecttype) %(refname) '.
                     '%(*objectname) %(*objecttype) %(subject)%00%(creator)';
        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
                "--format=$format",
                'refs/tags'
                or return;

        my @tagslist;
        while (my $line = <$fd>) {
                chomp $line;
                # NUL separates the ref info from the creator info
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $fullname, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my ($creator, $epoch, $tz) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my $name = $fullname;
                $name =~ s!^refs/tags/!!;

                my %ref_item;
                $ref_item{'fullname'} = $fullname;
                $ref_item{'type'} = $type;
                $ref_item{'id'} = $id;
                $ref_item{'name'} = $name;

                my $is_tag = ($type eq "tag");
                if ($is_tag) {
                        # tag object: record what it points at
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # the ref points directly at the object
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($is_tag || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        if ($epoch) {
                                $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                        } else {
                                $ref_item{'age'} = "unknown";
                        }
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3702
3703## ----------------------------------------------------------------------
3704## filesystem-related functions
3705
# Find the name of the owner of a file, from the GECOS field of the
# password database entry of the user owning it.
#
# Parameters:
#   $path - file or directory to examine
# Returns the GECOS field up to (not including) the first ',' or ';',
# converted with to_utf8(); undef if the file cannot be examined or the
# user has no such field.
sub get_file_owner {
        my $path = shift;

        # field 4 of stat() is the numeric user id of the owner
        my $st_uid = (stat($path))[4];
        # stat() failed: getpwuid(undef) would look up user id 0 instead
        return undef unless defined $st_uid;

        # field 6 of getpwuid() is the GECOS field
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3718
# Print the contents of a file, each line converted with to_utf8().
#
# Parameters:
#   $filename - file to print
# The file is expected to exist; if it cannot be opened nothing is printed.
sub insert_file {
        my $filename = shift;

        # do not try to read from a handle which failed to open
        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3727
3728## ......................................................................
3729## mimetype related functions
3730
# Guess the MIME type of a file from its extension, using a map file.
#
# Parameters:
#   $filename - name of the file to guess the type of
#   $mimemap  - path to the map file; each line holds a MIME type followed
#               by the extensions it applies to, lines starting with '#'
#               are comments
# Returns the MIME type, or undef if the map file cannot be read, the file
# name has no extension, or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # read into a lexical, so that the caller's $_ is left alone
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/, $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        # without a successful match $1 would be left over from elsewhere
        $filename =~ /\.([^.]*)$/ or return undef;
        return $mimemap{$1};
}
3750
# Guess the MIME type of a file from its name.
#
# The map named by $mimetypes_file (if set) is consulted first, then
# '/etc/mime.types'.
# Returns the MIME type, or undef if the name contains no dot or neither
# map gives a type.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # if it is relative path, it is relative to project
                my $file = ($mimetypes_file !~ m!^/!)
                        ? "$projectroot/$project/$mimetypes_file"
                        : $mimetypes_file;
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime = mimetype_guess_file($filename, '/etc/mime.types')
                unless $mime;
        return $mime;
}
3767
# Find the MIME type of a blob.
#
# Parameters:
#   $fd       - filehandle the blob can be read from
#   $filename - name of the file, if known
# A type guessed from the file name wins.  Failing that,
# $default_blob_plain_mimetype is used if there is no filehandle;
# otherwise content passing the -T test is 'text/plain', and other content
# is classified by a few well known image extensions, with
# 'application/octet-stream' as the fallback.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $mime = mimetype_guess($filename);
                return $mime if $mime;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain'               if -T $fd;
        return 'application/octet-stream' unless $filename;
        return 'image/png'                if $filename =~ m/\.png$/i;
        return 'image/gif'                if $filename =~ m/\.gif$/i;
        return 'image/jpeg'               if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3794
# Build the content type to send for a blob.
#
# Parameters:
#   $fd        - filehandle the blob can be read from
#   $file_name - name of the file, if known
#   $type      - MIME type; found with blob_mimetype() if false
# Returns the MIME type; for 'text/plain' a "; charset=..." parameter is
# appended if $default_text_plain_charset is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return "$type; charset=$default_text_plain_charset";
}
3805
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Parameters:
#   $highlight - true if highlighting is enabled
#   $mimetype  - not used at present
#   $file_name - name of the file
# The base name of the file (with a trailing '.in' removed) is looked up in
# %highlight_basename first, then its extension in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # capture through list assignment: if there is no extension, $ext is
        # undefined rather than a capture left over from an earlier match
        my ($ext) = ($basename =~ /\.([^.]*)$/);
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3822
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# Parameters:
#   $fd        - filehandle of the blob; closed if highlighting is done
#   $highlight - true if highlighting is enabled
#   $syntax    - name of the syntax to highlight as; undef for none
# The blob named by the file-level $hash is read again with
# 'git cat-file blob' and piped through $highlight_bin.  Calls die_error()
# if that pipeline cannot be started.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight && defined $syntax);

        close $fd;
        # NOTE(review): $syntax goes into the command line unquoted -
        # confirm that it can only come from trusted configuration
        my $pipeline =
                quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
                quote_command($highlight_bin).
                " --replace-tabs=8 --fragment --syntax $syntax |";
        # the trailing '|' makes open() read from the output of the command
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3836
3837## ======================================================================
3838## functions printing HTML: header, footer, error page
3839
# Build the title of the current page from the file-level request state.
#
# The title starts with $site_name.  Without a project, the project filter
# (if any) is mentioned.  With a project, the project name is appended,
# then "/$action" and the file name, as far as these are defined; the file
# name of a "tree" view is given a trailing "/".
sub get_page_title {
        my $title = to_utf8($site_name);

        if (!defined $project) {
                $title .= " - projects in '" . esc_path($project_filter) . "'"
                        if defined $project_filter;
                return $title;
        }
        $title .= " - " . to_utf8($project);

        if (defined $action) {
                $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                if (defined $file_name) {
                        $title .= " - " . esc_path($file_name);
                        $title .= "/"
                                if ($action eq "tree" && $file_name !~ m|/$|);
                }
        }

        return $title;
}
3862
# Choose the content type for HTML pages.
#
# 'application/xhtml+xml' is sent only when the UA names it explicitly in
# its Accept header; everything else gets plain old 'text/html'.  The
# explicit check is needed because MSIE sometimes globs '*/*', pretending
# to support xhtml+xml but choking when it gets what it asked for.
sub get_content_type_html {
        my $xhtml = 'application/xhtml+xml';
        my $accept = $cgi->http('HTTP_ACCEPT');

        return 'text/html'
                unless defined $accept;
        return 'text/html'
                unless $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/;
        return 'text/html'
                if $cgi->Accept('application/xhtml+xml') == 0;

        return $xhtml;
}
3876
# Print the <link rel="alternate"> elements that belong in the page head.
#
# With a project selected, two links are printed for each of the RSS and
# Atom formats: the plain feed and a "(no merges)" variant, both built
# from the parameters returned by get_feed_info().  Without a project,
# links to the 'project_index' and 'opml' actions are printed instead.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # Work on a per-format copy: setting 'extra_options'
                        # on the shared hash would leak '--no-merges' from
                        # the RSS iteration into the plain Atom link.
                        my %feed_params = (%href_params, 'action' => $type);

                        $link_attr{'-href'} = href(%feed_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        # same feed again, this time without merge commits
                        $feed_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%feed_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3921
# Print the <link> elements of the page head: stylesheets, feed links
# (only for a '200 OK' page) and the favicon.
#
# $status is the HTTP status string of the page being generated.
sub print_header_links {
        my ($status) = @_;

        # a $stylesheet defined in a config file takes precedence, for
        # backwards compatibility; otherwise every non-empty entry of
        # @stylesheets is used
        my @sheets = defined $stylesheet
                   ? ($stylesheet)
                   : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
                if defined $favicon;
}
3941
# Print one breadcrumb link per directory component given in @_.
#
# Each link points at the 'project_list' action with project_filter set
# to the path accumulated so far, and is followed by " / ".
sub print_nav_breadcrumbs_path {
        my $dirprefix = undef;
        # Iterate over the arguments instead of testing the truth of each
        # shifted value: a directory named "0" is a valid component and
        # must not end the breadcrumb trail early.
        foreach my $part (@_) {
                # skip empty components such as those produced by '//'
                next unless (defined $part && length $part);
                $dirprefix .= "/" if defined $dirprefix;
                $dirprefix .= $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => $dirprefix,
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
3953
# Print the breadcrumb trail of the page header: the home link, then
# either the project path, project name, action and the optional
# -action_extra text, or (without a project) the project filter path.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $action_extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";

        if (!defined $project) {
                if (defined $project_filter) {
                        print_nav_breadcrumbs_path(split '/', $project_filter);
                }
                return;
        }

        my @dirname = split '/', $project;
        my $projectbasename = pop @dirname;
        print_nav_breadcrumbs_path(@dirname);
        print $cgi->a({-href => href(action=>"summary")}, esc_html($projectbasename));

        if (defined $action) {
                # the action becomes a link only when extra text follows it
                my $action_print = defined $action_extra
                        ? $cgi->a({-href => href(action=>$action)}, $action)
                        : $action;
                print " / $action_print";
        }
        print " / $action_extra"
                if defined $action_extra;
        print "\n";
}
3979
# Print the search form of the page header.
#
# The form searches from $hash_base, else $hash, else "HEAD".  With the
# 'pathinfo' feature the project goes into the form action; otherwise it
# is sent as the hidden 'p' field.  An undefined global $searchtext is
# set to the empty string as a side effect.
sub print_search_form {
        $searchtext = "" unless defined $searchtext;

        my $search_hash = defined $hash_base ? $hash_base
                        : defined $hash      ? $hash
                        :                      "HEAD";

        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        $action .= "/".esc_url($project) if $use_pathinfo;

        # The pieces are appended with '.=' so that every CGI call happens
        # in the same order, and in scalar context, as one big concatenation.
        my $head = $cgi->startform(-method => "get", -action => $action);
        $head .= "<div class=\"search\">\n";
        if (!$use_pathinfo) {
                $head .= $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n";
        }
        $head .= $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n";
        $head .= $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n";
        $head .= $cgi->popup_menu(-name => 'st', -default => 'commit',
                                  -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']);
        $head .= $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?"));
        $head .= " search:\n";

        my $tail = $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n";
        $tail .= "<span title=\"Extended regular expression\">";
        $tail .= $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                -checked => $search_use_regexp);
        $tail .= "</span>";
        $tail .= "</div>";
        $tail .= $cgi->end_form() . "\n";

        print $head, $tail;
}
4015
# Print the HTTP header (unless -no_http_header is given) and the opening
# part of every HTML page: XML prolog, <head>, optional site header, the
# page_header div with logo and breadcrumbs, and the search form.
#
# Parameters:
#   $status  - HTTP status string, defaults to "200 OK"
#   $expires - value passed as -expires to the HTTP header
#   %opts    - options; also forwarded to print_nav_breadcrumbs()
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if ($ENV{'PATH_INFO'});
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if (defined $site_html_head_string);

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my %link_attr = (-href => esc_url($logo_url),
                                 -title => $logo_label);
                my %img_attr = (-src => esc_url($logo),
                                -width => 72, -height => 27,
                                -alt => "git",
                                -class => "logo");
                print $cgi->a(\%link_attr, $cgi->img(\%img_attr));
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $search_enabled = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $search_enabled);
}
4074
# Print the closing part of every HTML page: the page_footer div with
# the project description and feed links (or the OPML/TXT links when no
# project is selected), optional timing information, the optional site
# footer, the JavaScript includes and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # no feed parameters at all: mark the links as generic
                $feed_class .= ' generic'
                        unless %href_params;
                $href_params{'-title'} ||= 'log';

                foreach my $format ('RSS', 'Atom') {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n" .
                      'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n" .
                      "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;

        my $incremental_blame =
                (defined $action && $action eq 'blame_incremental');
        if (!$incremental_blame) {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # statements to run from the window.onload handler
                my @onload;
                if (gitweb_check_feature('javascript-actions')) {
                        push @onload, qq!       fixLinks();\n!;
                }
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        push @onload,
                              qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!, # in days
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }

                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!.
                      join('', @onload).
                      qq!};\n!.
                      qq!</script>\n!;
        } else {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4153
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# The error message is HTML-escaped; the detailed description is printed
# as-is.  Any further arguments are options, which are also passed on to
# git_header_html().  After printing the error page, control jumps to
# DONE_GITWEB unless the '-error_handler' option is set.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # A status code without an entry above would hand undef to
        # git_header_html(), which then falls back to "200 OK"; an error
        # page must never be delivered as a success, so use 500 instead.
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4197
4198## ----------------------------------------------------------------------
4199## functions printing or outputting HTML: navigation
4200
# Print the page_nav div: the standard navigation links (summary,
# shortlog, log, commit, commitdiff, tree) plus any links configured
# through the 'actions' feature, followed by $extra.
#
# Parameters:
#   $current  - name of the current view; printed as text, not as a link
#   $suppress - name of a standard view to leave out (if true)
#   $head     - hash used for the commit/commitdiff links and, in some
#               views, for the shortlog/log links
#   $treehead - hash for the tree link
#   $treebase - hash base for the tree link
#   $extra    - additional HTML (pager or formats); defaults to ''
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        my %arg = map { $_ => {action=>$_} } @navs;
        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                push @with_head, qw(shortlog log)
                        if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x);
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # placeholders available in the links of the 'actions' feature
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        my @actions = gitweb_get_feature('actions');
        while (@actions) {
                # the feature is a flat list of (label, link, position) triples
                my ($label, $link, $pos) = splice(@actions,0,3);
                # insert the new label right after the view named by $pos
                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
                # expand the %-placeholders
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @links;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @links, $nav;
                        next;
                }
                push @links,
                     $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" .
              join(" | ", @links);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4250
# Returns a submenu for the navigation of the refs views (tags, heads,
# remotes).  The current view is shown as plain text, the others as
# links; the remotes view is only included if the 'remote_heads' feature
# is enabled.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                push @entries, ($view eq $current)
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view);
        }
        return join " | ", @entries;
}
4263
# Returns the "first . prev . next" pager as an HTML string.
#
# Parameters:
#   $action        - not used by this function
#   $page          - current page number; "first" and "prev" are links
#                    only when it is greater than 0
#   $has_next_link - true if "next" should be a link
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;
        my ($first, $prev, $next) = ("first", "prev", "next");

        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                  -accesskey => "p", -title => "Alt-p"}, "prev");
        }
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
4289
4290## ......................................................................
4291## functions printing or outputting HTML: div
4292
# Print a div of class "header" holding a single link of class "title".
#
# The link points at $action, with $hash and $hash_base added when they
# are true; its text is $title, or $action when no title is given.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $link = $cgi->a({-href => href(%args), -class => "title"},
                           $title ? $title : $action);
        print "<div class=\"header\">\n" . $link . "\n</div>\n";
}
4306
# Returns one "metadata_url" table row with $name in the first cell and
# $url in the second; both are inserted as given, without escaping.
sub format_repo_url {
        my ($name, $url) = @_;
        return join('',
                '<tr class="metadata_url">',
                "<td>$name</td>",
                "<td>$url</td>",
                "</tr>\n");
}
4311
# Group output by placing it in a DIV element and adding a header.
#
# Arguments, in order:
#   - optional hash reference: options for start_div()
#   - optional array reference: arguments for git_print_header_div()
#   - the content, which can be
#       a scalar (output as-is),
#       a scalar reference (output after html escaping),
#       an IO handle passed either as *handle or *handle{IO}, or
#       a function reference, in which case all following parameters
#       are taken as arguments to the content function call.
sub git_print_section {
        my $div_args    = (ref($_[0]) eq 'HASH')  ? shift : undef;
        my $header_args = (ref($_[0]) eq 'ARRAY') ? shift : undef;
        my $content     = shift;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        my $kind = ref($content);
        if ($kind eq 'CODE') {
                $content->(@_);
        }
        elsif ($kind eq 'SCALAR') {
                print esc_html($$content);
        }
        elsif ($kind eq 'GLOB' || $kind eq 'IO::Handle') {
                print <$content>;
        }
        elsif (!$kind && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4349
# Returns the HTML for a timestamp: the 'rfc2822' string of the date
# hash reference $date (wrapped in a span when the 'javascript-timezone'
# feature supplies a class for it), followed by the local time and
# timezone in parentheses.  Local times before 06:00 are marked with
# class "atnight".
sub format_timestamp_html {
        my ($date) = @_;

        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');

        my $strtime = $date->{'rfc2822'};
        $strtime = qq!<span class="$datetime_class">$strtime</span>!
                if $datetime_class;

        my $clock_format = ($date->{'hour_local'} < 6)
                ? '<span class="atnight">%02d:%02d</span>'
                : '%02d:%02d';
        my $localtime = sprintf('(' . $clock_format . ' %s)',
                                $date->{'hour_local'}, $date->{'minute_local'}, $date->{'tz_local'});

        return $strtime . ' ' . $localtime;
}
4370
# Outputs the author name and date in long form.
#
# $co is a commit hash reference; the -tag option names the enclosing
# HTML element and defaults to 'div'.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
        my $author_link = format_search_author($author, "author", esc_html($author));
        my $timestamp = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_link .
              " [" . $timestamp . "]" .
              $avatar .
              "</$tag>\n";
}
4385
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer')
                if !@people;

        foreach my $who (@people) {
                my $name = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};

                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});
                my $name_link = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');
                my $timestamp = format_timestamp_html(\%wd);

                # first row: who, name and email, avatar spanning both rows;
                # second row: the timestamp
                print "<tr><td>$who</td><td>" .
                      $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $timestamp .
                      "</td>" .
                      "</tr>\n";
        }
}
4413
# Print the page_path div: a link to the tree root followed by one link
# per directory of the path and, last, the final path component.
#
# Parameters:
#   $name - path to print (may be undef, then only the root is printed)
#   $type - 'blob' or 'tree' to make the last component a link to the
#           'blob_plain' or 'tree' action; anything else prints it as text
#   $hb   - hash base used for all the links
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth, of the prefix so
                        # that a leading directory named "0" still gets its
                        # separator
                        $fullname .= (length $fullname ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # The links below are built from the $name argument (which
                # also supplies their title and text) rather than from the
                # global $file_name, so they always match the printed path.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4451
# Print the lines of a commit message as HTML.
#
# $log is a reference to the array of message lines; note that the title
# (with -remove_title) and leading empty lines are shifted off the
# caller's array.  Options:
#   -remove_title     - drop the first line of the log
#   -remove_signoff   - do not print signoff-like lines
#                       (Signed-off-by, Acked-by, Cc)
#   -final_empty_line - end the output with a single empty line
# Runs of empty lines are collapsed to one, and an empty line directly
# after a printed signoff line is not printed.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # last printed line was a signoff line
        my $empty = 0;   # last printed line was an empty line
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                                $signoff = 1;
                                $empty = 0;
                        }
                        # a removed signoff line leaves no trace: the flags
                        # keep describing the last line actually printed
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        # Reset the signoff flag only here, once a regular
                        # line is printed; resetting it before the test
                        # above would make the signoff check a no-op.
                        $empty = 0;
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4500
# Return link target (what link points to): the whole content of the
# blob $hash as read from "git cat-file blob".  Returns nothing if the
# command cannot be started or if closing its pipe reports a failure.
sub git_get_link_target {
        my ($hash) = @_;

        # read link
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;
        # slurp everything at once
        my $link_target = do { local $/ = undef; <$fd> };
        close $fd
                or return;

        return $link_target;
}
4518
# Given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# Parameters:
#   $link_target - the path the symbolic link points to
#   $basedir     - directory containing the link, relative to the top
#                  tree; empty or undef for the top tree itself
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir)
        my $path;
        if (defined $basedir && length $basedir) {
                # test the length rather than the truth of $basedir, so
                # that a directory named "0" is not mistaken for the top
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and ''; compare against the empty string
                # explicitly, because a component named "0" is false too
                # but must be kept
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        if (@path_parts) {
                                pop @path_parts;
                        } else {
                                # link leads outside repository (outside top dir)
                                return;
                        }
                } else {
                        push @path_parts, $part;
                }
        }
        $path = join('/', @path_parts);

        return $path;
}
4558
# Print the cells of one tree-listing row (a row of git_tree); the
# enclosing <tr> element is left to the caller.
#
# A row consists of: mode cell, optional size cell, name cell (a link
# for blobs and trees) and a cell with the action links.
#
# $t          - hashref describing the entry; 'mode', 'type', 'hash' and
#               'name' are read, 'size' is printed when the key exists
# $basedir    - prefix put verbatim in front of the entry name to form
#               the file_name link parameter
# $hash_base  - passed on as hash_base link parameter; when undefined
#               the "history" links are left out
# $have_blame - true to add a "blame" link for blobs
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my $path     = "$basedir$t->{'name'}";
        my $has_base = defined $hash_base;
        # hash_base is added to blob/tree links only when it is known
        my %base_key = $has_base ? ('hash_base' => $hash_base) : ();

        print '<td class="mode">' . mode_str($t->{'mode'}) . "</td>\n";
        print qq(<td class="size">$t->{'size'}</td>\n) if exists $t->{'size'};

        # contents of the "list" cell and entries of the "link" cell
        my ($name_cell, @links);

        if ($t->{'type'} eq "blob") {
                $name_cell =
                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                               file_name=>$path, %base_key),
                                 -class => "list"}, esc_path($t->{'name'}));

                # for symbolic links show (and, if possible, link to) the target
                if (S_ISLNK(oct $t->{'mode'})) {
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                $name_cell .= " -> " .
                                        (defined $norm_target
                                         ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                  file_name=>$norm_target),
                                                    -title => $norm_target}, esc_path($link_target))
                                         : esc_path($link_target));
                        }
                }

                push @links,
                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                               file_name=>$path, %base_key)},
                                "blob");
                push @links,
                        $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                               file_name=>$path, %base_key)},
                                "blame")
                        if $have_blame;
                push @links,
                        $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                               hash=>$t->{'hash'}, file_name=>$path)},
                                "history")
                        if $has_base;
                push @links,
                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                               file_name=>$path)},
                                "raw");

        } elsif ($t->{'type'} eq "tree") {
                $name_cell =
                        $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                               file_name=>$path, %base_key)},
                                esc_path($t->{'name'}));

                push @links,
                        $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                               file_name=>$path, %base_key)},
                                "tree");
                push @links,
                        $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                               file_name=>$path)},
                                "history")
                        if $has_base;

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                $name_cell = esc_path($t->{'name'});

                push @links,
                        $cgi->a({-href => href(action=>"history",
                                               hash_base=>$hash_base,
                                               file_name=>$path)},
                                "history")
                        if $has_base;
        }

        print '<td class="list">' . $name_cell . "</td>\n";
        print '<td class="link">' . join(" | ", @links) . "</td>\n";
}
4651
4652## ......................................................................
4653## functions printing large fragments of HTML
4654
# Fill in pre-image filenames for a merge (combined) diff entry.
#
# $diff    - hashref of a parsed combined diff line; 'nparents', 'status'
#            and 'from_id' are read, 'from_file' is replaced
# @parents - parent commits, in the same order as the per-parent arrays
#
# 'from_file' gets one slot per parent; a slot is looked up with
# git_get_path_by_hash() only where the status for that parent is a
# rename ('R') or a copy ('C'), and is left undefined otherwise.
# Returns $diff itself.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $from_file = $diff->{'from_file'} = [ ];
        # size the list up front: assign to the slot of the last parent
        $from_file->[$diff->{'nparents'} - 1] = undef;

        foreach my $i (0 .. $diff->{'nparents'} - 1) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4671
# Tell whether a parsed raw difftree line describes a file deletion,
# i.e. whether its post-image object id is the null (all-zero) id.
#
# $diffinfo - hashref of parsed raw diff format; only 'to_id' is read
#
# The null id is recognized in full length for both SHA-1 (40 hex
# digits) and SHA-256 (64 hex digits) repositories.
sub is_deleted {
        my $diffinfo = shift;
        my $to_id = $diffinfo->{'to_id'};

        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4678
# Check whether a patch belongs to the [previous] raw difftree line,
# i.e. whether both name the same post-image file.
#
# $diffinfo  - hashref of parsed raw diff format (may be undefined)
# $patchinfo - hashref of parsed patch diff format, with the same keys
#              as $diffinfo (may be undefined)
#
# Returns false if either argument is undefined, otherwise the result
# of comparing the two 'to_file' values as strings.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        return !!0 unless defined $diffinfo;
        return !!0 unless defined $patchinfo;

        return $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4689
4690
# Print the list of changed files (the "difftree") as an HTML table,
# one row per raw diff line.
#
# $difftree - arrayref of raw diff lines; every element is handed to
#             parsed_difftree_line()
# $hash     - commit whose changes are listed; used as hash_base for
#             links to post-image files
# @parents  - parent commit(s); the first one is used as hash_base for
#             links to pre-image files, and more than one parent marks
#             the table as a combined diff
#
# Reads the global $action: in 'commitdiff' view every row also gets a
# "patch" link to the anchor "patchN", with N counted from 1 in row
# order, and a combined diff gets a table header with one column per
# parent.
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');

        # the summary line is shown only for longer lists
        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1; # toggles between "dark" and "light" rows
        my $patchno = 0;   # number of the patch anchor for the current row
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent; remember whether any parent
                        # had the file and whether the result still has it
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # mode '000000' marks a side on which the file does not exist;
                # the *_mode_str values are set for regular files only
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file exists only in the parent, so links use $parent
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # post-image (to_id, to_file) belongs to $hash, not to the
                        # parent: the new name need not exist in the parent at all
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4998
# Print one chunk of a side-by-side diff.
#
# Arguments are [ $class, $line ] pairs, where $line is the text to
# print and $class is one of 'chunk_header', 'ctx', 'rem', 'add' or
# 'incomplete'.  Chunk headers are printed as they come; runs of
# context lines are printed in both the "old" and the "new" column,
# runs of removed and/or added lines as a "rem", "add" or "chg" block.
#
# Note that an 'incomplete' class is overwritten in place with the
# class of the preceding entry.
sub print_sidebyside_diff_chunk {
        my @chunk = @_;
        return unless @chunk;

        # accumulators for lines of the block being collected
        my (@ctx, @rem, @add);

        # incomplete last line might be among removed or added lines,
        # or both, or among context lines: it takes the class of the
        # line just before it
        foreach my $idx (1 .. $#chunk) {
                $chunk[$idx][0] = $chunk[$idx-1][0]
                        if $chunk[$idx][0] eq 'incomplete';
        }

        # print collected context lines, the same in both columns
        my $flush_context = sub {
                my $lines = join '', @ctx;
                print '<div class="chunk_block ctx">' .
                      '<div class="old">' . $lines . '</div>' .
                      '<div class="new">' . $lines . '</div>' .
                      '</div>';
                @ctx = ();
        };

        # print collected removed/added lines: pure removal has only
        # the "old" column, pure addition only the "new" one, and a
        # change has both
        my $flush_changes = sub {
                my $kind = !@add ? 'rem'
                         : !@rem ? 'add'
                         :         'chg';
                my $html = '<div class="chunk_block ' . $kind . '">';
                $html .= '<div class="old">' . join('', @rem) . '</div>' if @rem;
                $html .= '<div class="new">' . join('', @add) . '</div>' if @add;
                $html .= '</div>';
                print $html;
                @rem = @add = ();
        };

        # the trailing empty pair is a guardian which flushes whatever
        # is still collected when the end of chunk is reached
        foreach my $entry (@chunk, ["", ""]) {
                my ($class, $line) = @$entry;

                # chunk headers are passed through
                if ($class && $class eq 'chunk_header') {
                        print $line;
                        next;
                }

                # a block ends when the class of lines changes, or at
                # the guardian (which has empty class)
                my $ends_context = !$class || $class eq 'rem' || $class eq 'add';
                my $ends_changes = !$class || $class eq 'ctx';
                $flush_context->() if @ctx && $ends_context;
                $flush_changes->() if (@rem || @add) && $ends_changes;

                # guardian value
                last unless $line;

                # collect the line according to its class
                if ($class eq 'rem') {
                        push @rem, $line;
                } elsif ($class eq 'add') {
                        push @add, $line;
                } elsif ($class eq 'ctx') {
                        push @ctx, $line;
                }
        }
}
5087
5088sub git_patchset_body {
5089        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;
5090        my ($hash_parent) = $hash_parents[0];
5091
5092        my $is_combined = (@hash_parents > 1);
5093        my $patch_idx = 0;
5094        my $patch_number = 0;
5095        my $patch_line;
5096        my $diffinfo;
5097        my $to_name;
5098        my (%from, %to);
5099        my @chunk; # for side-by-side diff
5100
5101        print "<div class=\"patchset\">\n";
5102
5103        # skip to first patch
5104        while ($patch_line = <$fd>) {
5105                chomp $patch_line;
5106
5107                last if ($patch_line =~ m/^diff /);
5108        }
5109
5110 PATCH:
5111        while ($patch_line) {
5112
5113                # parse "git diff" header line
5114                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
5115                        # $1 is from_name, which we do not use
5116                        $to_name = unquote($2);
5117                        $to_name =~ s!^b/!!;
5118                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
5119                        # $1 is 'cc' or 'combined', which we do not use
5120                        $to_name = unquote($2);
5121                } else {
5122                        $to_name = undef;
5123                }
5124
5125                # check if current patch belong to current raw line
5126                # and parse raw git-diff line if needed
5127                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
5128                        # this is continuation of a split patch
5129                        print "<div class=\"patch cont\">\n";
5130                } else {
5131                        # advance raw git-diff output if needed
5132                        $patch_idx++ if defined $diffinfo;
5133
5134                        # read and prepare patch information
5135                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5136
5137                        # compact combined diff output can have some patches skipped
5138                        # find which patch (using pathname of result) we are at now;
5139                        if ($is_combined) {
5140                                while ($to_name ne $diffinfo->{'to_file'}) {
5141                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5142                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
5143                                              "</div>\n";  # class="patch"
5144
5145                                        $patch_idx++;
5146                                        $patch_number++;
5147
5148                                        last if $patch_idx > $#$difftree;
5149                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5150                                }
5151                        }
5152
5153                        # modifies %from, %to hashes
5154                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);
5155
5156                        # this is first patch for raw difftree line with $patch_idx index
5157                        # we index @$difftree array from 0, but number patches from 1
5158                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
5159                }
5160
5161                # git diff header
5162                #assert($patch_line =~ m/^diff /) if DEBUG;
5163                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
5164                $patch_number++;
5165                # print "git diff" header
5166                print format_git_diff_header_line($patch_line, $diffinfo,
5167                                                  \%from, \%to);
5168
5169                # print extended diff header
5170                print "<div class=\"diff extended_header\">\n";
5171        EXTENDED_HEADER:
5172                while ($patch_line = <$fd>) {
5173                        chomp $patch_line;
5174
5175                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);
5176
5177                        print format_extended_diff_header_line($patch_line, $diffinfo,
5178                                                               \%from, \%to);
5179                }
5180                print "</div>\n"; # class="diff extended_header"
5181
5182                # from-file/to-file diff header
5183                if (! $patch_line) {
5184                        print "</div>\n"; # class="patch"
5185                        last PATCH;
5186                }
5187                next PATCH if ($patch_line =~ m/^diff /);
5188                #assert($patch_line =~ m/^---/) if DEBUG;
5189
5190                my $last_patch_line = $patch_line;
5191                $patch_line = <$fd>;
5192                chomp $patch_line;
5193                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;
5194
5195                print format_diff_from_to_header($last_patch_line, $patch_line,
5196                                                 $diffinfo, \%from, \%to,
5197                                                 @hash_parents);
5198
5199                # the patch itself
5200        LINE:
5201                while ($patch_line = <$fd>) {
5202                        chomp $patch_line;
5203
5204                        next PATCH if ($patch_line =~ m/^diff /);
5205
5206                        my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
5207                        my $diff_classes = "diff";
5208                        $diff_classes .= " $class" if ($class);
5209                        $line = "<div class=\"$diff_classes\">$line</div>\n";
5210
5211                        if ($diff_style eq 'sidebyside' && !$is_combined) {
5212                                if ($class eq 'chunk_header') {
5213                                        print_sidebyside_diff_chunk(@chunk);
5214                                        @chunk = ( [ $class, $line ] );
5215                                } else {
5216                                        push @chunk, [ $class, $line ];
5217                                }
5218                        } else {
5219                                # default 'inline' style and unknown styles
5220                                print $line;
5221                        }
5222                }
5223
5224        } continue {
5225                if (@chunk) {
5226                        print_sidebyside_diff_chunk(@chunk);
5227                        @chunk = ();
5228                }
5229                print "</div>\n"; # class="patch"
5230        }
5231
5232        # for compact combined (--cc) format, with chunk and patch simplification
5233        # the patchset might be empty, but there might be unprocessed raw lines
5234        for (++$patch_idx if $patch_number > 0;
5235             $patch_idx < @$difftree;
5236             ++$patch_idx) {
5237                # read and prepare patch information
5238                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5239
5240                # generate anchor for "patch" links in difftree / whatchanged part
5241                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5242                      format_diff_cc_simplified($diffinfo, @hash_parents) .
5243                      "</div>\n";  # class="patch"
5244
5245                $patch_number++;
5246        }
5247
5248        if ($patch_number == 0) {
5249                if (@hash_parents > 1) {
5250                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
5251                } else {
5252                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
5253                }
5254        }
5255
5256        print "</div>\n"; # class="patchset"
5257}
5258
5259# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5260
# Print the project search form: a text field, an "re" (regular expression)
# checkbox, a submit button and a "List all projects" link, all wrapped in
# a <div class="projsearch">.
#
# $searchtext        - value put into the 's' text field
# $search_use_regexp - whether the 'sr' checkbox is checked
#
# Reads the globals $project_filter, $cgi and $my_uri.
sub git_project_search_form {
	my ($searchtext, $search_use_regexp) = @_;

	# suffix naming the active project filter; appended to the text field
	# title and to the "List all projects" link text
	my $limit = $project_filter ? " in '$project_filter/'" : '';

	print "<div class=\"projsearch\">\n";

	# form start plus the hidden field selecting the 'project_list' action
	my $form_head = $cgi->startform(-method => 'get', -action => $my_uri);
	$form_head   .= $cgi->hidden(-name => 'a', -value => 'project_list');
	print $form_head . "\n";

	# pass the project filter along with the search
	if (defined $project_filter) {
		print $cgi->hidden(-name => 'pf', -value => $project_filter). "\n";
	}

	my $query_field = $cgi->textfield(-name => 's', -value => $searchtext,
	                                  -title => "Search project by name and description$limit",
	                                  -size => 60);
	my $regexp_box  = $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
	                                 -checked => $search_use_regexp);
	my $submit      = $cgi->submit(-name => 'btnS', -value => 'Search');
	my $form_end    = $cgi->end_form();
	my $list_all    = $cgi->a({-href => href(project => undef, searchtext => undef,
	                                         project_filter => $project_filter)},
	                          esc_html("List all projects$limit"));

	print $query_field . "\n" .
	      "<span title=\"Extended regular expression\">" .
	      $regexp_box .
	      "</span>\n" .
	      $submit .
	      $form_end . "\n" .
	      $list_all . "<br />\n";
	print "</div>\n";
}
5288
# Tell whether a project entry still lacks any of the given fields.
#
# $project_info - hash reference describing one project
# @keys         - names of the fields to check
#
# Returns 1 if at least one of @keys does not exist in %$project_info
# (a key that exists counts as filled, whatever its value); otherwise,
# including when @keys is empty, returns empty list / undef.
sub project_info_needs_filling {
	my ($project_info, @keys) = @_;

	# same as: List::MoreUtils::any { !exists $project_info->{$_} } @keys
	my @missing = grep { !exists $project_info->{$_} } @keys;
	return 1 if @missing;
	return;
}
5302
# Fill in project list info (age, description, owner, ctags, category)
# for each project in @$projlist, either for all fields or only for the
# fields named in @wanted_keys.  A field is (re)computed only when its
# key does not yet exist in the project's hash.
#
# Projects for which git_get_last_activity() returns nothing are left out
# of the returned list.  That check happens only while filling 'age' /
# 'age_string', so invalid projects are removed if and only if those
# fields are asked for.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   ensures that 'descr_long' and 'ctags' fields are filled
# * @project_list = fill_project_list_info(\@project_list)
#   ensures that all fields are filled (and invalid projects removed)
#
# NOTE: modifies the entries of $projlist in place, but does not remove
# entries from $projlist itself
sub fill_project_list_info {
	my ($projlist, @wanted_keys) = @_;

	# $filter_set->(@keys) narrows @keys down to the fields the caller
	# asked for; with no @wanted_keys every field passes through
	my %is_wanted  = map { $_ => 1 } @wanted_keys;
	my $filter_set = @wanted_keys
		? sub { return grep { $is_wanted{$_} } @_; }
		: sub { return @_; };

	my $show_ctags = gitweb_check_feature('ctags');
	my @filled;

 PROJECT:
	foreach my $pr (@$projlist) {
		if (project_info_needs_filling($pr, $filter_set->('age', 'age_string'))) {
			my @activity = git_get_last_activity($pr->{'path'});
			# no activity info: skip this project altogether
			next PROJECT unless @activity;
			@{$pr}{'age', 'age_string'} = @activity;
		}

		if (project_info_needs_filling($pr, $filter_set->('descr', 'descr_long'))) {
			my $descr = to_utf8(git_get_project_description($pr->{'path'}) || "");
			$pr->{'descr_long'} = $descr;
			$pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
		}

		if (project_info_needs_filling($pr, $filter_set->('owner'))) {
			$pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
		}

		# ctags are filled only when the 'ctags' feature is enabled
		if ($show_ctags &&
		    project_info_needs_filling($pr, $filter_set->('ctags'))) {
			$pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
		}

		# category is filled only when grouping by category is enabled
		if ($projects_list_group_categories &&
		    project_info_needs_filling($pr, $filter_set->('category'))) {
			my $cat = git_get_project_category($pr->{'path'}) ||
			          $project_list_default_category;
			$pr->{'category'} = to_utf8($cat);
		}

		push @filled, $pr;
	}

	return @filled;
}
5363
# Return the projects of @$projlist sorted according to $order.
#
# $projlist - reference to array of project hashes
# $order    - one of 'project', 'descr', 'owner' (string comparison on the
#             'path', 'descr_long', 'owner' field respectively) or 'age'
#             (numeric comparison on the 'age' field)
#
# For any other $order the list is returned in its original order.
# @$projlist itself is not modified.
sub sort_projects_list {
	my ($projlist, $order) = @_;

	# sort order => [ project field to compare, compare numerically? ]
	my %order_info = (
		project => [ 'path',       0 ],
		descr   => [ 'descr_long', 0 ],
		owner   => [ 'owner',      0 ],
		age     => [ 'age',        1 ],
	);
	my $oi = $order_info{$order};
	return @$projlist unless defined $oi;

	my ($field, $is_numeric) = @$oi;
	my $compare = $is_numeric
		? sub { $_[0] <=> $_[1] }
		: sub { $_[0] cmp $_[1] };
	my @projects = sort { $compare->($a->{$field}, $b->{$field}) } @$projlist;

	return @projects;
}
5384
# Group the projects at indices $from..$to of @$projlist by their
# 'category' field.
#
# $from defaults to 0; $to defaults to, and is capped at, the last index
# of @$projlist.
#
# Returns a hash mapping category name to a reference to the array of
# projects in that category (in list order): the hash itself in list
# context, a reference to it otherwise.
sub build_projlist_by_category {
	my ($projlist, $from, $to) = @_;

	my $last = $#$projlist;
	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	my %categories;
	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];
		push @{ $categories{ $pr->{'category'} } }, $pr;
	}

	return \%categories unless wantarray;
	return %categories;
}
5401
# Print the 'sort by' <th> element produced by format_sort_th() for the
# given ($name, $order, $header); the header is a 'sort by $name' replay
# link unless that order is already selected.
sub print_sort_th {
	my ($name, $order, $header) = @_;
	print format_sort_th($name, $order, $header);
}
5407
# Build the <th> element for one sortable column.
#
# $name   - sort order this column stands for
# $order  - sort order currently in effect
# $header - column title; defaults to ucfirst($name) when false
#
# Returns a plain "<th>$header</th>\n" when $order equals $name, otherwise
# a <th> whose content is a link (class "header") replaying the current
# request with order=$name.  Uses the global $cgi.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header ||= ucfirst($name);

	# already sorted by this column: nothing to link to
	return "<th>$header</th>\n" if $order eq $name;

	my $replay_link = $cgi->a({-href => href(-replay=>1, order=>$name),
	                           -class => "header"}, $header);
	return "<th>" . $replay_link . "</th>\n";
}
5424
# Print one <tr> of the projects table for each project at indices
# $from..$to of @$projlist, alternating "dark" and "light" row classes
# (starting with "dark").
#
# $from defaults to 0; $to defaults to, and is capped at, the last index.
# With a true $check_forks every row starts with an extra cell that holds
# a "+" marker for projects having a 'forks' entry.
#
# Uses the globals $cgi and $search_regexp.
sub git_project_list_rows {
	my ($projlist, $from, $to, $check_forks) = @_;

	$from = 0 unless defined $from;
	$to = $#$projlist unless (defined $to && $to <= $#$projlist);

	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		if ($check_forks) {
			print "<td>";
			if ($pr->{'forks'}) {
				my $nforks = scalar @{$pr->{'forks'}};
				# "+" links to the forks view only if there is something to show
				my $marker = $nforks > 0
					? $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
					           -title => "$nforks forks"}, "+")
					: $cgi->span({-title => "$nforks forks"}, "+");
				print $marker;
			}
			print "</td>\n";
		}

		# project name and description both link to the summary page;
		# search matches are highlighted in them
		my $name_link =
			$cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
			         -class => "list"},
			        esc_html_match_hl($pr->{'path'}, $search_regexp));
		my $descr_link =
			$cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
			         -class => "list",
			         -title => $pr->{'descr_long'}},
			        $search_regexp
			        ? esc_html_match_hl_chopped($pr->{'descr_long'},
			                                    $pr->{'descr'}, $search_regexp)
			        : esc_html($pr->{'descr'}));
		my $owner = chop_and_escape_str($pr->{'owner'}, 15);
		print "<td>" . $name_link . "</td>\n" .
		      "<td>" . $descr_link . "</td>\n" .
		      "<td><i>" . $owner . "</i></td>\n";

		my $age_css  = age_class($pr->{'age'});
		my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";

		# per-project action links; "forks" only for projects that have forks
		my @actions = ("summary", "shortlog", "log", "tree");
		push @actions, "forks" if $pr->{'forks'};
		my @links;
		foreach my $action (@actions) {
			push @links, scalar $cgi->a({-href => href(project=>$pr->{'path'}, action=>$action)}, $action);
		}

		print "<td class=\"" . $age_css . "\">" . $age_text . "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
}
5480
# Print the projects table (optionally preceded by the tag cloud).
#
# $projlist  - reference to array of project hashes
# $order     - sort order; defaults to $default_projects_order
# $from, $to - window of (filtered and sorted) projects to show; $from
#              defaults to 0, $to defaults to / is capped at the last index
# $extra     - if defined, HTML put into an extra row at the table bottom
# $no_header - if true, the row of sortable column headers is omitted
#
# The list is filtered (forks, ctag, search) and filled with project info
# before being displayed.  Prints a "No such projects found" notice and
# returns early when the window is empty.
sub git_project_list_body {
	# actually uses global variable $project
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
	my @projects = @$projlist;

	my $check_forks = gitweb_check_feature('forks');
	my $show_ctags  = gitweb_check_feature('ctags');
	my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
	# forks are not folded away while filtering by tag or searching
	$check_forks = undef
		if ($tagfilter || $search_regexp);

	# filtering out forks before filling info allows to do less work
	@projects = filter_forks_from_projects_list(\@projects)
		if ($check_forks);
	# search_projects_list pre-fills required info
	@projects = search_projects_list(\@projects,
	                                 'search_regexp' => $search_regexp,
	                                 'tagfilter'  => $tagfilter)
		if ($tagfilter || $search_regexp);
	# fill the rest
	@projects = fill_project_list_info(\@projects);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects if (!defined $to || $#projects < $to);

	# short circuit
	if ($from > $to) {
		print "<center>\n".
		      "<b>No such projects found</b><br />\n".
		      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
		      "</center>\n<br />\n";
		return;
	}

	@projects = sort_projects_list(\@projects, $order);

	if ($show_ctags) {
		my $ctags = git_gather_all_ctags(\@projects);
		my $cloud = git_populate_project_tagcloud($ctags);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	unless ($no_header) {
		print "<tr>\n";
		if ($check_forks) {
			print "<th></th>\n";
		}
		print_sort_th('project', $order, 'Project');
		print_sort_th('descr', $order, 'Description');
		print_sort_th('owner', $order, 'Owner');
		print_sort_th('age', $order, 'Last Change');
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}

	if ($projects_list_group_categories) {
		# only display categories with projects in the $from-$to window
		@projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
		# @projects now holds just that window, re-indexed from 0, so
		# group all of it: applying $from/$to a second time would drop
		# projects whenever $from > 0
		my %categories = build_projlist_by_category(\@projects);
		foreach my $cat (sort keys %categories) {
			# projects with empty category get no category header row
			unless ($cat eq "") {
				print "<tr>\n";
				if ($check_forks) {
					print "<td></td>\n";
				}
				print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
				print "</tr>\n";
			}

			git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
		}
	} else {
		git_project_list_rows(\@projects, $from, $to, $check_forks);
	}

	if (defined $extra) {
		print "<tr>\n";
		if ($check_forks) {
			print "<td></td>\n";
		}
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5568
# Print the 'log' view body: for each commit at indices $from..$to of
# @$commitlist a header line, the navigation links, the authorship and the
# full commit message.
#
# $commitlist - reference to array of commit hashes (empty ones are skipped)
# $from, $to  - window to show; $from defaults to 0, $to defaults to / is
#               capped at the last index
# $refs       - passed to format_ref_marker() to get ref markers
# $extra      - if true, HTML printed in a "page_nav" div after the log
sub git_log_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# start at $from (not 0), like the other *_body subroutines
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
5607
# Print the 'shortlog' table: one row per commit at indices $from..$to of
# @$commitlist with date, author, subject and navigation links, rows
# alternating between "dark" and "light" (starting with "dark").
#
# $from defaults to 0; $to defaults to / is capped at the last index.
# $refs is passed to format_ref_marker(); a defined $extra is printed as
# HTML in a final row spanning all four columns.
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} unless (defined $to && $to <= $#{$commitlist});

	print "<table class=\"shortlog\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
		my $author_cell = format_author_html('td', \%co, 10);
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		# navigation links, followed by snapshot links when there are any
		my @links = (
			scalar $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
			scalar $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
			scalar $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree"),
		);
		my $snapshot_links = format_snapshot_links($commit);
		push @links, $snapshot_links if defined $snapshot_links;

		print "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5651
# Print the 'history' table for $file_name: one row per commit at indices
# $from..$to of @$commitlist (empty entries are skipped), rows alternating
# between "dark" and "light" (starting with "dark").
#
# $from defaults to 0; $to defaults to / is capped at the last index.
# $refs is passed to format_ref_marker().  $ftype names the action used
# for the per-commit view link; when it is 'blob' and the blob at that
# commit differs from $file_hash, a "diff to current" link is added.
# A defined $extra is printed as HTML in a final row.
#
# Uses the globals $cgi and $hash_base.
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	print "<table class=\"history\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;
		my $commit = $co{'id'};

		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# shortlog uses format_author_html('td', \%co, 10) instead
		my $author_cell = format_author_html('td', \%co, 15, 3);
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my @links = (
			scalar $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype),
			scalar $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
		);

		if ($ftype eq 'blob') {
			my $blob_current = $file_hash;
			my $blob_parent  = git_get_hash_by_path($commit, $file_name);
			# offer a diff only if both blobs are known and they differ
			my $differs = defined $blob_current && defined $blob_parent &&
			              $blob_current ne $blob_parent;
			if ($differs) {
				push @links,
					scalar $cgi->a({-href => href(action=>"blobdiff",
					                              hash=>$blob_current, hash_parent=>$blob_parent,
					                              hash_base=>$hash_base, hash_parent_base=>$commit,
					                              file_name=>$file_name)},
					               "diff to current");
			}
		}

		print "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5711
# Print the 'tags' table: one row per entry at indices $from..$to of
# @$taglist with age, name, subject, a "tag" self link (for entries of
# type "tag") and links depending on the type of the referenced object.
# Rows alternate between "dark" and "light" (starting with "dark").
#
# $from defaults to 0; $to defaults to / is capped at the last index.
# A defined $extra is printed as HTML in a final row spanning 5 columns.
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$taglist} unless (defined $to && $to <= $#{$taglist});

	print "<table class=\"tags\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my $entry = $taglist->[$idx];
		my %tag = %$entry;
		my $comment = $tag{'subject'};
		my $comment_short;
		$comment_short = chop_str($comment, 30, 5) if defined $comment;

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# age cell stays empty when the age is not known
		my $age_cell = defined $tag{'age'}
			? "<td><i>$tag{'age'}</i></td>\n"
			: "<td></td>\n";
		print $age_cell;

		my $name_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
		                         -class => "list name"}, esc_html($tag{'name'}));
		print "<td>" . $name_link . "</td>\n" .
		      "<td>";
		if (defined $comment) {
			print format_subject_html($comment, $comment_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}

		# only tag objects get a link to the 'tag' view
		my $selflink = $tag{'type'} eq "tag"
			? $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag")
			: "&nbsp;";
		print "</td>\n" .
		      "<td class=\"selflink\">" . $selflink;

		# link to the referenced object, plus views depending on its type
		my @links = (
			scalar $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'}),
		);
		if ($tag{'reftype'} eq "commit") {
			push @links,
				scalar $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog"),
				scalar $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
		} elsif ($tag{'reftype'} eq "blob") {
			push @links,
				scalar $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		print "</td>\n" .
		      "<td class=\"link\">" . " | " . join(" | ", @links) .
		      "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5774
# Print the 'heads' table: one row per entry at indices $from..$to of
# @$headlist with age, name and shortlog / log / tree links.  Rows
# alternate between "dark" and "light" (starting with "dark").
#
# $head_at - if defined, the head whose 'id' equals it gets its name cell
#            marked with class "current_head"
# $from defaults to 0; $to defaults to / is capped at the last index.
# A defined $extra is printed as HTML in a final row spanning 3 columns.
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head_at, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$headlist} unless (defined $to && $to <= $#{$headlist});

	print "<table class=\"heads\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my $entry = $headlist->[$idx];
		my %ref = %$entry;
		my $curr = defined $head_at && $ref{'id'} eq $head_at;

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		my $name_td   = $curr ? "<td class=\"current_head\">" : "<td>";
		my $name_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
		                         -class => "list name"},esc_html($ref{'name'}));
		my @links = (
			scalar $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog"),
			scalar $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log"),
			scalar $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree"),
		);

		print "<td><i>$ref{'age'}</i></td>\n" .
		      $name_td . $name_link . "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5812
# Display a single remote block: a table with the remote's URL(s)
# followed by the list of its heads.
#
# $remote - name of the remote (used for the "..." link)
# $rdata  - hash reference with 'heads', 'fetch' and 'push' entries
# $limit  - if defined, the last head index passed to git_heads_body();
#           when it is smaller than the number of heads a "..." link to
#           the 'remotes' view of this remote is added
# $head   - passed to git_heads_body() as the current head
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# compare only when there is a push URL, so that a remote with
		# just a fetch URL does not trigger an "uninitialized" warning
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
5846
# Display a list of remote names with the respective fetch and push URLs
#
#   $remotedata - hashref mapping a remote name to a hashref whose
#                 'fetch' and 'push' entries (if defined) are used as links
#   $limit      - when true and smaller than the number of remotes, only
#                 the first $limit names (in sorted order) are shown,
#                 followed by a "..." link to the 'remotes' action
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        # truncate the list to the first $limit entries
        $#remotes = $limit - 1 if $limited;

        # iterate with foreach rather than "while (shift)": a remote whose
        # name is false in Perl (e.g. "0") must not end the listing early
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # plain text instead of a link when the URL is not known
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
5890
# Show the remotes of a project.  With more remotes than $limit only
# their names are listed (git_remotes_list); otherwise every remote gets
# its own section with its heads (git_remote_block).
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;

        # too many remotes: fall back to the compact list of names
        if ($limit and $limit < keys %$remotedata) {
                return git_remotes_list($remotedata, $limit);
        }

        fill_remote_heads($remotedata);
        while (my ($name, $info) = each %$remotedata) {
                my $print_block = sub {
                        git_remote_block($name, $info, $limit, $head);
                };
                git_print_section({-class=>"remote", -id=>$name},
                        ["remotes", $name, $name], $print_block);
        }
}
5907
# Search commit messages, authors or committers (depending on
# $searchtype) for $searchtext and print one page of results.
# Takes a parsed commit as a flat hash; its 'tree' and 'title' entries
# are used for the page navigation and header.
sub git_search_message {
        my %co = @_;

        # git-log limiting option for each supported search type
        my %grep_option = (
                'commit'    => "--grep=",
                'author'    => "--author=",
                'committer' => "--committer=",
        );
        my $greptype = $grep_option{$searchtype};
        $greptype .= $searchtext;

        # ask for 101 commits: 100 to display plus one to detect a next page
        my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $match_mode);

        # navigation entries, joined with a dot separator below
        my @nav;
        if ($page > 0) {
                my $first = $cgi->a({-href => href(-replay=>1, page=>undef)},
                                    "first");
                my $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                     -accesskey => "p", -title => "Alt-p"}, "prev");
                push @nav, $first, $prev;
        } else {
                push @nav, "first", "prev";
        }

        my $next_link = '';
        if (@commitlist > 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
                push @nav, $next_link;
        } else {
                push @nav, "next";
        }
        my $paging_nav = join(" &sdot; ", @nav);

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);
        if (@commitlist || $page != 0) {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        } else {
                print "<p>No match.</p>\n";
        }

        git_footer_html();
}
5957
# Search with git-log's -S option for $searchtext and print, for each
# commit found, a row with the commit info and links to the listed blobs.
# Takes a parsed commit as a flat hash; its 'tree' and 'title' entries
# are used for the page navigation and header.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        my @pickaxe_opts = ("-S$searchtext");
        push @pickaxe_opts, '--pickaxe-regex' if $search_use_regexp;
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', @pickaxe_opts
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $alternate = 1;
        # from here on %co holds the commit whose row is currently open
        undef %co;

        # close the cell with file links and add the links column
        # for the commit currently stored in %co
        my $finish_row = sub {
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # a new commit starts: finish the previous one first
                        $finish_row->() if %co;

                        my $row_class = $alternate ? "dark" : "light";
                        print "<tr class=\"$row_class\">\n";
                        $alternate ^= 1;

                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                      -class => "list subject"},
                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
                } elsif (defined $set{'to_id'}) {
                        # skip entries whose resulting blob id is all zeros
                        next if ($set{'to_id'} =~ m/^0{40}$/);

                        my $blob_href = href(action=>"blob", hash_base=>$co{'id'},
                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'});
                        print $cgi->a({-href => $blob_href, -class => "list"},
                                      "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                              "<br/>\n";
                }
        }
        close $fd;

        # finish last commit
        $finish_row->() if %co;

        print "</table>\n";

        git_footer_html();
}
6040
# Search file contents in the tree of a commit with git-grep and print
# the matching lines grouped by file, one table row per file.
# Takes a parsed commit as a flat hash; its 'tree', 'id' and 'title'
# entries are used.  Processing stops after roughly 1000 output lines.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $lastfile = '';
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                last if ($matches++ > 1000);
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        # with -z the fields are separated by NUL characters
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                }
                # file names are prefixed with "<tree>:"; strip that for
                # binary matches too, so that the blob link stays valid
                $file =~ s/^\Q$co{'tree'}\E://;

                if ($file ne $lastfile) {
                        # compare against '' so a file named "0" is handled too
                        print "</td></tr>\n" if $lastfile ne '';
                        # toggle the flag so that rows really alternate
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # highlight the matched part of the line, if found
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile ne '') {
                print "</td></tr>\n";
                if ($matches > 1000) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
6118
# Print the table of commits found by a commit message search.
#
#   $commitlist - arrayref of parsed commits (hashrefs)
#   $from, $to  - index range to print; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $extra      - optional HTML put into an additional last row
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        my $last_idx = $#{$commitlist};
        $from = 0 if !defined $from;
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"commit_search\">\n";
        my $alternate = 1;
        foreach my $i ($from .. $to) {
                my %co = %{$commitlist->[$i]};
                next unless %co;

                my $row_class = $alternate ? "dark" : "light";
                print "<tr class=\"$row_class\">\n";
                $alternate ^= 1;

                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                # show every comment line that matches, with shortened context
                foreach my $line (@{$co{'comment'}}) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        $match = chop_str($match, 70, 5, 'center');
                        # split what is left of 80 columns between both
                        # sides, at most 30 characters each
                        my $half = int((80 - length($match))/2);
                        my $contextlen = $half > 30 ? 30 : $half;
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        print esc_html($lead) .
                              "<span class=\"match\">" . esc_html($match) . "</span>" .
                              esc_html($trail) . "<br />";
                }

                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree") .
                      "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
6178
6179## ======================================================================
6180## ======================================================================
6181## actions
6182
# Action: print the list of projects, preceded by the optional
# $home_text include and the project search form.
# Fails with 400 on an unknown 'order' parameter and with 404 when no
# projects are found.
sub git_project_list {
        my $order = $input_params{'order'};
        # the pattern is anchored so that only the exact known names are
        # accepted, not any string that merely contains one of them
        if (defined $order && $order !~ m/^(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }

        git_project_search_form($searchtext, $search_use_regexp);
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6205
# Action: print the list of forks of the current project.
# Fails with 400 on an unknown 'order' parameter and with 404 when no
# forks are found.
sub git_forks {
        my $order = $input_params{'order'};
        # the pattern is anchored so that only the exact known names are
        # accepted, not any string that merely contains one of them
        if (defined $order && $order !~ m/^(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        # the project name without a trailing ".git" is used as the filter
        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6225
# Action: print a plain text index of projects, one "<path> <owner>"
# line per project, with both fields percent-encoded.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                # look the owner up only if the list did not provide it
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                my @fields = ($pr->{'path'}, $pr->{'owner'});
                foreach my $field (@fields) {
                        # quote as in CGI::Util::encode, but keep the slash,
                        # and use '+' for ' '
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$fields[0] $fields[1]\n";
        }
}
6252
# Action: print the summary page of a project: the metadata table
# (description, owner, last change, URLs, content tags), the optional
# README.html, and short lists of recent commits, tags, heads, remotes
# and forks.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # The lists are requested with 16 entries, one more than gets
        # displayed, which lets us see whether there are more of them
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata;
        %remotedata = git_get_remotes_list() if $remote_heads;

        my @forklist;
        my $check_forks = gitweb_check_feature('forks');
        if ($check_forks) {
                # find forks of a project
                (my $filter = $project) =~ s/\.git$//;
                @forklist = git_get_projects_list($filter);
                # filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        # metadata table
        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n";
        print "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
        print "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        if (!@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        # only the first printed URL row carries the "URL" label
        my $url_tag = "URL";
        foreach my $git_url (grep { $_ } @url_list) {
                print format_repo_url($url_tag, $git_url);
                $url_tag = "";
        }

        # Tag cloud
        if (gitweb_check_feature('ctags')) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme) {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file($readme);
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                my $more = @commitlist > 16
                        ? $cgi->a({-href => href(action=>"shortlog")}, "...")
                        : undef;
                git_shortlog_body(\@commitlist, 0, 15, $refs, $more);
        }

        if (@taglist) {
                git_print_header_div('tags');
                my $more = @taglist > 16
                        ? $cgi->a({-href => href(action=>"tags")}, "...")
                        : undef;
                git_tags_body(\@taglist, 0, 15, $more);
        }

        if (@headlist) {
                git_print_header_div('heads');
                my $more = @headlist > 16
                        ? $cgi->a({-href => href(action=>"heads")}, "...")
                        : undef;
                git_heads_body(\@headlist, $head, 0, 15, $more);
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                my $more = @forklist > 16
                        ? $cgi->a({-href => href(action=>"forks")}, "...")
                        : undef;
                git_project_list_body(\@forklist, 'age', 0, 15, $more,
                                      'no_header');
        }

        git_footer_html();
}
6368
# Action: print the page for the tag object $hash: a header table
# linking to the tagged object, the authorship rows (when the tag has
# an author) and the tag message.
# Fails with 404 when the tag cannot be parsed.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both links in the header row lead to the tagged object
        my $object_link = $cgi->a({-class => "list",
                                   -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                                  $tag{'object'});
        my $type_link = $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                                $tag{'type'});
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $object_link . "</td>\n" .
              "<td class=\"link\">" . $type_link . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n";

        # tag message, one escaped line per row
        print "<div class=\"page_body\">";
        foreach my $line (@{$tag{'comment'}}) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6403
6404sub git_blame_common {
6405        my $format = shift || 'porcelain';
6406        if ($format eq 'porcelain' && $input_params{'javascript'}) {
6407                $format = 'incremental';
6408                $action = 'blame_incremental'; # for page title etc
6409        }
6410
6411        # permissions
6412        gitweb_check_feature('blame')
6413                or die_error(403, "Blame view not allowed");
6414
6415        # error checking
6416        die_error(400, "No file name given") unless $file_name;
6417        $hash_base ||= git_get_head_hash($project);
6418        die_error(404, "Couldn't find base commit") unless $hash_base;
6419        my %co = parse_commit($hash_base)
6420                or die_error(404, "Commit not found");
6421        my $ftype = "blob";
6422        if (!defined $hash) {
6423                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
6424                        or die_error(404, "Error looking up file");
6425        } else {
6426                $ftype = git_get_type($hash);
6427                if ($ftype !~ "blob") {
6428                        die_error(400, "Object is not a blob");
6429                }
6430        }
6431
6432        my $fd;
6433        if ($format eq 'incremental') {
6434                # get file contents (as base)
6435                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
6436                        or die_error(500, "Open git-cat-file failed");
6437        } elsif ($format eq 'data') {
6438                # run git-blame --incremental
6439                open $fd, "-|", git_cmd(), "blame", "--incremental",
6440                        $hash_base, "--", $file_name
6441                        or die_error(500, "Open git-blame --incremental failed");
6442        } else {
6443                # run git-blame --porcelain
6444                open $fd, "-|", git_cmd(), "blame", '-p',
6445                        $hash_base, '--', $file_name
6446                        or die_error(500, "Open git-blame --porcelain failed");
6447        }
6448
6449        # incremental blame data returns early
6450        if ($format eq 'data') {
6451                print $cgi->header(
6452                        -type=>"text/plain", -charset => "utf-8",
6453                        -status=> "200 OK");
6454                local $| = 1; # output autoflush
6455                while (my $line = <$fd>) {
6456                        print to_utf8($line);
6457                }
6458                close $fd
6459                        or print "ERROR $!\n";
6460
6461                print 'END';
6462                if (defined $t0 && gitweb_check_feature('timed')) {
6463                        print ' '.
6464                              tv_interval($t0, [ gettimeofday() ]).
6465                              ' '.$number_of_git_cmds;
6466                }
6467                print "\n";
6468
6469                return;
6470        }
6471
6472        # page header
6473        git_header_html();
6474        my $formats_nav =
6475                $cgi->a({-href => href(action=>"blob", -replay=>1)},
6476                        "blob") .
6477                " | ";
6478        if ($format eq 'incremental') {
6479                $formats_nav .=
6480                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
6481                                "blame") . " (non-incremental)";
6482        } else {
6483                $formats_nav .=
6484                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
6485                                "blame") . " (incremental)";
6486        }
6487        $formats_nav .=
6488                " | " .
6489                $cgi->a({-href => href(action=>"history", -replay=>1)},
6490                        "history") .
6491                " | " .
6492                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
6493                        "HEAD");
6494        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
6495        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
6496        git_print_page_path($file_name, $ftype, $hash_base);
6497
6498        # page body
6499        if ($format eq 'incremental') {
6500                print "<noscript>\n<div class=\"error\"><center><b>\n".
6501                      "This page requires JavaScript to run.\n Use ".
6502                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
6503                              'this page').
6504                      " instead.\n".
6505                      "</b></center></div>\n</noscript>\n";
6506
6507                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
6508        }
6509
6510        print qq!<div class="page_body">\n!;
6511        print qq!<div id="progress_info">... / ...</div>\n!
6512                if ($format eq 'incremental');
6513        print qq!<table id="blame_table" class="blame" width="100%">\n!.
6514              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
6515              qq!<thead>\n!.
6516              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
6517              qq!</thead>\n!.
6518              qq!<tbody>\n!;
6519
6520        my @rev_color = qw(light dark);
6521        my $num_colors = scalar(@rev_color);
6522        my $current_color = 0;
6523
6524        if ($format eq 'incremental') {
6525                my $color_class = $rev_color[$current_color];
6526
6527                #contents of a file
6528                my $linenr = 0;
6529        LINE:
6530                while (my $line = <$fd>) {
6531                        chomp $line;
6532                        $linenr++;
6533
6534                        print qq!<tr id="l$linenr" class="$color_class">!.
6535                              qq!<td class="sha1"><a href=""> </a></td>!.
6536                              qq!<td class="linenr">!.
6537                              qq!<a class="linenr" href="">$linenr</a></td>!;
6538                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
6539                        print qq!</tr>\n!;
6540                }
6541
6542        } else { # porcelain, i.e. ordinary blame
6543                my %metainfo = (); # saves information about commits
6544
6545                # blame data
6546        LINE:
6547                while (my $line = <$fd>) {
6548                        chomp $line;
6549                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
6550                        # no <lines in group> for subsequent lines in group of lines
6551                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
6552                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
6553                        if (!exists $metainfo{$full_rev}) {
6554                                $metainfo{$full_rev} = { 'nprevious' => 0 };
6555                        }
6556                        my $meta = $metainfo{$full_rev};
6557                        my $data;
6558                        while ($data = <$fd>) {
6559                                chomp $data;
6560                                last if ($data =~ s/^\t//); # contents of line
6561                                if ($data =~ /^(\S+)(?: (.*))?$/) {
6562                                        $meta->{$1} = $2 unless exists $meta->{$1};
6563                                }
6564                                if ($data =~ /^previous /) {
6565                                        $meta->{'nprevious'}++;
6566                                }
6567                        }
6568                        my $short_rev = substr($full_rev, 0, 8);
6569                        my $author = $meta->{'author'};
6570                        my %date =
6571                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
6572                        my $date = $date{'iso-tz'};
6573                        if ($group_size) {
6574                                $current_color = ($current_color + 1) % $num_colors;
6575                        }
6576                        my $tr_class = $rev_color[$current_color];
6577                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
6578                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
6579                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
6580                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
6581                        if ($group_size) {
6582                                print "<td class=\"sha1\"";
6583                                print " title=\"". esc_html($author) . ", $date\"";
6584                                print " rowspan=\"$group_size\"" if ($group_size > 1);
6585                                print ">";
6586                                print $cgi->a({-href => href(action=>"commit",
6587                                                             hash=>$full_rev,
6588                                                             file_name=>$file_name)},
6589                                              esc_html($short_rev));
6590                                if ($group_size >= 2) {
6591                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
6592                                        if (@author_initials) {
6593                                                print "<br />" .
6594                                                      esc_html(join('', @author_initials));
6595                                                #           or join('.', ...)
6596                                        }
6597                                }
6598                                print "</td>\n";
6599                        }
6600                        # 'previous' <sha1 of parent commit> <filename at commit>
6601                        if (exists $meta->{'previous'} &&
6602                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
6603                                $meta->{'parent'} = $1;
6604                                $meta->{'file_parent'} = unquote($2);
6605                        }
6606                        my $linenr_commit =
6607                                exists($meta->{'parent'}) ?
6608                                $meta->{'parent'} : $full_rev;
6609                        my $linenr_filename =
6610                                exists($meta->{'file_parent'}) ?
6611                                $meta->{'file_parent'} : unquote($meta->{'filename'});
6612                        my $blamed = href(action => 'blame',
6613                                          file_name => $linenr_filename,
6614                                          hash_base => $linenr_commit);
6615                        print "<td class=\"linenr\">";
6616                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
6617                                        -class => "linenr" },
6618                                      esc_html($lineno));
6619                        print "</td>";
6620                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
6621                        print "</tr>\n";
6622                } # end while
6623
6624        }
6625
6626        # footer
6627        print "</tbody>\n".
6628              "</table>\n"; # class="blame"
6629        print "</div>\n";   # class="blame_body"
6630        close $fd
6631                or print "Reading blob failed\n";
6632
6633        git_footer_html();
6634}
6635
# Handler for the plain blame view: delegates to git_blame_common()
# without a format argument.
sub git_blame {
        return git_blame_common();
}
6639
# Handler for the incremental blame view: delegates to git_blame_common()
# with the 'incremental' format.
sub git_blame_incremental {
        my $format = 'incremental';
        return git_blame_common($format);
}
6643
# Handler for the blame data view: delegates to git_blame_common()
# with the 'data' format.
sub git_blame_data {
        my $format = 'data';
        return git_blame_common($format);
}
6647
# Render the 'tags' page for the current $project: page header, navigation
# bar, summary header, the tags table (only when there are tags), footer.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
        git_print_header_div('summary', $project);

        # skip the table altogether when the repository has no tags
        my @tagslist = git_get_tags_list();
        git_tags_body(\@tagslist) if @tagslist;

        git_footer_html();
}
6660
# Render the 'heads' page for the current $project: page header, navigation
# bar, summary header, the heads table (only when there are heads), footer.
# The HEAD hash is handed to git_heads_body() together with the list.
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
        git_print_header_div('summary', $project);

        # skip the table altogether when the repository has no heads
        my @headslist = git_get_heads_list();
        git_heads_body(\@headslist, $head) if @headslist;

        git_footer_html();
}
6673
# Used both for the single remote view and for the list of all the remotes.
#
# The remote to show is taken from the 'hash' input parameter; when that
# parameter is not defined, all remotes are listed.  Dies with
#   403 if the 'remote_heads' feature is disabled,
#   500 if git_get_remotes_list() returns undef,
#   404 if the returned remote data is empty.
sub git_remotes {
        gitweb_check_feature('remote_heads')
                or die_error(403, "Remote heads view is disabled");

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};
        # Decide "single remote vs. all remotes" once, and by definedness
        # everywhere, so that a remote whose name is false in boolean context
        # (e.g. "0") is still treated as a single-remote request in the nav.
        my $single_remote = defined $remote;

        my $remotedata = git_get_remotes_list($remote);
        die_error(500, "Unable to get remote information") unless defined $remotedata;

        unless (%$remotedata) {
                die_error(404, $single_remote ?
                        "Remote $remote not found" :
                        "No remotes found");
        }

        git_header_html(undef, undef, -action_extra => $remote);
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($single_remote ? '' : 'remotes'));

        fill_remote_heads($remotedata);
        if ($single_remote) {
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        } else {
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        }

        git_footer_html();
}
6706
# Send the raw contents of a blob to the client.
#
# Parameters:
#   $type - optional content type; it is passed through blob_contenttype(),
#           whose result is the type actually used.
#
# The blob is identified by the global $hash, or looked up from $file_name
# (relative to $hash_base, or the project's HEAD) when $hash is not defined.
# Dies with 400 when neither is available, 404 when the path cannot be
# resolved, and 500 when git-cat-file cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name ends up inside a quoted-string in the Content-Disposition
        # header, so '"' and '\' have to be backslash-escaped (same treatment
        # as the snapshot file name in git_snapshot).
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* (and textual */*+xml) as text/plain;
        # the subtype before "+xml" may be any run of letters, e.g. "svg"
        # or "xhtml" -- not just a single letter
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                # $1 comes from whichever of the two matches above succeeded
                # and holds the parameters (e.g. charset) following the type
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6768
# Show a blob as an HTML page: images are embedded with an <img> tag that
# points at the blob_plain view, everything else is printed line by line
# with line-number anchors (optionally through the syntax highlighter).
#
# The blob is identified by the global $hash, or looked up from $file_name
# (relative to $hash_base, or the project's HEAD) when $hash is not defined.
# Content whose mimetype is neither text/* nor one of gif/png/jpeg, and
# which tests as binary, is handed over to git_blob_plain() instead.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: print a bare navigation bar and use
                # the object id as the title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                print qq! src="! .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        } else {
                # The link back to this page is the same for every line, so
                # build (and escape) it once instead of once per line.
                my $self_link = esc_attr(href(-replay => 1));
                my $nr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, $self_link, $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
6861
# Show the contents of a tree as an HTML table.
#
# The tree is identified by the global $hash; when that is not defined it is
# looked up from $file_name relative to $hash_base, or $hash_base itself is
# used.  $hash_base defaults to "HEAD".  Dies with 404 when no tree can be
# determined or git-ls-tree reports failure on close, and with 500 when
# git-ls-tree cannot be started.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # ls-tree -z separates entries with NUL bytes
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base does not name a commit we can parse: forget it, so
                # that the code below does not build links relative to it
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        # rows alternate between the "dark" and "light" classes, dark first
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                # strip the last path component to get the parent directory
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                # An empty result means the parent is the top-level tree, which
                # is linked to without a file name.  Test for emptiness rather
                # than truth so that a parent directory named "0" is kept.
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
6971
# Build the base name used for a snapshot of $hash in $project.
#
# Parameters:
#   $project - project path, e.g. "path/to/project.git"
#   $hash    - hex object name (possibly abbreviated) or ref name
#
# Returns "<project>-<version>"; in list context the same string is returned
# twice (git_snapshot uses the pair as archive name and archive prefix).
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s,([^/])/*\.git$,$1,;
        $name = basename($name);
        # sanitize name
        $name =~ s/[[:cntrl:]]/?/g;

        my $ver = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                my $full_hash = git_get_full_hash($project, $hash);
                # Guard against an undefined result (presumably returned when
                # the object cannot be resolved -- the helper is defined
                # elsewhere) so that the match does not warn about an
                # uninitialized value; $ver then simply stays as given.
                if (defined $full_hash &&
                    $full_hash =~ /^$hash/ && length($hash) > 7) {
                        $ver = git_get_short_hash($project, $hash);
                }
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $ver = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!) {
                        $ver = $1;
                }
                $ver .= '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $ver =~ s!/!.!g;

        # name = project-version_string
        $name = "$name-$ver";

        return wantarray ? ($name, $name) : $name;
}
7008
# Send a snapshot (archive) of the tree-ish $hash to the client.
#
# The format comes from the 'snapshot_format' input parameter and defaults
# to the first entry of @snapshot_fmts.  Dies with
#   403 if snapshots are not allowed, or the format is disabled/unsupported,
#   400 if the format parameter is malformed or unknown, or the object is
#       a blob,
#   404 if the object does not exist,
#   500 if the git-archive command cannot be started.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # the name goes into a quoted-string: escape '"' and '\'
        $filename =~ s/(["\\])/\\$1/g;

        # Start the archiver before any header is sent, so that a failure to
        # start it can still be reported as a proper 500 error page instead
        # of being appended to a "200 OK" archive response.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        {
                # Copy the archive through in fixed-size records rather than
                # reading all of it into memory first.
                local $/ = \65536;
                while (my $chunk = <$fd>) {
                        print $chunk;
                }
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7056
# Common implementation of the log-like views.
#
# Parameters:
#   $fmt_name  - view name, passed to format_paging_nav() and
#                git_print_page_nav()
#   $body_subr - code ref that prints the body; it is called with
#                (\@commitlist, 0, 99, $refs, $next_link,
#                 $file_name, $file_hash, $ftype)
#   $base      - revision to start from (defaults to the project's HEAD hash)
#   $parent    - optional; when defined the range "$parent..$base" is listed
#   $file_name - optional path to limit the history to
#   $file_hash - optional object id of that path; when missing it is looked
#                up in the listed commits
#
# One page shows 100 commits; 101 are requested so that the presence of a
# following page can be detected.  The global $page is set to 0 when
# undefined.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0 unless defined $page;
        my $refs = git_get_references();

        my $commit_hash = defined $parent ? "$parent..$base" : $base;
        my @path_limit = defined $file_name ? ($file_name, "--full-history") : ();
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page), @path_limit);

        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }

        my $ftype;
        $ftype = git_get_type($file_hash) if defined $file_hash;
        die_error(500, "Unknown type of object")
                if (defined $file_name && !defined $ftype);

        # the base commit is only needed for the header of a path-limited view
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }

        # a 101st commit means there is at least one more page
        my $has_next_page = $#commitlist >= 100;
        my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
        my $next_link = $has_next_page
                ? $cgi->a({-href => href(-replay=>1, page=>$page+1),
                           -accesskey => "n", -title => "Alt-n"}, "next")
                : '';

        # offer the "patches" link only for views not limited to a path, and
        # only while the number of listed commits is within the configured
        # limit (a negative limit means no limit)
        my $patch_max = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name &&
            ($patch_max < 0 || @commitlist <= $patch_max)) {
                $paging_nav .= " &sdot; " .
                        $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                "patches");
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
                git_print_page_path($file_name, $ftype, $hash_base);
        } else {
                git_print_header_div('summary', $project);
        }

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
7130
# Handler for the 'log' view: git_log_generic() with git_log_body as the
# body printer, using the global $hash as base and $hash_parent as parent.
sub git_log {
        my $body_printer = \&git_log_body;
        return git_log_generic('log', $body_printer, $hash, $hash_parent);
}
7135
# Show a single commit: navigation, header table (authorship, commit id,
# tree, parents), the commit message and the list of changed files.
#
# The commit is taken from the global $hash, falling back to $hash_base and
# then "HEAD".  Dies with 404 when the commit cannot be parsed or when
# git-diff-tree reports failure on close, and with 500 when git-diff-tree
# cannot be started.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # The navigation text depends on the number of parents: none (root
        # commit), exactly one, or several (merge).
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                my $parent_link =
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$parent)},
                                esc_html(substr($parent, 0, 7)));
                $formats_nav = '(parent: ' . $parent_link . ')';
        } else {
                # merge commit
                my @parent_links;
                foreach my $par (@$parents) {
                        push @parent_links,
                                $cgi->a({-href => href(action=>"commit",
                                                       hash=>$par)},
                                        esc_html(substr($par, 0, 7)));
                }
                $formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # What to diff against: the parent, "--root" for a commit without
        # parents, or "-c" for a merge.
        my $diff_against = defined $parent ? $parent : "--root";
        $diff_against = '-c' unless @$parents <= 1;

        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                $diff_against,
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires;
        $expires = "+1d" if ($hash =~ m/^[0-9a-fA-F]{40}$/);

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        # the title links to the commitdiff when there is a parent to diff
        # against, and to the tree otherwise
        my $title = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        print qq!<div class="title_text">\n! .
              qq!<table class="object_header">\n!;
        git_print_authorship_rows(\%co);
        print qq!<tr><td>commit</td><td class="sha1">$co{'id'}</td></tr>\n!;

        # tree row: the object id and a "tree" link, both to the same URL
        my $tree_url = href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
        print qq!<tr><td>tree</td><td class="sha1">! .
              $cgi->a({-href => $tree_url, class => "list"}, $co{'tree'}) .
              qq!</td><td class="link">! .
              $cgi->a({-href => $tree_url}, "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links if defined $snapshot_links;
        print "</td></tr>\n";

        # one row per parent, with links to the parent commit and to the diff
        # between that parent and this commit
        foreach my $par (@$parents) {
                my $commit_url = href(action=>"commit", hash=>$par);
                my $diff_url = href(action=>"commitdiff", hash=>$hash, hash_parent=>$par);
                print qq!<tr><td>parent</td><td class="sha1">! .
                      $cgi->a({-href => $commit_url, class => "list"}, $par) .
                      qq!</td><td class="link">! .
                      $cgi->a({-href => $commit_url}, "commit") .
                      " | " .
                      $cgi->a({-href => $diff_url}, "diff") .
                      "</td></tr>\n";
        }
        print "</table></div>\n";

        print qq!<div class="page_body">\n!;
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7249
# Work out the type of the requested object and redirect (302) to the view
# for that type.
#
# The object is defined by:
# - hash or hash_base alone
# - hash_base and file_name
# Dies with 400 when neither combination is available, 404 when the object,
# the base object or the path does not exist, and 500 when git-ls-tree
# cannot be started.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # no output at all (e.g. the command failed) leaves $type
                # undefined; do not chomp it, the checks below report it
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");
                # never redirect to an undefined action
                defined $type
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7296
# Show the diff of a single file (blob) between two commits.
#
# The optional first argument selects the output format: 'html' (default)
# prints a full page, 'plain' prints a text/plain patch; anything else is
# rejected with a 400 error.
#
# The blob pair is located from the global request parameters
# $hash_base and $hash_parent_base, together with either $file_name
# (optionally $file_parent) or the blob id in $hash.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                # (\Q..\E: match $hash literally, never as a pattern)
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request did not specify from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        # %diffinfo is empty here only when the new-style branch above was
        # not taken; the status is passed as a bare number like every other
        # die_error() call in this file.
        if (!%diffinfo) {
                die_error(404, "Missing one of the blob diff parameters")
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # rewrite the patch header (everything up to and including the
                # '+++' line) so that blob ids used as names become file names
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged, in one go
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7431
# 'blobdiff_plain' action: the blob diff rendered in the 'plain' format
sub git_blobdiff_plain {
        return git_blobdiff('plain');
}
7435
# Builds the diff style switcher ("inline" / "side by side") for the
# navigation bar.  The currently selected style is shown as plain text,
# the other one as a link replaying the current request with a different
# diff_style.  Returns an empty string for combined diffs.
#
# The result is meant to be appended to already existing navigation,
# hence it reads "| foo | bar" rather than just "foo | bar".
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;

        if ($is_combined) {
                return "";
        }
        $diff_style = 'inline' unless $diff_style;

        # [ diff_style value, label shown to the user ], in display order
        my @choices = (
                [ 'inline',     'inline' ],
                [ 'sidebyside', 'side by side' ],
        );

        my $nav = '';
        foreach my $choice (@choices) {
                my ($style, $label) = @$choice;
                my $entry = $label;
                if ($style ne $diff_style) {
                        $entry = $cgi->a({-href => href(-replay=>1, diff_style => $style)}, $label);
                }
                $nav .= " | " . $entry;
        }
        return $nav;
}
7456
# Show the changes introduced by a commit, or between two commits.
#
# Named parameters:
#   -format => 'html' (default), 'plain' or 'patch'; any other value is
#              rejected with a 400 error
#   -single => only consulted for the 'patch' format when no hash_parent
#              is set: if true, output is limited to a single patch
#
# The commits to diff come from the global request parameters $hash,
# $hash_base and $hash_parent; $hash falls back to $hash_base, then "HEAD".
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is a parent at all
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                # consume only the raw part here; the patch part stays in $fd
                # for git_patchset_body() below
                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                if ($hash_parent) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                # mail-like preamble in front of the diff
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # for plain and combined diffs show all parents of the commit,
                # otherwise just the explicitly requested one
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # headers are already sent, so a failure can only be reported
                # in the body
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7684
# 'commitdiff_plain' action: the commit diff rendered in the 'plain' format
sub git_commitdiff_plain {
        return git_commitdiff(-format => 'plain');
}
7688
# format-patch-style patches

# the commit diff in 'patch' format, with the -single flag set
sub git_patch {
        return git_commitdiff(-format => 'patch', -single => 1);
}
7693
# the commit diff in 'patch' format, without the -single flag
sub git_patches {
        return git_commitdiff(-format => 'patch');
}
7697
# 'history' action: generic log view using git_history_body as body
# printer, driven by $hash_base, $hash_parent_base, $file_name and $hash
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
}
7703
# 'search' action: validates the request, then hands over to the search
# routine matching $searchtype (which defaults to 'commit').
sub git_search {
        $searchtype = 'commit' unless $searchtype;

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');

        # Search types that need an additional feature of the same name.
        # pickaxe may take all resources of your box and run for several minutes
        # with every query - so decide by yourself how public you make this feature;
        # grep search might be potentially CPU-intensive, too
        my %disabled_message = (
                'pickaxe' => "Pickaxe search is disabled",
                'grep'    => "Grep search is disabled",
        );
        if (exists $disabled_message{$searchtype}) {
                die_error(403, $disabled_message{$searchtype})
                        unless gitweb_check_feature($searchtype);
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        # search from the head commit unless told otherwise
        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0 unless defined $page;

        # search type => routine doing the actual work
        my %search_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );
        my $do_search = $search_for{$searchtype}
                or die_error(400, "Unknown search type");
        $do_search->(%co);
}
7748
# 'search_help' action: prints a page describing the available search
# types; the 'grep' and 'pickaxe' entries appear only when the feature
# of the same name is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general introduction and the always available 'commit' search
        print <<'HELP_INTRO';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        if (gitweb_check_feature('grep')) {
                print <<'HELP_GREP';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        print <<'HELP_PEOPLE';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        if (gitweb_check_feature('pickaxe')) {
                print <<'HELP_PICKAXE';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7792
# 'shortlog' action: generic log view using git_shortlog_body as body
# printer, driven by $hash and $hash_parent
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
7797
7798## ......................................................................
7799## feeds (RSS, Atom; OPML)
7800
7801sub git_feed {
7802        my $format = shift || 'atom';
7803        my $have_blame = gitweb_check_feature('blame');
7804
7805        # Atom: http://www.atomenabled.org/developers/syndication/
7806        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
7807        if ($format ne 'rss' && $format ne 'atom') {
7808                die_error(400, "Unknown web feed format");
7809        }
7810
7811        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
7812        my $head = $hash || 'HEAD';
7813        my @commitlist = parse_commits($head, 150, 0, $file_name);
7814
7815        my %latest_commit;
7816        my %latest_date;
7817        my $content_type = "application/$format+xml";
7818        if (defined $cgi->http('HTTP_ACCEPT') &&
7819                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
7820                # browser (feed reader) prefers text/xml
7821                $content_type = 'text/xml';
7822        }
7823        if (defined($commitlist[0])) {
7824                %latest_commit = %{$commitlist[0]};
7825                my $latest_epoch = $latest_commit{'committer_epoch'};
7826                %latest_date   = parse_date($latest_epoch, $latest_commit{'comitter_tz'});
7827                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
7828                if (defined $if_modified) {
7829                        my $since;
7830                        if (eval { require HTTP::Date; 1; }) {
7831                                $since = HTTP::Date::str2time($if_modified);
7832                        } elsif (eval { require Time::ParseDate; 1; }) {
7833                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
7834                        }
7835                        if (defined $since && $latest_epoch <= $since) {
7836                                print $cgi->header(
7837                                        -type => $content_type,
7838                                        -charset => 'utf-8',
7839                                        -last_modified => $latest_date{'rfc2822'},
7840                                        -status => '304 Not Modified');
7841                                return;
7842                        }
7843                }
7844                print $cgi->header(
7845                        -type => $content_type,
7846                        -charset => 'utf-8',
7847                        -last_modified => $latest_date{'rfc2822'});
7848        } else {
7849                print $cgi->header(
7850                        -type => $content_type,
7851                        -charset => 'utf-8');
7852        }
7853
7854        # Optimization: skip generating the body if client asks only
7855        # for Last-Modified date.
7856        return if ($cgi->request_method() eq 'HEAD');
7857
7858        # header variables
7859        my $title = "$site_name - $project/$action";
7860        my $feed_type = 'log';
7861        if (defined $hash) {
7862                $title .= " - '$hash'";
7863                $feed_type = 'branch log';
7864                if (defined $file_name) {
7865                        $title .= " :: $file_name";
7866                        $feed_type = 'history';
7867                }
7868        } elsif (defined $file_name) {
7869                $title .= " - $file_name";
7870                $feed_type = 'history';
7871        }
7872        $title .= " $feed_type";
7873        my $descr = git_get_project_description($project);
7874        if (defined $descr) {
7875                $descr = esc_html($descr);
7876        } else {
7877                $descr = "$project " .
7878                         ($format eq 'rss' ? 'RSS' : 'Atom') .
7879                         " feed";
7880        }
7881        my $owner = git_get_project_owner($project);
7882        $owner = esc_html($owner);
7883
7884        #header
7885        my $alt_url;
7886        if (defined $file_name) {
7887                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
7888        } elsif (defined $hash) {
7889                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
7890        } else {
7891                $alt_url = href(-full=>1, action=>"summary");
7892        }
7893        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
7894        if ($format eq 'rss') {
7895                print <<XML;
7896<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
7897<channel>
7898XML
7899                print "<title>$title</title>\n" .
7900                      "<link>$alt_url</link>\n" .
7901                      "<description>$descr</description>\n" .
7902                      "<language>en</language>\n" .
7903                      # project owner is responsible for 'editorial' content
7904                      "<managingEditor>$owner</managingEditor>\n";
7905                if (defined $logo || defined $favicon) {
7906                        # prefer the logo to the favicon, since RSS
7907                        # doesn't allow both
7908                        my $img = esc_url($logo || $favicon);
7909                        print "<image>\n" .
7910                              "<url>$img</url>\n" .
7911                              "<title>$title</title>\n" .
7912                              "<link>$alt_url</link>\n" .
7913                              "</image>\n";
7914                }
7915                if (%latest_date) {
7916                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
7917                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
7918                }
7919                print "<generator>gitweb v.$version/$git_version</generator>\n";
7920        } elsif ($format eq 'atom') {
7921                print <<XML;
7922<feed xmlns="http://www.w3.org/2005/Atom">
7923XML
7924                print "<title>$title</title>\n" .
7925                      "<subtitle>$descr</subtitle>\n" .
7926                      '<link rel="alternate" type="text/html" href="' .
7927                      $alt_url . '" />' . "\n" .
7928                      '<link rel="self" type="' . $content_type . '" href="' .
7929                      $cgi->self_url() . '" />' . "\n" .
7930                      "<id>" . href(-full=>1) . "</id>\n" .
7931                      # use project owner for feed author
7932                      "<author><name>$owner</name></author>\n";
7933                if (defined $favicon) {
7934                        print "<icon>" . esc_url($favicon) . "</icon>\n";
7935                }
7936                if (defined $logo) {
7937                        # not twice as wide as tall: 72 x 27 pixels
7938                        print "<logo>" . esc_url($logo) . "</logo>\n";
7939                }
7940                if (! %latest_date) {
7941                        # dummy date to keep the feed valid until commits trickle in:
7942                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
7943                } else {
7944                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
7945                }
7946                print "<generator version='$version/$git_version'>gitweb</generator>\n";
7947        }
7948
7949        # contents
7950        for (my $i = 0; $i <= $#commitlist; $i++) {
7951                my %co = %{$commitlist[$i]};
7952                my $commit = $co{'id'};
7953                # we read 150, we always show 30 and the ones more recent than 48 hours
7954                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
7955                        last;
7956                }
7957                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});
7958
7959                # get list of changed files
7960                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7961                        $co{'parent'} || "--root",
7962                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
7963                        or next;
7964                my @difftree = map { chomp; $_ } <$fd>;
7965                close $fd
7966                        or next;
7967
7968                # print element (entry, item)
7969                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
7970                if ($format eq 'rss') {
7971                        print "<item>\n" .
7972                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
7973                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
7974                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
7975                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
7976                              "<link>$co_url</link>\n" .
7977                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
7978                              "<content:encoded>" .
7979                              "<![CDATA[\n";
7980                } elsif ($format eq 'atom') {
7981                        print "<entry>\n" .
7982                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
7983                              "<updated>$cd{'iso-8601'}</updated>\n" .
7984                              "<author>\n" .
7985                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
7986                        if ($co{'author_email'}) {
7987                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
7988                        }
7989                        print "</author>\n" .
7990                              # use committer for contributor
7991                              "<contributor>\n" .
7992                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
7993                        if ($co{'committer_email'}) {
7994                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
7995                        }
7996                        print "</contributor>\n" .
7997                              "<published>$cd{'iso-8601'}</published>\n" .
7998                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
7999                              "<id>$co_url</id>\n" .
8000                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
8001                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
8002                }
8003                my $comment = $co{'comment'};
8004                print "<pre>\n";
8005                foreach my $line (@$comment) {
8006                        $line = esc_html($line);
8007                        print "$line\n";
8008                }
8009                print "</pre><ul>\n";
8010                foreach my $difftree_line (@difftree) {
8011                        my %difftree = parse_difftree_raw_line($difftree_line);
8012                        next if !$difftree{'from_id'};
8013
8014                        my $file = $difftree{'file'} || $difftree{'to_file'};
8015
8016                        print "<li>" .
8017                              "[" .
8018                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
8019                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
8020                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
8021                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
8022                                      -title => "diff"}, 'D');
8023                        if ($have_blame) {
8024                                print $cgi->a({-href => href(-full=>1, action=>"blame",
8025                                                             file_name=>$file, hash_base=>$commit),
8026                                              -title => "blame"}, 'B');
8027                        }
8028                        # if this is not a feed of a file history
8029                        if (!defined $file_name || $file_name ne $file) {
8030                                print $cgi->a({-href => href(-full=>1, action=>"history",
8031                                                             file_name=>$file, hash=>$commit),
8032                                              -title => "history"}, 'H');
8033                        }
8034                        $file = esc_path($file);
8035                        print "] ".
8036                              "$file</li>\n";
8037                }
8038                if ($format eq 'rss') {
8039                        print "</ul>]]>\n" .
8040                              "</content:encoded>\n" .
8041                              "</item>\n";
8042                } elsif ($format eq 'atom') {
8043                        print "</ul>\n</div>\n" .
8044                              "</content>\n" .
8045                              "</entry>\n";
8046                }
8047        }
8048
8049        # end of feed
8050        if ($format eq 'rss') {
8051                print "</channel>\n</rss>\n";
8052        } elsif ($format eq 'atom') {
8053                print "</feed>\n";
8054        }
8055}
8056
# Emit the feed in RSS format; all the work is delegated to git_feed().
sub git_rss {
        return git_feed('rss');
}
8060
# Emit the feed in Atom format; all the work is delegated to git_feed().
sub git_atom {
        return git_feed('atom');
}
8064
# Print an OPML document with one <outline> per project, each pointing at
# the project's RSS feed (xmlUrl) and its summary page (htmlUrl).
#
# Takes no arguments.  Reads the globals $project_filter, $strict_export,
# $site_name, $projectroot and $cgi; prints the HTTP header followed by the
# OPML body.  Calls die_error(404, ...) when git_get_projects_list() returns
# nothing.  Projects for which git_get_head_hash() or parse_commit() yields
# no result are left out of the listing.
#
# Side effect: the global $git_dir is reassigned for every project that has
# a HEAD and is not restored afterwards.
sub git_opml {
        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # the " within subdirectory ..." suffix is shown only when a
        # project filter is in effect
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my $proj_path = $pr->{'path'};

                my $head = git_get_head_hash($proj_path);
                next if !defined $head;

                # NOTE(review): $git_dir is presumably what parse_commit()
                # consults to find the repository -- confirm; it has to be
                # set before the call below either way.
                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next if !%co;

                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj_path, 'action' => 'summary', -full => 1);

                # The URLs end up inside double-quoted XML attributes, so
                # '&', '<', '>' and '"' must be turned into entities;
                # otherwise a URL containing any of them yields malformed
                # OPML (or lets the value break out of the attribute).
                $rss  = $cgi->escapeHTML($rss);
                $html = $cgi->escapeHTML($html);

                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}