90836e633c145207ee8a919908feadc47fe5e3ae
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
  23our $t0 = [ gettimeofday() ];
  24our $number_of_git_cmds = 0;
  25
  26BEGIN {
  27        CGI->compile() if $ENV{'MOD_PERL'};
  28}
  29
  30our $version = "++GIT_VERSION++";
  31
  32our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  33sub evaluate_uri {
  34        our $cgi;
  35
  36        our $my_url = $cgi->url();
  37        our $my_uri = $cgi->url(-absolute => 1);
  38
  39        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  40        # needed and used only for URLs with nonempty PATH_INFO
  41        our $base_url = $my_url;
  42
  43        # When the script is used as DirectoryIndex, the URL does not contain the name
  44        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  45        # have to do it ourselves. We make $path_info global because it's also used
  46        # later on.
  47        #
  48        # Another issue with the script being the DirectoryIndex is that the resulting
  49        # $my_url data is not the full script URL: this is good, because we want
  50        # generated links to keep implying the script name if it wasn't explicitly
  51        # indicated in the URL we're handling, but it means that $my_url cannot be used
  52        # as base URL.
  53        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  54        # to build the base URL ourselves:
  55        our $path_info = decode_utf8($ENV{"PATH_INFO"});
  56        if ($path_info) {
  57                if ($my_url =~ s,\Q$path_info\E$,, &&
  58                    $my_uri =~ s,\Q$path_info\E$,, &&
  59                    defined $ENV{'SCRIPT_NAME'}) {
  60                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  61                }
  62        }
  63
  64        # target of the home link on top of all pages
  65        our $home_link = $my_uri || "/";
  66}
  67
  68# core git executable to use
  69# this can just be "git" if your webserver has a sensible PATH
  70our $GIT = "++GIT_BINDIR++/git";
  71
  72# absolute fs-path which will be prepended to the project path
  73#our $projectroot = "/pub/scm";
  74our $projectroot = "++GITWEB_PROJECTROOT++";
  75
  76# fs traversing limit for getting project list
  77# the number is relative to the projectroot
  78our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  79
  80# string of the home link on top of all pages
  81our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  82
  83# name of your site or organization to appear in page titles
  84# replace this with something more descriptive for clearer bookmarks
  85our $site_name = "++GITWEB_SITENAME++"
  86                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  87
  88# html snippet to include in the <head> section of each page
  89our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
  90# filename of html text to include at top of each page
  91our $site_header = "++GITWEB_SITE_HEADER++";
  92# html text to include at home page
  93our $home_text = "++GITWEB_HOMETEXT++";
  94# filename of html text to include at bottom of each page
  95our $site_footer = "++GITWEB_SITE_FOOTER++";
  96
  97# URI of stylesheets
  98our @stylesheets = ("++GITWEB_CSS++");
  99# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 100our $stylesheet = undef;
 101# URI of GIT logo (72x27 size)
 102our $logo = "++GITWEB_LOGO++";
 103# URI of GIT favicon, assumed to be image/png type
 104our $favicon = "++GITWEB_FAVICON++";
 105# URI of gitweb.js (JavaScript code for gitweb)
 106our $javascript = "++GITWEB_JS++";
 107
 108# URI and label (title) of GIT logo link
 109#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 110#our $logo_label = "git documentation";
 111our $logo_url = "http://git-scm.com/";
 112our $logo_label = "git homepage";
 113
 114# source of projects list
 115our $projects_list = "++GITWEB_LIST++";
 116
 117# the width (in characters) of the projects list "Description" column
 118our $projects_list_description_width = 25;
 119
 120# group projects by category on the projects list
 121# (enabled if this variable evaluates to true)
 122our $projects_list_group_categories = 0;
 123
 124# default category if none specified
 125# (leave the empty string for no category)
 126our $project_list_default_category = "";
 127
 128# default order of projects list
 129# valid values are none, project, descr, owner, and age
 130our $default_projects_order = "project";
 131
 132# show repository only if this file exists
 133# (only effective if this variable evaluates to true)
 134our $export_ok = "++GITWEB_EXPORT_OK++";
 135
 136# show repository only if this subroutine returns true
 137# when given the path to the project, for example:
 138#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 139our $export_auth_hook = undef;
 140
 141# only allow viewing of repositories also shown on the overview page
 142our $strict_export = "++GITWEB_STRICT_EXPORT++";
 143
 144# list of git base URLs used for URL to where fetch project from,
 145# i.e. full URL is "$git_base_url/$project"
 146our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 147
 148# default blob_plain mimetype and default charset for text/plain blob
 149our $default_blob_plain_mimetype = 'text/plain';
 150our $default_text_plain_charset  = undef;
 151
 152# file to use for guessing MIME types before trying /etc/mime.types
 153# (relative to the current git repository)
 154our $mimetypes_file = undef;
 155
# assume this charset if line contains non-UTF-8 characters;
# it should be a valid encoding (see Encode::Supported(3pm) for the list)
# in which all byte sequences are valid, for example
# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
# could even be 'utf-8' for the old behavior)
 161our $fallback_encoding = 'latin1';
 162
 163# rename detection options for git-diff and git-diff-tree
 164# - default is '-M', with the cost proportional to
 165#   (number of removed files) * (number of new files).
 166# - more costly is '-C' (which implies '-M'), with the cost proportional to
 167#   (number of changed files + number of removed files) * (number of new files)
 168# - even more costly is '-C', '--find-copies-harder' with cost
 169#   (number of files in the original tree) * (number of new files)
 170# - one might want to include '-B' option, e.g. '-B', '-M'
 171our @diff_opts = ('-M'); # taken from git_commit
 172
 173# Disables features that would allow repository owners to inject script into
 174# the gitweb domain.
 175our $prevent_xss = 0;
 176
 177# Path to the highlight executable to use (must be the one from
 178# http://www.andre-simon.de due to assumptions about parameters and output).
 179# Useful if highlight is not installed on your webserver's PATH.
 180# [Default: highlight]
 181our $highlight_bin = "++HIGHLIGHT_BIN++";
 182
 183# information about snapshot formats that gitweb is capable of serving
 184our %known_snapshot_formats = (
 185        # name => {
 186        #       'display' => display name,
 187        #       'type' => mime type,
 188        #       'suffix' => filename suffix,
 189        #       'format' => --format for git-archive,
 190        #       'compressor' => [compressor command and arguments]
 191        #                       (array reference, optional)
 192        #       'disabled' => boolean (optional)}
 193        #
 194        'tgz' => {
 195                'display' => 'tar.gz',
 196                'type' => 'application/x-gzip',
 197                'suffix' => '.tar.gz',
 198                'format' => 'tar',
 199                'compressor' => ['gzip', '-n']},
 200
 201        'tbz2' => {
 202                'display' => 'tar.bz2',
 203                'type' => 'application/x-bzip2',
 204                'suffix' => '.tar.bz2',
 205                'format' => 'tar',
 206                'compressor' => ['bzip2']},
 207
 208        'txz' => {
 209                'display' => 'tar.xz',
 210                'type' => 'application/x-xz',
 211                'suffix' => '.tar.xz',
 212                'format' => 'tar',
 213                'compressor' => ['xz'],
 214                'disabled' => 1},
 215
 216        'zip' => {
 217                'display' => 'zip',
 218                'type' => 'application/x-zip',
 219                'suffix' => '.zip',
 220                'format' => 'zip'},
 221);
 222
 223# Aliases so we understand old gitweb.snapshot values in repository
 224# configuration.
 225our %known_snapshot_format_aliases = (
 226        'gzip'  => 'tgz',
 227        'bzip2' => 'tbz2',
 228        'xz'    => 'txz',
 229
 230        # backward compatibility: legacy gitweb config support
 231        'x-gzip' => undef, 'gz' => undef,
 232        'x-bzip2' => undef, 'bz2' => undef,
 233        'x-zip' => undef, '' => undef,
 234);
 235
 236# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 237# are changed, it may be appropriate to change these values too via
 238# $GITWEB_CONFIG.
 239our %avatar_size = (
 240        'default' => 16,
 241        'double'  => 32
 242);
 243
# Used to set the maximum load that we will still respond to gitweb queries.
# If server load exceeds this value then return "503 server busy" error.
# If gitweb cannot determine server load, it is taken to be 0.
# Leave it undefined (or set to 'undef') to turn off load checking.
 248our $maxload = 300;
 249
 250# configuration for 'highlight' (http://www.andre-simon.de/)
 251# match by basename
 252our %highlight_basename = (
 253        #'Program' => 'py',
 254        #'Library' => 'py',
 255        'SConstruct' => 'py', # SCons equivalent of Makefile
 256        'Makefile' => 'make',
 257);
 258# match by extension
 259our %highlight_ext = (
 260        # main extensions, defining name of syntax;
 261        # see files in /usr/share/highlight/langDefs/ directory
 262        map { $_ => $_ }
 263                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
 264        # alternate extensions, see /etc/highlight/filetypes.conf
 265        'h' => 'c',
 266        map { $_ => 'sh'  } qw(bash zsh ksh),
 267        map { $_ => 'cpp' } qw(cxx c++ cc),
 268        map { $_ => 'php' } qw(php3 php4 php5 phps),
 269        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
 270        map { $_ => 'make'} qw(mak mk),
 271        map { $_ => 'xml' } qw(xhtml html htm),
 272);
 273
 274# You define site-wide feature defaults here; override them with
 275# $GITWEB_CONFIG as necessary.
 276our %feature = (
 277        # feature => {
 278        #       'sub' => feature-sub (subroutine),
 279        #       'override' => allow-override (boolean),
 280        #       'default' => [ default options...] (array reference)}
 281        #
 282        # if feature is overridable (it means that allow-override has true value),
 283        # then feature-sub will be called with default options as parameters;
 284        # return value of feature-sub indicates if to enable specified feature
 285        #
 286        # if there is no 'sub' key (no feature-sub), then feature cannot be
 287        # overridden
 288        #
 289        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 290        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 291        # is enabled
 292
 293        # Enable the 'blame' blob view, showing the last commit that modified
 294        # each line in the file. This can be very CPU-intensive.
 295
 296        # To enable system wide have in $GITWEB_CONFIG
 297        # $feature{'blame'}{'default'} = [1];
 298        # To have project specific config enable override in $GITWEB_CONFIG
 299        # $feature{'blame'}{'override'} = 1;
 300        # and in project config gitweb.blame = 0|1;
 301        'blame' => {
 302                'sub' => sub { feature_bool('blame', @_) },
 303                'override' => 0,
 304                'default' => [0]},
 305
        # Enable the 'snapshot' link, providing a compressed archive of any
        # tree. This can potentially generate high traffic if you have a
        # large project.
 309
 310        # Value is a list of formats defined in %known_snapshot_formats that
 311        # you wish to offer.
 312        # To disable system wide have in $GITWEB_CONFIG
 313        # $feature{'snapshot'}{'default'} = [];
 314        # To have project specific config enable override in $GITWEB_CONFIG
 315        # $feature{'snapshot'}{'override'} = 1;
 316        # and in project config, a comma-separated list of formats or "none"
 317        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 318        'snapshot' => {
 319                'sub' => \&feature_snapshot,
 320                'override' => 0,
 321                'default' => ['tgz']},
 322
 323        # Enable text search, which will list the commits which match author,
 324        # committer or commit text to a given string.  Enabled by default.
 325        # Project specific override is not supported.
 326        #
 327        # Note that this controls all search features, which means that if
 328        # it is disabled, then 'grep' and 'pickaxe' search would also be
 329        # disabled.
 330        'search' => {
 331                'override' => 0,
 332                'default' => [1]},
 333
 334        # Enable grep search, which will list the files in currently selected
 335        # tree containing the given string. Enabled by default. This can be
 336        # potentially CPU-intensive, of course.
 337        # Note that you need to have 'search' feature enabled too.
 338
 339        # To enable system wide have in $GITWEB_CONFIG
 340        # $feature{'grep'}{'default'} = [1];
 341        # To have project specific config enable override in $GITWEB_CONFIG
 342        # $feature{'grep'}{'override'} = 1;
 343        # and in project config gitweb.grep = 0|1;
 344        'grep' => {
 345                'sub' => sub { feature_bool('grep', @_) },
 346                'override' => 0,
 347                'default' => [1]},
 348
 349        # Enable the pickaxe search, which will list the commits that modified
 350        # a given string in a file. This can be practical and quite faster
 351        # alternative to 'blame', but still potentially CPU-intensive.
 352        # Note that you need to have 'search' feature enabled too.
 353
 354        # To enable system wide have in $GITWEB_CONFIG
 355        # $feature{'pickaxe'}{'default'} = [1];
 356        # To have project specific config enable override in $GITWEB_CONFIG
 357        # $feature{'pickaxe'}{'override'} = 1;
 358        # and in project config gitweb.pickaxe = 0|1;
 359        'pickaxe' => {
 360                'sub' => sub { feature_bool('pickaxe', @_) },
 361                'override' => 0,
 362                'default' => [1]},
 363
        # Enable showing size of blobs in a 'tree' view, in a separate
        # column, similar to what 'ls -l' does.  This costs a bit of IO.
 366
 367        # To disable system wide have in $GITWEB_CONFIG
 368        # $feature{'show-sizes'}{'default'} = [0];
 369        # To have project specific config enable override in $GITWEB_CONFIG
 370        # $feature{'show-sizes'}{'override'} = 1;
 371        # and in project config gitweb.showsizes = 0|1;
 372        'show-sizes' => {
 373                'sub' => sub { feature_bool('showsizes', @_) },
 374                'override' => 0,
 375                'default' => [1]},
 376
 377        # Make gitweb use an alternative format of the URLs which can be
 378        # more readable and natural-looking: project name is embedded
 379        # directly in the path and the query string contains other
 380        # auxiliary information. All gitweb installations recognize
 381        # URL in either format; this configures in which formats gitweb
 382        # generates links.
 383
 384        # To enable system wide have in $GITWEB_CONFIG
 385        # $feature{'pathinfo'}{'default'} = [1];
 386        # Project specific override is not supported.
 387
 388        # Note that you will need to change the default location of CSS,
 389        # favicon, logo and possibly other files to an absolute URL. Also,
 390        # if gitweb.cgi serves as your indexfile, you will need to force
 391        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 392        'pathinfo' => {
 393                'override' => 0,
 394                'default' => [0]},
 395
 396        # Make gitweb consider projects in project root subdirectories
 397        # to be forks of existing projects. Given project $projname.git,
 398        # projects matching $projname/*.git will not be shown in the main
 399        # projects list, instead a '+' mark will be added to $projname
 400        # there and a 'forks' view will be enabled for the project, listing
 401        # all the forks. If project list is taken from a file, forks have
 402        # to be listed after the main project.
 403
 404        # To enable system wide have in $GITWEB_CONFIG
 405        # $feature{'forks'}{'default'} = [1];
 406        # Project specific override is not supported.
 407        'forks' => {
 408                'override' => 0,
 409                'default' => [0]},
 410
 411        # Insert custom links to the action bar of all project pages.
 412        # This enables you mainly to link to third-party scripts integrating
 413        # into gitweb; e.g. git-browser for graphical history representation
 414        # or custom web-based repository administration interface.
 415
 416        # The 'default' value consists of a list of triplets in the form
 417        # (label, link, position) where position is the label after which
 418        # to insert the link and link is a format string where %n expands
 419        # to the project name, %f to the project path within the filesystem,
 420        # %h to the current hash (h gitweb parameter) and %b to the current
 421        # hash base (hb gitweb parameter); %% expands to %.
 422
 423        # To enable system wide have in $GITWEB_CONFIG e.g.
 424        # $feature{'actions'}{'default'} = [('graphiclog',
 425        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 426        # Project specific override is not supported.
 427        'actions' => {
 428                'override' => 0,
 429                'default' => []},
 430
        # Allow gitweb to scan the project content tags of a project
        # repository, and display the popular Web 2.0-ish "tag cloud" near
        # the projects list.  Note that this is something COMPLETELY
        # different from the normal Git tags.
 435
 436        # gitweb by itself can show existing tags, but it does not handle
 437        # tagging itself; you need to do it externally, outside gitweb.
 438        # The format is described in git_get_project_ctags() subroutine.
 439        # You may want to install the HTML::TagCloud Perl module to get
 440        # a pretty tag cloud instead of just a list of tags.
 441
 442        # To enable system wide have in $GITWEB_CONFIG
 443        # $feature{'ctags'}{'default'} = [1];
 444        # Project specific override is not supported.
 445
 446        # In the future whether ctags editing is enabled might depend
 447        # on the value, but using 1 should always mean no editing of ctags.
 448        'ctags' => {
 449                'override' => 0,
 450                'default' => [0]},
 451
 452        # The maximum number of patches in a patchset generated in patch
 453        # view. Set this to 0 or undef to disable patch view, or to a
 454        # negative number to remove any limit.
 455
 456        # To disable system wide have in $GITWEB_CONFIG
 457        # $feature{'patches'}{'default'} = [0];
 458        # To have project specific config enable override in $GITWEB_CONFIG
 459        # $feature{'patches'}{'override'} = 1;
 460        # and in project config gitweb.patches = 0|n;
 461        # where n is the maximum number of patches allowed in a patchset.
 462        'patches' => {
 463                'sub' => \&feature_patches,
 464                'override' => 0,
 465                'default' => [16]},
 466
 467        # Avatar support. When this feature is enabled, views such as
 468        # shortlog or commit will display an avatar associated with
 469        # the email of the committer(s) and/or author(s).
 470
 471        # Currently available providers are gravatar and picon.
 472        # If an unknown provider is specified, the feature is disabled.
 473
 474        # Gravatar depends on Digest::MD5.
 475        # Picon currently relies on the indiana.edu database.
 476
 477        # To enable system wide have in $GITWEB_CONFIG
 478        # $feature{'avatar'}{'default'} = ['<provider>'];
 479        # where <provider> is either gravatar or picon.
 480        # To have project specific config enable override in $GITWEB_CONFIG
 481        # $feature{'avatar'}{'override'} = 1;
 482        # and in project config gitweb.avatar = <provider>;
 483        'avatar' => {
 484                'sub' => \&feature_avatar,
 485                'override' => 0,
 486                'default' => ['']},
 487
 488        # Enable displaying how much time and how many git commands
 489        # it took to generate and display page.  Disabled by default.
 490        # Project specific override is not supported.
 491        'timed' => {
 492                'override' => 0,
 493                'default' => [0]},
 494
 495        # Enable turning some links into links to actions which require
 496        # JavaScript to run (like 'blame_incremental').  Not enabled by
 497        # default.  Project specific override is currently not supported.
 498        'javascript-actions' => {
 499                'override' => 0,
 500                'default' => [0]},
 501
 502        # Enable and configure ability to change common timezone for dates
 503        # in gitweb output via JavaScript.  Enabled by default.
 504        # Project specific override is not supported.
 505        'javascript-timezone' => {
 506                'override' => 0,
 507                'default' => [
 508                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 509                                     # or undef to turn off this feature
 510                        'gitweb_tz', # name of cookie where to store selected timezone
 511                        'datetime',  # CSS class used to mark up dates for manipulation
 512                ]},
 513
 514        # Syntax highlighting support. This is based on Daniel Svensson's
 515        # and Sham Chukoury's work in gitweb-xmms2.git.
 516        # It requires the 'highlight' program present in $PATH,
 517        # and therefore is disabled by default.
 518
 519        # To enable system wide have in $GITWEB_CONFIG
 520        # $feature{'highlight'}{'default'} = [1];
 521
 522        'highlight' => {
 523                'sub' => sub { feature_bool('highlight', @_) },
 524                'override' => 0,
 525                'default' => [0]},
 526
 527        # Enable displaying of remote heads in the heads list
 528
 529        # To enable system wide have in $GITWEB_CONFIG
 530        # $feature{'remote_heads'}{'default'} = [1];
 531        # To have project specific config enable override in $GITWEB_CONFIG
 532        # $feature{'remote_heads'}{'override'} = 1;
 533        # and in project config gitweb.remote_heads = 0|1;
 534        'remote_heads' => {
 535                'sub' => sub { feature_bool('remote_heads', @_) },
 536                'override' => 0,
 537                'default' => [0]},
 538);
 539
 540sub gitweb_get_feature {
 541        my ($name) = @_;
 542        return unless exists $feature{$name};
 543        my ($sub, $override, @defaults) = (
 544                $feature{$name}{'sub'},
 545                $feature{$name}{'override'},
 546                @{$feature{$name}{'default'}});
 547        # project specific override is possible only if we have project
 548        our $git_dir; # global variable, declared later
 549        if (!$override || !defined $git_dir) {
 550                return @defaults;
 551        }
 552        if (!defined $sub) {
 553                warn "feature $name is not overridable";
 554                return @defaults;
 555        }
 556        return $sub->(@defaults);
 557}
 558
 559# A wrapper to check if a given feature is enabled.
 560# With this, you can say
 561#
 562#   my $bool_feat = gitweb_check_feature('bool_feat');
 563#   gitweb_check_feature('bool_feat') or somecode;
 564#
 565# instead of
 566#
 567#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 568#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 569#
 570sub gitweb_check_feature {
 571        return (gitweb_get_feature(@_))[0];
 572}
 573
 574
 575sub feature_bool {
 576        my $key = shift;
 577        my ($val) = git_get_project_config($key, '--bool');
 578
 579        if (!defined $val) {
 580                return ($_[0]);
 581        } elsif ($val eq 'true') {
 582                return (1);
 583        } elsif ($val eq 'false') {
 584                return (0);
 585        }
 586}
 587
 588sub feature_snapshot {
 589        my (@fmts) = @_;
 590
 591        my ($val) = git_get_project_config('snapshot');
 592
 593        if ($val) {
 594                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 595        }
 596
 597        return @fmts;
 598}
 599
 600sub feature_patches {
 601        my @val = (git_get_project_config('patches', '--int'));
 602
 603        if (@val) {
 604                return @val;
 605        }
 606
 607        return ($_[0]);
 608}
 609
 610sub feature_avatar {
 611        my @val = (git_get_project_config('avatar'));
 612
 613        return @val ? @val : @_;
 614}
 615
 616# checking HEAD file with -e is fragile if the repository was
 617# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 618# and then pruned.
 619sub check_head_link {
 620        my ($dir) = @_;
 621        my $headfile = "$dir/HEAD";
 622        return ((-e $headfile) ||
 623                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 624}
 625
 626sub check_export_ok {
 627        my ($dir) = @_;
 628        return (check_head_link($dir) &&
 629                (!$export_ok || -e "$dir/$export_ok") &&
 630                (!$export_auth_hook || $export_auth_hook->($dir)));
 631}
 632
 633# process alternate names for backward compatibility
 634# filter out unsupported (unknown) snapshot formats
 635sub filter_snapshot_fmts {
 636        my @fmts = @_;
 637
 638        @fmts = map {
 639                exists $known_snapshot_format_aliases{$_} ?
 640                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 641        @fmts = grep {
 642                exists $known_snapshot_formats{$_} &&
 643                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 644}
 645
# If it is set to a code reference, that code is run once per request,
# allowing updating configurations that change with each request,
# while running other code in config file only once.
#
# Otherwise, if it is false then gitweb would process config file only once;
# if it is true then gitweb config would be run for each request.
 652our $per_request_config = 1;
 653
 654# read and parse gitweb config file given by its parameter.
 655# returns true on success, false on recoverable error, allowing
 656# to chain this subroutine, using first file that exists.
 657# dies on errors during parsing config file, as it is unrecoverable.
 658sub read_config_file {
 659        my $filename = shift;
 660        return unless defined $filename;
 661        # die if there are errors parsing config file
 662        if (-e $filename) {
 663                do $filename;
 664                die $@ if $@;
 665                return 1;
 666        }
 667        return;
 668}
 669
 670our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
 671sub evaluate_gitweb_config {
 672        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 673        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 674        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
 675
 676        # Protect agains duplications of file names, to not read config twice.
 677        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
 678        # there possibility of duplication of filename there doesn't matter.
 679        $GITWEB_CONFIG = ""        if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
 680        $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
 681
 682        # Common system-wide settings for convenience.
 683        # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
 684        read_config_file($GITWEB_CONFIG_COMMON);
 685
 686        # Use first config file that exists.  This means use the per-instance
 687        # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
 688        read_config_file($GITWEB_CONFIG) and return;
 689        read_config_file($GITWEB_CONFIG_SYSTEM);
 690}
 691
 692# Get loadavg of system, to compare against $maxload.
 693# Currently it requires '/proc/loadavg' present to get loadavg;
 694# if it is not present it returns 0, which means no load checking.
 695sub get_loadavg {
 696        if( -e '/proc/loadavg' ){
 697                open my $fd, '<', '/proc/loadavg'
 698                        or return 0;
 699                my @load = split(/\s+/, scalar <$fd>);
 700                close $fd;
 701
 702                # The first three columns measure CPU and IO utilization of the last one,
 703                # five, and 10 minute periods.  The fourth column shows the number of
 704                # currently running processes and the total number of processes in the m/n
 705                # format.  The last column displays the last process ID used.
 706                return $load[0] || 0;
 707        }
 708        # additional checks for load average should go here for things that don't export
 709        # /proc/loadavg
 710
 711        return 0;
 712}
 713
 714# version of the core git binary
 715our $git_version;
 716sub evaluate_git_version {
 717        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 718        $number_of_git_cmds++;
 719}
 720
 721sub check_loadavg {
 722        if (defined $maxload && get_loadavg() > $maxload) {
 723                die_error(503, "The load average on the server is too high");
 724        }
 725}
 726
 727# ======================================================================
 728# input validation and dispatch
 729
 730# input parameters can be collected from a variety of sources (presently, CGI
 731# and PATH_INFO), so we define an %input_params hash that collects them all
 732# together during validation: this allows subsequent uses (e.g. href()) to be
 733# agnostic of the parameter origin
 734
 735our %input_params = ();
 736
 737# input parameters are stored with the long parameter name as key. This will
 738# also be used in the href subroutine to convert parameters to their CGI
 739# equivalent, and since the href() usage is the most frequent one, we store
 740# the name -> CGI key mapping here, instead of the reverse.
 741#
 742# XXX: Warning: If you touch this, check the search form for updating,
 743# too.
 744
 745our @cgi_param_mapping = (
 746        project => "p",
 747        action => "a",
 748        file_name => "f",
 749        file_parent => "fp",
 750        hash => "h",
 751        hash_parent => "hp",
 752        hash_base => "hb",
 753        hash_parent_base => "hpb",
 754        page => "pg",
 755        order => "o",
 756        searchtext => "s",
 757        searchtype => "st",
 758        snapshot_format => "sf",
 759        extra_options => "opt",
 760        search_use_regexp => "sr",
 761        ctag => "by_tag",
 762        diff_style => "ds",
 763        project_filter => "pf",
 764        # this must be last entry (for manipulation from JavaScript)
 765        javascript => "js"
 766);
 767our %cgi_param_mapping = @cgi_param_mapping;
 768
 769# we will also need to know the possible actions, for validation
 770our %actions = (
 771        "blame" => \&git_blame,
 772        "blame_incremental" => \&git_blame_incremental,
 773        "blame_data" => \&git_blame_data,
 774        "blobdiff" => \&git_blobdiff,
 775        "blobdiff_plain" => \&git_blobdiff_plain,
 776        "blob" => \&git_blob,
 777        "blob_plain" => \&git_blob_plain,
 778        "commitdiff" => \&git_commitdiff,
 779        "commitdiff_plain" => \&git_commitdiff_plain,
 780        "commit" => \&git_commit,
 781        "forks" => \&git_forks,
 782        "heads" => \&git_heads,
 783        "history" => \&git_history,
 784        "log" => \&git_log,
 785        "patch" => \&git_patch,
 786        "patches" => \&git_patches,
 787        "remotes" => \&git_remotes,
 788        "rss" => \&git_rss,
 789        "atom" => \&git_atom,
 790        "search" => \&git_search,
 791        "search_help" => \&git_search_help,
 792        "shortlog" => \&git_shortlog,
 793        "summary" => \&git_summary,
 794        "tag" => \&git_tag,
 795        "tags" => \&git_tags,
 796        "tree" => \&git_tree,
 797        "snapshot" => \&git_snapshot,
 798        "object" => \&git_object,
 799        # those below don't need $project
 800        "opml" => \&git_opml,
 801        "project_list" => \&git_project_list,
 802        "project_index" => \&git_project_index,
 803);
 804
 805# finally, we have the hash of allowed extra_options for the commands that
 806# allow them
 807our %allowed_options = (
 808        "--no-merges" => [ qw(rss atom log shortlog history) ],
 809);
 810
 811# fill %input_params with the CGI parameters. All values except for 'opt'
 812# should be single values, but opt can be an array. We should probably
 813# build an array of parameters that can be multi-valued, but since for the time
 814# being it's only this one, we just single it out
 815sub evaluate_query_params {
 816        our $cgi;
 817
 818        while (my ($name, $symbol) = each %cgi_param_mapping) {
 819                if ($symbol eq 'opt') {
 820                        $input_params{$name} = [ map { decode_utf8($_) } $cgi->param($symbol) ];
 821                } else {
 822                        $input_params{$name} = decode_utf8($cgi->param($symbol));
 823                }
 824        }
 825}
 826
 827# now read PATH_INFO and update the parameter list for missing parameters
 828sub evaluate_path_info {
 829        return if defined $input_params{'project'};
 830        return if !$path_info;
 831        $path_info =~ s,^/+,,;
 832        return if !$path_info;
 833
 834        # find which part of PATH_INFO is project
 835        my $project = $path_info;
 836        $project =~ s,/+$,,;
 837        while ($project && !check_head_link("$projectroot/$project")) {
 838                $project =~ s,/*[^/]*$,,;
 839        }
 840        return unless $project;
 841        $input_params{'project'} = $project;
 842
 843        # do not change any parameters if an action is given using the query string
 844        return if $input_params{'action'};
 845        $path_info =~ s,^\Q$project\E/*,,;
 846
 847        # next, check if we have an action
 848        my $action = $path_info;
 849        $action =~ s,/.*$,,;
 850        if (exists $actions{$action}) {
 851                $path_info =~ s,^$action/*,,;
 852                $input_params{'action'} = $action;
 853        }
 854
 855        # list of actions that want hash_base instead of hash, but can have no
 856        # pathname (f) parameter
 857        my @wants_base = (
 858                'tree',
 859                'history',
 860        );
 861
 862        # we want to catch, among others
 863        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 864        my ($parentrefname, $parentpathname, $refname, $pathname) =
 865                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 866
 867        # first, analyze the 'current' part
 868        if (defined $pathname) {
 869                # we got "branch:filename" or "branch:dir/"
 870                # we could use git_get_type(branch:pathname), but:
 871                # - it needs $git_dir
 872                # - it does a git() call
 873                # - the convention of terminating directories with a slash
 874                #   makes it superfluous
 875                # - embedding the action in the PATH_INFO would make it even
 876                #   more superfluous
 877                $pathname =~ s,^/+,,;
 878                if (!$pathname || substr($pathname, -1) eq "/") {
 879                        $input_params{'action'} ||= "tree";
 880                        $pathname =~ s,/$,,;
 881                } else {
 882                        # the default action depends on whether we had parent info
 883                        # or not
 884                        if ($parentrefname) {
 885                                $input_params{'action'} ||= "blobdiff_plain";
 886                        } else {
 887                                $input_params{'action'} ||= "blob_plain";
 888                        }
 889                }
 890                $input_params{'hash_base'} ||= $refname;
 891                $input_params{'file_name'} ||= $pathname;
 892        } elsif (defined $refname) {
 893                # we got "branch". In this case we have to choose if we have to
 894                # set hash or hash_base.
 895                #
 896                # Most of the actions without a pathname only want hash to be
 897                # set, except for the ones specified in @wants_base that want
 898                # hash_base instead. It should also be noted that hand-crafted
 899                # links having 'history' as an action and no pathname or hash
 900                # set will fail, but that happens regardless of PATH_INFO.
 901                if (defined $parentrefname) {
 902                        # if there is parent let the default be 'shortlog' action
 903                        # (for http://git.example.com/repo.git/A..B links); if there
 904                        # is no parent, dispatch will detect type of object and set
 905                        # action appropriately if required (if action is not set)
 906                        $input_params{'action'} ||= "shortlog";
 907                }
 908                if ($input_params{'action'} &&
 909                    grep { $_ eq $input_params{'action'} } @wants_base) {
 910                        $input_params{'hash_base'} ||= $refname;
 911                } else {
 912                        $input_params{'hash'} ||= $refname;
 913                }
 914        }
 915
 916        # next, handle the 'parent' part, if present
 917        if (defined $parentrefname) {
 918                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 919                # someproject/blobdiff/oldrev..newrev:/filename
 920                if ($parentpathname) {
 921                        $parentpathname =~ s,^/+,,;
 922                        $parentpathname =~ s,/$,,;
 923                        $input_params{'file_parent'} ||= $parentpathname;
 924                } else {
 925                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 926                }
 927                # we assume that hash_parent_base is wanted if a path was specified,
 928                # or if the action wants hash_base instead of hash
 929                if (defined $input_params{'file_parent'} ||
 930                        grep { $_ eq $input_params{'action'} } @wants_base) {
 931                        $input_params{'hash_parent_base'} ||= $parentrefname;
 932                } else {
 933                        $input_params{'hash_parent'} ||= $parentrefname;
 934                }
 935        }
 936
 937        # for the snapshot action, we allow URLs in the form
 938        # $project/snapshot/$hash.ext
 939        # where .ext determines the snapshot and gets removed from the
 940        # passed $refname to provide the $hash.
 941        #
 942        # To be able to tell that $refname includes the format extension, we
 943        # require the following two conditions to be satisfied:
 944        # - the hash input parameter MUST have been set from the $refname part
 945        #   of the URL (i.e. they must be equal)
 946        # - the snapshot format MUST NOT have been defined already (e.g. from
 947        #   CGI parameter sf)
 948        # It's also useless to try any matching unless $refname has a dot,
 949        # so we check for that too
 950        if (defined $input_params{'action'} &&
 951                $input_params{'action'} eq 'snapshot' &&
 952                defined $refname && index($refname, '.') != -1 &&
 953                $refname eq $input_params{'hash'} &&
 954                !defined $input_params{'snapshot_format'}) {
 955                # We loop over the known snapshot formats, checking for
 956                # extensions. Allowed extensions are both the defined suffix
 957                # (which includes the initial dot already) and the snapshot
 958                # format key itself, with a prepended dot
 959                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 960                        my $hash = $refname;
 961                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 962                                next;
 963                        }
 964                        my $sfx = $1;
 965                        # a valid suffix was found, so set the snapshot format
 966                        # and reset the hash parameter
 967                        $input_params{'snapshot_format'} = $fmt;
 968                        $input_params{'hash'} = $hash;
 969                        # we also set the format suffix to the one requested
 970                        # in the URL: this way a request for e.g. .tgz returns
 971                        # a .tgz instead of a .tar.gz
 972                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 973                        last;
 974                }
 975        }
 976}
 977
 978our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 979     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 980     $searchtext, $search_regexp, $project_filter);
 981sub evaluate_and_validate_params {
 982        our $action = $input_params{'action'};
 983        if (defined $action) {
 984                if (!validate_action($action)) {
 985                        die_error(400, "Invalid action parameter");
 986                }
 987        }
 988
 989        # parameters which are pathnames
 990        our $project = $input_params{'project'};
 991        if (defined $project) {
 992                if (!validate_project($project)) {
 993                        undef $project;
 994                        die_error(404, "No such project");
 995                }
 996        }
 997
 998        our $project_filter = $input_params{'project_filter'};
 999        if (defined $project_filter) {
1000                if (!validate_pathname($project_filter)) {
1001                        die_error(404, "Invalid project_filter parameter");
1002                }
1003        }
1004
1005        our $file_name = $input_params{'file_name'};
1006        if (defined $file_name) {
1007                if (!validate_pathname($file_name)) {
1008                        die_error(400, "Invalid file parameter");
1009                }
1010        }
1011
1012        our $file_parent = $input_params{'file_parent'};
1013        if (defined $file_parent) {
1014                if (!validate_pathname($file_parent)) {
1015                        die_error(400, "Invalid file parent parameter");
1016                }
1017        }
1018
1019        # parameters which are refnames
1020        our $hash = $input_params{'hash'};
1021        if (defined $hash) {
1022                if (!validate_refname($hash)) {
1023                        die_error(400, "Invalid hash parameter");
1024                }
1025        }
1026
1027        our $hash_parent = $input_params{'hash_parent'};
1028        if (defined $hash_parent) {
1029                if (!validate_refname($hash_parent)) {
1030                        die_error(400, "Invalid hash parent parameter");
1031                }
1032        }
1033
1034        our $hash_base = $input_params{'hash_base'};
1035        if (defined $hash_base) {
1036                if (!validate_refname($hash_base)) {
1037                        die_error(400, "Invalid hash base parameter");
1038                }
1039        }
1040
1041        our @extra_options = @{$input_params{'extra_options'}};
1042        # @extra_options is always defined, since it can only be (currently) set from
1043        # CGI, and $cgi->param() returns the empty array in array context if the param
1044        # is not set
1045        foreach my $opt (@extra_options) {
1046                if (not exists $allowed_options{$opt}) {
1047                        die_error(400, "Invalid option parameter");
1048                }
1049                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1050                        die_error(400, "Invalid option parameter for this action");
1051                }
1052        }
1053
1054        our $hash_parent_base = $input_params{'hash_parent_base'};
1055        if (defined $hash_parent_base) {
1056                if (!validate_refname($hash_parent_base)) {
1057                        die_error(400, "Invalid hash parent base parameter");
1058                }
1059        }
1060
1061        # other parameters
1062        our $page = $input_params{'page'};
1063        if (defined $page) {
1064                if ($page =~ m/[^0-9]/) {
1065                        die_error(400, "Invalid page parameter");
1066                }
1067        }
1068
1069        our $searchtype = $input_params{'searchtype'};
1070        if (defined $searchtype) {
1071                if ($searchtype =~ m/[^a-z]/) {
1072                        die_error(400, "Invalid searchtype parameter");
1073                }
1074        }
1075
1076        our $search_use_regexp = $input_params{'search_use_regexp'};
1077
1078        our $searchtext = $input_params{'searchtext'};
1079        our $search_regexp;
1080        if (defined $searchtext) {
1081                if (length($searchtext) < 2) {
1082                        die_error(403, "At least two characters are required for search parameter");
1083                }
1084                if ($search_use_regexp) {
1085                        $search_regexp = $searchtext;
1086                        if (!eval { qr/$search_regexp/; 1; }) {
1087                                (my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
1088                                die_error(400, "Invalid search regexp '$search_regexp'",
1089                                          esc_html($error));
1090                        }
1091                } else {
1092                        $search_regexp = quotemeta $searchtext;
1093                }
1094        }
1095}
1096
1097# path to the current git repository
1098our $git_dir;
1099sub evaluate_git_dir {
1100        our $git_dir = "$projectroot/$project" if $project;
1101}
1102
1103our (@snapshot_fmts, $git_avatar);
1104sub configure_gitweb_features {
1105        # list of supported snapshot formats
1106        our @snapshot_fmts = gitweb_get_feature('snapshot');
1107        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);
1108
1109        # check that the avatar feature is set to a known provider name,
1110        # and for each provider check if the dependencies are satisfied.
1111        # if the provider name is invalid or the dependencies are not met,
1112        # reset $git_avatar to the empty string.
1113        our ($git_avatar) = gitweb_get_feature('avatar');
1114        if ($git_avatar eq 'gravatar') {
1115                $git_avatar = '' unless (eval { require Digest::MD5; 1; });
1116        } elsif ($git_avatar eq 'picon') {
1117                # no dependencies
1118        } else {
1119                $git_avatar = '';
1120        }
1121}
1122
1123# custom error handler: 'die <message>' is Internal Server Error
1124sub handle_errors_html {
1125        my $msg = shift; # it is already HTML escaped
1126
1127        # to avoid infinite loop where error occurs in die_error,
1128        # change handler to default handler, disabling handle_errors_html
1129        set_message("Error occured when inside die_error:\n$msg");
1130
1131        # you cannot jump out of die_error when called as error handler;
1132        # the subroutine set via CGI::Carp::set_message is called _after_
1133        # HTTP headers are already written, so it cannot write them itself
1134        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
1135}
1136set_message(\&handle_errors_html);
1137
1138# dispatch
1139sub dispatch {
1140        if (!defined $action) {
1141                if (defined $hash) {
1142                        $action = git_get_type($hash);
1143                        $action or die_error(404, "Object does not exist");
1144                } elsif (defined $hash_base && defined $file_name) {
1145                        $action = git_get_type("$hash_base:$file_name");
1146                        $action or die_error(404, "File or directory does not exist");
1147                } elsif (defined $project) {
1148                        $action = 'summary';
1149                } else {
1150                        $action = 'project_list';
1151                }
1152        }
1153        if (!defined($actions{$action})) {
1154                die_error(400, "Unknown action");
1155        }
1156        if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
1157            !$project) {
1158                die_error(400, "Project needed");
1159        }
1160        $actions{$action}->();
1161}
1162
1163sub reset_timer {
1164        our $t0 = [ gettimeofday() ]
1165                if defined $t0;
1166        our $number_of_git_cmds = 0;
1167}
1168
1169our $first_request = 1;
1170sub run_request {
1171        reset_timer();
1172
1173        evaluate_uri();
1174        if ($first_request) {
1175                evaluate_gitweb_config();
1176                evaluate_git_version();
1177        }
1178        if ($per_request_config) {
1179                if (ref($per_request_config) eq 'CODE') {
1180                        $per_request_config->();
1181                } elsif (!$first_request) {
1182                        evaluate_gitweb_config();
1183                }
1184        }
1185        check_loadavg();
1186
1187        # $projectroot and $projects_list might be set in gitweb config file
1188        $projects_list ||= $projectroot;
1189
1190        evaluate_query_params();
1191        evaluate_path_info();
1192        evaluate_and_validate_params();
1193        evaluate_git_dir();
1194
1195        configure_gitweb_features();
1196
1197        dispatch();
1198}
1199
1200our $is_last_request = sub { 1 };
1201our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
1202our $CGI = 'CGI';
1203our $cgi;
1204sub configure_as_fcgi {
1205        require CGI::Fast;
1206        our $CGI = 'CGI::Fast';
1207
1208        my $request_number = 0;
1209        # let each child service 100 requests
1210        our $is_last_request = sub { ++$request_number > 100 };
1211}
1212sub evaluate_argv {
1213        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
1214        configure_as_fcgi()
1215                if $script_name =~ /\.fcgi$/;
1216
1217        return unless (@ARGV);
1218
1219        require Getopt::Long;
1220        Getopt::Long::GetOptions(
1221                'fastcgi|fcgi|f' => \&configure_as_fcgi,
1222                'nproc|n=i' => sub {
1223                        my ($arg, $val) = @_;
1224                        return unless eval { require FCGI::ProcManager; 1; };
1225                        my $proc_manager = FCGI::ProcManager->new({
1226                                n_processes => $val,
1227                        });
1228                        our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
1229                        our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
1230                        our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
1231                },
1232        );
1233}
1234
1235sub run {
1236        evaluate_argv();
1237
1238        $first_request = 1;
1239        $pre_listen_hook->()
1240                if $pre_listen_hook;
1241
1242 REQUEST:
1243        while ($cgi = $CGI->new()) {
1244                $pre_dispatch_hook->()
1245                        if $pre_dispatch_hook;
1246
1247                run_request();
1248
1249                $post_dispatch_hook->()
1250                        if $post_dispatch_hook;
1251                $first_request = 0;
1252
1253                last REQUEST if ($is_last_request->());
1254        }
1255
1256 DONE_GITWEB:
1257        1;
1258}
1259
1260run();
1261
1262if (defined caller) {
1263        # wrapped in a subroutine processing requests,
1264        # e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
1265        return;
1266} else {
1267        # pure CGI script, serving single request
1268        exit;
1269}
1270
1271## ======================================================================
1272## action links
1273
1274# possible values of extra options
1275# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
1276# -replay => 1      - start from a current view (replay with modifications)
1277# -path_info => 0|1 - don't use/use path_info URL (if possible)
1278# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
1279sub href {
1280        my %params = @_;
1281        # default is to use -absolute url() i.e. $my_uri
1282        my $href = $params{-full} ? $my_url : $my_uri;
1283
1284        # implicit -replay, must be first of implicit params
1285        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});
1286
1287        $params{'project'} = $project unless exists $params{'project'};
1288
1289        if ($params{-replay}) {
1290                while (my ($name, $symbol) = each %cgi_param_mapping) {
1291                        if (!exists $params{$name}) {
1292                                $params{$name} = $input_params{$name};
1293                        }
1294                }
1295        }
1296
1297        my $use_pathinfo = gitweb_check_feature('pathinfo');
1298        if (defined $params{'project'} &&
1299            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
1300                # try to put as many parameters as possible in PATH_INFO:
1301                #   - project name
1302                #   - action
1303                #   - hash_parent or hash_parent_base:/file_parent
1304                #   - hash or hash_base:/filename
1305                #   - the snapshot_format as an appropriate suffix
1306
1307                # When the script is the root DirectoryIndex for the domain,
1308                # $href here would be something like http://gitweb.example.com/
1309                # Thus, we strip any trailing / from $href, to spare us double
1310                # slashes in the final URL
1311                $href =~ s,/$,,;
1312
1313                # Then add the project name, if present
1314                $href .= "/".esc_path_info($params{'project'});
1315                delete $params{'project'};
1316
1317                # since we destructively absorb parameters, we keep this
1318                # boolean that remembers if we're handling a snapshot
1319                my $is_snapshot = $params{'action'} eq 'snapshot';
1320
1321                # Summary just uses the project path URL, any other action is
1322                # added to the URL
1323                if (defined $params{'action'}) {
1324                        $href .= "/".esc_path_info($params{'action'})
1325                                unless $params{'action'} eq 'summary';
1326                        delete $params{'action'};
1327                }
1328
1329                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
1330                # stripping nonexistent or useless pieces
1331                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
1332                        || $params{'hash_parent'} || $params{'hash'});
1333                if (defined $params{'hash_base'}) {
1334                        if (defined $params{'hash_parent_base'}) {
1335                                $href .= esc_path_info($params{'hash_parent_base'});
1336                                # skip the file_parent if it's the same as the file_name
1337                                if (defined $params{'file_parent'}) {
1338                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
1339                                                delete $params{'file_parent'};
1340                                        } elsif ($params{'file_parent'} !~ /\.\./) {
1341                                                $href .= ":/".esc_path_info($params{'file_parent'});
1342                                                delete $params{'file_parent'};
1343                                        }
1344                                }
1345                                $href .= "..";
1346                                delete $params{'hash_parent'};
1347                                delete $params{'hash_parent_base'};
1348                        } elsif (defined $params{'hash_parent'}) {
1349                                $href .= esc_path_info($params{'hash_parent'}). "..";
1350                                delete $params{'hash_parent'};
1351                        }
1352
1353                        $href .= esc_path_info($params{'hash_base'});
1354                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
1355                                $href .= ":/".esc_path_info($params{'file_name'});
1356                                delete $params{'file_name'};
1357                        }
1358                        delete $params{'hash'};
1359                        delete $params{'hash_base'};
1360                } elsif (defined $params{'hash'}) {
1361                        $href .= esc_path_info($params{'hash'});
1362                        delete $params{'hash'};
1363                }
1364
1365                # If the action was a snapshot, we can absorb the
1366                # snapshot_format parameter too
1367                if ($is_snapshot) {
1368                        my $fmt = $params{'snapshot_format'};
1369                        # snapshot_format should always be defined when href()
1370                        # is called, but just in case some code forgets, we
1371                        # fall back to the default
1372                        $fmt ||= $snapshot_fmts[0];
1373                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
1374                        delete $params{'snapshot_format'};
1375                }
1376        }
1377
1378        # now encode the parameters explicitly
1379        my @result = ();
1380        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
1381                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
1382                if (defined $params{$name}) {
1383                        if (ref($params{$name}) eq "ARRAY") {
1384                                foreach my $par (@{$params{$name}}) {
1385                                        push @result, $symbol . "=" . esc_param($par);
1386                                }
1387                        } else {
1388                                push @result, $symbol . "=" . esc_param($params{$name});
1389                        }
1390                }
1391        }
1392        $href .= "?" . join(';', @result) if scalar @result;
1393
1394        # final transformation: trailing spaces must be escaped (URI-encoded)
1395        $href =~ s/(\s+)$/CGI::escape($1)/e;
1396
1397        if ($params{-anchor}) {
1398                $href .= "#".esc_param($params{-anchor});
1399        }
1400
1401        return $href;
1402}
1403
1404
1405## ======================================================================
1406## validation, quoting/unquoting and escaping
1407
1408sub validate_action {
1409        my $input = shift || return undef;
1410        return undef unless exists $actions{$input};
1411        return $input;
1412}
1413
1414sub validate_project {
1415        my $input = shift || return undef;
1416        if (!validate_pathname($input) ||
1417                !(-d "$projectroot/$input") ||
1418                !check_export_ok("$projectroot/$input") ||
1419                ($strict_export && !project_in_list($input))) {
1420                return undef;
1421        } else {
1422                return $input;
1423        }
1424}
1425
1426sub validate_pathname {
1427        my $input = shift || return undef;
1428
1429        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
1430        # at the beginning, at the end, and between slashes.
1431        # also this catches doubled slashes
1432        if ($input =~ m!(^|/)(|\.|\.\.)(/|$)!) {
1433                return undef;
1434        }
1435        # no null characters
1436        if ($input =~ m!\0!) {
1437                return undef;
1438        }
1439        return $input;
1440}
1441
1442sub validate_refname {
1443        my $input = shift || return undef;
1444
1445        # textual hashes are O.K.
1446        if ($input =~ m/^[0-9a-fA-F]{40}$/) {
1447                return $input;
1448        }
1449        # it must be correct pathname
1450        $input = validate_pathname($input)
1451                or return undef;
1452        # restrictions on ref name according to git-check-ref-format
1453        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
1454                return undef;
1455        }
1456        return $input;
1457}
1458
# Decode a sequence of octets into Perl's internal character form.
# A string that already carries the utf8 flag, or that utf8::decode()
# manages to decode in place, is returned directly; any other string is
# decoded using $fallback_encoding.  Returns undef for undef input.
# (gitweb writes its output as utf-8 because of the
# "binmode STDOUT, ':utf8'" at the beginning of the script.)
sub to_utf8 {
        my $str = shift;
        return undef unless defined $str;

        return $str
                if (utf8::is_utf8($str) || utf8::decode($str));

        # not valid utf-8: fall back to the configured legacy encoding
        return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1472
# Quote unsafe characters in a CGI parameter value.  Runs of characters
# outside the safe set go through CGI::escape(); the slash is kept even
# though that is not strictly correct, because quoted slashes look too
# horrible in bookmarks.  Spaces become '+'.
# Returns undef for undef input.
sub esc_param {
        my $param = shift;
        defined $param
                or return undef;

        $param =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $param =~ tr/ /+/;
        return $param;
}
1482
# Quote unsafe characters in a path_info fragment; the rules differ
# slightly from those used for parameters.
# Returns undef for undef input.
sub esc_path_info {
        my $fragment = shift;
        defined $fragment
                or return undef;

        # path_info doesn't treat '+' as space (specially), so both ' ' and
        # '+' are left alone here, but '?' must be escaped
        $fragment =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

        return $fragment;
}
1493
# Quote unsafe characters in a whole URL.  Because the input is a
# complete URL, its structural characters (such as '?', '&', '=' and ';')
# cannot be quoted.  Spaces become '+'.
# Returns undef for undef input.
sub esc_url {
        my $url = shift;
        defined $url
                or return undef;

        $url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $url =~ tr/ /+/;
        return $url;
}
1502
# Quote unsafe characters for use inside an HTML attribute value.
# For XHTML conformance escaping '"' to '&quot;' is not enough, so the
# full esc_html() treatment is applied.
sub esc_attr {
        my ($str, @opts) = @_;

        return esc_html($str, @opts);
}
1509
# Escape a string for inclusion in HTML.
# The string is decoded with to_utf8() and passed through
# $cgi->escapeHTML(); with the -nbsp option every space becomes &nbsp;.
# Control characters other than tab are replaced by their quot_cec()
# representation.  Returns undef for undef input.
sub esc_html {
        my ($str, %opts) = @_;

        return undef unless defined $str;

        my $html = to_utf8($str);
        $html = $cgi->escapeHTML($html);
        $html =~ s/ /&nbsp;/g
                if $opts{'-nbsp'};

        # tab is the one control character that is passed through untouched
        $html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
        return $html;
}
1525
# Escape a file name for inclusion in HTML, quoting control characters.
# Works like esc_html(), except that every control character, tab
# included, is replaced by its quot_cec() representation.
# Returns undef for undef input.
sub esc_path {
        my ($str, %opts) = @_;

        return undef unless defined $str;

        my $html = to_utf8($str);
        $html = $cgi->escapeHTML($html);
        $html =~ s/ /&nbsp;/g
                if $opts{'-nbsp'};

        $html =~ s|([[:cntrl:]])|quot_cec($1)|eg;
        return $html;
}
1541
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0).
# The string is decoded with to_utf8(); control characters other than
# tab, line feed and carriage return are replaced by their quot_cec()
# representation.  No HTML escaping is done here.
# Returns undef for undef input.
sub sanitize {
        my $str = shift;

        return undef unless defined $str;

        my $clean = to_utf8($str);
        $clean =~ s|([[:cntrl:]])|($1 =~ /[\t\n\r]/ ? $1 : quot_cec($1))|eg;
        return $clean;
}
1552
# Make control characters "printable", using character escape codes (CEC).
#
# Parameters:
#   $cntrl   - the single control character to represent
#   -nohtml  - (option) when true, return the bare escape code instead of
#              wrapping it in <span class="cntrl">...</span>
#
# Characters with a well-known escape sequence use it ('\n', '\t', ...);
# any other character is shown as a backslash followed by its code in
# hexadecimal, zero-padded to two digits (e.g. '\01'), so that the escape
# never contains a blank.
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # '%02x' (not '%2x'): codes below 0x10 must be padded with '0', a
        # space-padded code would render as e.g. '\ 1'
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1577
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR).
#
# Parameters:
#   $cntrl   - the single control character to represent
#   -nohtml  - (option) when true, return the bare numeric character
#              reference instead of wrapping it in
#              <span class="cntrl">...</span>
#
# A control character with code N is shown as the control picture at
# U+2400 + N.  DEL (0x7f) is the exception: its picture, SYMBOL FOR
# DELETE, lives at U+2421 and not at U+247F.
sub quot_upr {
        my $cntrl = shift;
        my %opts = @_;

        my $code = ord($cntrl);
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1591
# git may return quoted and escaped filenames.
# A string enclosed in double quotes has the quotes removed and its
# backslash sequences translated; any other string is returned as is.
sub unquote {
        my $str = shift;

        # translate the text following one backslash into the character
        # it stands for
        sub unq {
                my $seq = shift;
                my %es = ( # character escape codes, aka escape sequences
                        't' => "\t",   # tab            (HT, TAB)
                        'n' => "\n",   # newline        (NL)
                        'r' => "\r",   # return         (CR)
                        'f' => "\f",   # form feed      (FF)
                        'b' => "\b",   # backspace      (BS)
                        'a' => "\a",   # alarm (bell)   (BEL)
                        'e' => "\e",   # escape         (ESC)
                        'v' => "\013", # vertical tab   (VT)
                );

                # octal char sequence
                return chr(oct($seq))
                        if $seq =~ m/^[0-7]{1,3}$/;

                # C escape sequence (aka character escape code), or else a
                # quoted ordinary character which stands for itself
                return exists $es{$seq} ? $es{$seq} : $seq;
        }

        # nothing to do unless the whole string is quoted
        return $str
                unless $str =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}
1627
# escape tabs (convert tabs to spaces), using tab stops every 8 columns
sub untabify {
        my $line = shift;

        my $pos;
        while (($pos = index($line, "\t")) != -1) {
                # the first remaining tab is replaced by as many spaces (1..8)
                # as are needed to reach the next multiple of 8
                substr($line, $pos, 1, ' ' x (8 - ($pos % 8)));
        }

        return $line;
}
1641
# Count the entries of the projects list whose 'path' equals $project.
# The result is 0 (false) when the project is not listed or the list
# is empty.
sub project_in_list {
        my $project = shift;

        my $hits = grep { $_->{'path'} eq $project } git_get_projects_list();
        return $hits;
}
1647
1648## ----------------------------------------------------------------------
1649## HTML aware string manipulation
1650
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Parameters:
#   $str     - string to shorten (decoded with to_utf8() first)
#   $len     - number of characters to keep
#   $add_len - extra word characters allowed past $len (default 10)
#   $where   - which part to chop: 'left' | 'center' | 'right' (default)
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right';

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # Return early if chopping wouldn't make the string shorter; the
        # filler is 5 characters long for 'center' and 4 otherwise.  When
        # chopping in the middle, $len is split between left and right part.
        my $in_center = ($where eq 'center');
        return $str if ($len + ($in_center ? 5 : 4) >= length($str));
        $len = int($len/2) if $in_center;

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                $str =~ m/^(.*?)($begre)$/;
                my ($lead, $body) = ($1, $2);
                # replace the leading part only if that saves anything
                $lead = " ..." if (length($lead) > 4);
                return "$lead$body";
        }

        if ($in_center) {
                $str =~ m/^($endre)(.*)$/;
                my ($left, $rest) = ($1, $2);
                $rest =~ m/^(.*?)($begre)$/;
                my ($mid, $right) = ($1, $2);
                $mid = " ... " if (length($mid) > 5);
                return "$left$mid$right";
        }

        # default: chop on the right
        $str =~ m/^($endre)(.*)$/;
        my ($body, $tail) = ($1, $2);
        $tail = "... " if (length($tail) > 4);
        return "$body$tail";
}
1710
# Takes the same arguments as chop_str.  The result is HTML-escaped and,
# when the string did get chopped, wrapped in a <span> whose title
# attribute holds the full string (control characters replaced by '?').
sub chop_and_escape_str {
        my ($full) = @_;

        my $chopped = chop_str(@_);
        $full = to_utf8($full);

        # nothing was cut off: no need for a title
        return esc_html($chopped) if ($chopped eq $full);

        $full =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$full}, esc_html($chopped));
}
1726
# Highlight selected fragments of string, using given CSS class,
# and escape HTML.  It is assumed that fragments do not overlap.
# Regions are passed as list of pairs (array references); every
# argument that is not an array reference is taken to be part of the
# options passed on to esc_html().
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
        my ($str, $css_class, @sel) = @_;

        # separate the [begin, end] pairs from the esc_html options
        my (@regions, @opt_list);
        for my $arg (@sel) {
                if (ref($arg) eq 'ARRAY') {
                        push @regions, $arg;
                } else {
                        push @opt_list, $arg;
                }
        }
        my %opts = @opt_list;
        return esc_html($str, %opts) unless @regions;

        my $out = '';
        my $pos = 0;    # end of the part of $str already written to $out

        for my $region (@regions) {
                my ($begin, $end) = @$region;

                # Don't create empty <span> elements.
                next if $end <= $begin;

                my $marked = esc_html(substr($str, $begin, $end - $begin),
                                      %opts);

                # plain text between the previous region and this one
                if ($begin - $pos > 0) {
                        $out .= esc_html(substr($str, $pos, $begin - $pos), %opts);
                }
                $out .= $cgi->span({-class => $css_class}, $marked);

                $pos = $end;
        }
        # plain text after the last region
        if ($pos < length($str)) {
                $out .= esc_html(substr($str, $pos), %opts);
        }

        return $out;
}
1762
# Return positions of beginning and end of each match of $regexp in
# $str, as a list of [ begin, end ] pairs.  Returns nothing when either
# argument is undefined.
sub matchpos_list {
        my ($str, $regexp) = @_;
        return unless defined $str;
        return unless defined $regexp;

        my @positions;
        # @- and @+ hold the offsets of the last successful match
        push @positions, [ $-[0], $+[0] ]
                while ($str =~ /$regexp/g);

        return @positions;
}
1774
# Highlight match (if any), and escape HTML.
# Every match of $regexp in $str is wrapped in a span of class 'match';
# without a regexp, or without any match, the string is only escaped.
sub esc_html_match_hl {
        my ($str, $regexp) = @_;

        my @matches = defined $regexp ? matchpos_list($str, $regexp) : ();

        return @matches
                ? esc_html_hl_regions($str, 'match', @matches)
                : esc_html($str);
}
1785
1786
# Highlight match (if any) of shortened string, and escape HTML.
# $str is the full string and $chopped its shortened form; matches are
# looked up in the full string and then mapped onto the shortened one.
# A match that lies in, or extends into, the chopped-off part is shown
# by marking the trailing "... " filler.
sub esc_html_match_hl_chopped {
        my ($str, $chopped, $regexp) = @_;
        return esc_html_match_hl($str, $regexp) unless defined $chopped;

        my @matches = matchpos_list($str, $regexp);
        return esc_html($chopped) unless @matches;

        # filter matches so that we mark chopped string
        my $filler = "... "; # see chop_str
        my $tail = ($chopped =~ s/\Q$filler\E$//) ? $filler : '';
        my $chop_len = length($chopped);
        my $tail_len = length($tail);
        my $shown_end = $chop_len + $tail_len;
        my @filtered;

        for my $m (@matches) {
                my ($m_begin, $m_end) = @$m;

                if ($m_begin > $chop_len) {
                        # match lies wholly in the removed part: mark the filler
                        push @filtered, [ $chop_len, $shown_end ] if ($tail_len > 0);
                        last;
                }
                if ($m_end > $chop_len) {
                        # match runs into the removed part: extend over the filler
                        push @filtered, [ $m_begin, $shown_end ];
                        last;
                }
                push @filtered, $m;
        }

        return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
}
1817
1818## ----------------------------------------------------------------------
1819## functions returning short strings
1820
# CSS class for given age value (in seconds):
# "noage" for an undefined age, "age0" below two hours, "age1" below
# two days and "age2" for anything older.
sub age_class {
        my $age = shift;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1835
# Convert age in seconds to "nn units ago" string.
# The largest unit of which the age exceeds two is used, and the count
# is truncated to an integer; ages of two seconds or less give
# " right now" (with the leading space).
sub age_string {
        my $age = shift;

        # [ age must exceed this, successive divisors, text after the count ]
        my @units = (
                [ 60*60*24*365*2,      [ 60, 60, 24, 365 ],    " years ago"  ],
                [ 60*60*24*(365/12)*2, [ 60, 60, 24, 365/12 ], " months ago" ],
                [ 60*60*24*7*2,        [ 60, 60, 24, 7 ],      " weeks ago"  ],
                [ 60*60*24*2,          [ 60, 60, 24 ],         " days ago"   ],
                [ 60*60*2,             [ 60, 60 ],             " hours ago"  ],
                [ 60*2,                [ 60 ],                 " min ago"    ],
                [ 2,                   [],                     " sec ago"    ],
        );

        for my $unit (@units) {
                my ($min_age, $divisors, $suffix) = @$unit;
                next unless $age > $min_age;

                # divide step by step, one divisor after the other
                my $count = $age;
                $count = $count / $_ for @$divisors;
                return int($count) . $suffix;
        }

        return " right now";
}
1867
# file type bit patterns (octal) used in addition to those from Fcntl
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1872
# submodule/subproject, a commit object reference:
# true when the file type bits of the (numeric) $mode equal S_IFGITLINK
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = $mode & S_IFMT();
        return ($type_bits == S_IFGITLINK);
}
1879
# Convert file mode in octal to symbolic file mode string.
# The argument is a string of octal digits; the result is one of a
# fixed set of ten-character strings in the style of "ls -l".
sub mode_str {
        my $mode = oct shift;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # regular file: git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1901
# Convert file mode in octal to file type string.
# An argument that is not made up solely of octal digits is returned
# unchanged; otherwise the result is one of "submodule", "directory",
# "symlink", "file" or "unknown".
sub file_type {
        my $mode = shift;

        # not an octal mode: hand it back as it is
        return $mode if ($mode !~ m/^[0-7]+$/);
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT());
        return "symlink"   if S_ISLNK($mode);
        return "file"      if S_ISREG($mode);
        return "unknown";
}
1924
# Convert file mode in octal to file type description string.
# Like file_type(), except that a regular file with the owner's
# executable bit set is described as "executable".
sub file_type_long {
        my $mode = shift;

        # not an octal mode: hand it back as it is
        return $mode if ($mode !~ m/^[0-7]+$/);
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT());
        return "symlink"   if S_ISLNK($mode);
        return "unknown"   unless S_ISREG($mode);

        return ($mode & S_IXUSR) ? "executable" : "file";
}
1951
1952
1953## ----------------------------------------------------------------------
1954## functions returning short HTML fragments, or transforming HTML fragments
1955## which don't belong to other sections
1956
# Format line of commit message: the line is HTML-escaped (spaces turned
# into &nbsp;) and every stand-alone run of 8 to 40 hexadecimal digits
# is made a link to the "object" action for that hash.
sub format_log_line_html {
        my $html = esc_html(shift, -nbsp=>1);

        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                my $sha = $1;
                $cgi->a({-href => href(action=>"object", hash=>$sha),
                         -class => "text"}, $sha);
        }eg;

        return $html;
}
1969
# Format marker of refs pointing to given object.
#
# $refs maps object ids to lists of ref names, $id is the object looked
# up.  Returns the markers wrapped in <span class="refs">, or "" when
# there is none.  A trailing "^{}" is removed from the stored ref names
# as a side effect.
#
# The destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;

        return "" unless defined $refs->{$id};

        my $markers = '';
        foreach my $ref (@{$refs->{$id}}) {
                # this code exploits the fact that non-lightweight tags are the
                # only indirect objects, and that they are the only objects for which
                # we want to use tag instead of shortlog as action
                my $indirect = ($ref =~ s/\^\{\}$//);

                # e.g. tags/v2.6.11 or heads/next
                my ($type, $name) = ($ref =~ m!^(.*?)s?/(.*)$!)
                        ? ($1, $2)
                        : ("ref", $ref);

                my $class = $indirect ? "$type indirect" : $type;

                my $dest_action = "shortlog";
                if ($indirect) {
                        $dest_action = "tag" unless $action eq "tag";
                } elsif ($action =~ /^(history|(short)?log)$/) {
                        $dest_action = $action;
                }

                # link target is the fully qualified ref name
                my $dest = ($ref =~ m!^refs/!) ? $ref : "refs/" . $ref;

                my $link = $cgi->a({
                        -href => href(
                                action=>$dest_action,
                                hash=>$dest
                        )}, $name);

                $markers .= " <span class=\"" . esc_attr($class) .
                            "\" title=\"" . esc_attr($ref) . "\">" .
                            $link . "</span>";
        }

        return $markers
                ? ' <span class="refs">'. $markers . '</span>'
                : "";
}
2029
# Format, perhaps shortened and with markers, title line.
# $long is the full subject, $short its possibly shortened form, $href
# the link target and $extra optional HTML appended after the link.
# When the short form is really shorter, it is what gets displayed and
# the full subject goes into the title attribute (control characters
# replaced by '?').
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my %attr = (-href => $href, -class => "list subject");
        my $shown = $long;

        if (length($short) < length($long)) {
                $shown = $short;
                $long =~ s/[[:cntrl:]]/?/g;
                $attr{-title} = to_utf8($long);
        }

        return $cgi->a(\%attr, esc_html($shown)) . $extra;
}
2045
# Cache of avatar URLs, keyed by (lowercased) email address.  Computing
# the URL once per email and reusing it gives a visible benefit in views
# where the avatar for the same email is used repeatedly (e.g. shortlog).
# All avatar engines share this cache and are free to use it as
# preferred; since only one avatar engine is used for any given page,
# there's no risk for cache conflicts.
our %avatar_cache = ();
2053
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The complete URL is kept in %avatar_cache under the lowercased email.
sub picon_url {
        my $email = lc shift;

        $avatar_cache{$email} ||= do {
                my ($user, $domain) = split('@', $email);
                "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                "$domain/$user/" .
                "users+domains+unknown/up/single";
        };

        return $avatar_cache{$email};
}
2067
# Compute the gravatar url for a given email, if it's not in the cache already.
# Only the part of the URL before the size is cached, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
sub gravatar_url {
        my ($email, $size) = @_;
        $email = lc $email;

        unless ($avatar_cache{$email}) {
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" .
                        Digest::MD5::md5_hex($email) . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
2080
# Build the <img> element showing the avatar for the given $email, if
# the avatar feature is enabled; returns "" otherwise.
#
# Options:
#   -size       - key into %avatar_size (falls back to 'default')
#   -pad_before - put a &nbsp; in front of the image
#   -pad_after  - put a &nbsp; after the image
sub git_get_avatar {
        my ($email, %opts) = @_;

        my $size_name = $opts{-size} || 'default';
        my $size = $avatar_size{$size_name} || $avatar_size{'default'};

        # Other providers can be added by extending the chain, defining the
        # url as needed. If no variant yields a url, we assume avatars
        # are completely disabled/unavailable.
        my $url = ($git_avatar eq 'gravatar') ? gravatar_url($email, $size)
                : ($git_avatar eq 'picon')    ? picon_url($email)
                :                               "";
        return "" unless $url;

        my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
        my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

        return $pre_white .
               qq(<img width="$size" class="avatar" src=") .
               esc_url($url) .
               qq(" alt="" />) .
               $post_white;
}
2109
# Turn $displaytext into a link that searches for commits by $author.
# $searchtype is the kind of search ('author' or 'committer').  When the
# 'search' feature is not enabled, $displaytext is returned unchanged.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;
        my $have_search = gitweb_check_feature('search');

        return $displaytext unless $have_search;

        # verb used in the link title
        my $performed = ($searchtype eq 'author')    ? "authored"
                      : ($searchtype eq 'committer') ? "committed"
                      :                                "";

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                        searchtext=>$author,
                        searchtype=>$searchtype), class=>"list",
                        title=>"Search for commits $performed by $author"},
                        $displaytext);
}
2132
# Format the author name of the given commit with the given tag.
# The author name is chopped and escaped according to the other
# optional parameters (see chop_str); it is preceded by the author's
# avatar and linked to an author search.
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name   = $co->{'author_name'};
        my $author = chop_and_escape_str($name, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $link   = format_search_author($name, "author", $avatar . $author);

        return "<$tag class=\"author\">" . $link . "</$tag>";
}
2146
# Format git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names at the end of $line are replaced by the escaped names
# from $from and $to, each made a link when the side has an 'href'.
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff: a single file name, without a/ b/ prefix
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                my $name = esc_path($to->{'file'});
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"}, $name)
                        : $name;        # file was deleted (no href)
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                my $a_name = 'a/' . esc_path($from->{'file'});
                my $b_name = 'b/' . esc_path($to->{'file'});

                $line .= $from->{'href'}
                        ? $cgi->a({-href => $from->{'href'}, -class => "path"}, $a_name)
                        : $a_name;      # file was added (no href)
                $line .= ' ';
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"}, $b_name)
                        : $b_name;      # file was deleted
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2182
# Format extended diff header line, before patch itself.
# File names after "copy/rename from/to" become links, a trailing
# six-digit mode gets its file type appended, and the object ids of an
# "index" line are shortened to 7 characters and linked.
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                 esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }

        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' . file_type_long($1) . ')</span>';
        }

        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff: one id per parent, separated
                # by commas; a side without href is shown as seven zeros
                my @parent_ids;
                for my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        if ($from->{'href'}[$i]) {
                                push @parent_ids,
                                        scalar $cgi->a({-href=>$from->{'href'}[$i],
                                                        -class=>"hash"},
                                                       substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                push @parent_ids, '0' x 7;
                        }
                }
                my $to_id = $to->{'href'}
                        ? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                  substr($diffinfo->{'to_id'},0,7))
                        : '0' x 7;

                $line = 'index ' . join(',', @parent_ids) . '..' . $to_id;

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff
                my $from_link = $from->{'href'}
                        ? $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                  substr($diffinfo->{'from_id'},0,7))
                        : '0' x 7;
                my $to_link = $to->{'href'}
                        ? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                  substr($diffinfo->{'to_id'},0,7))
                        : '0' x 7;

                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2248
# Format from-file/to-file diff header.
# Returns one <div class="diff from_file"> per "---" line (a single one
# for an ordinary diff, one per parent for a combined diff) followed by
# one <div class="diff to_file"> for the "+++" line.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my $result = '';
        my $nparents = $diffinfo->{'nparents'};

        #assert($from_line =~ m/^---/) if DEBUG;
        if (!$nparents) {
                # ordinary (single parent) diff
                my $line = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($line =~ m!^--- "?a/!) {
                        my $file = esc_path($from->{'file'});
                        $line = '--- a/' .
                                ($from->{'href'}
                                 ? $cgi->a({-href=>$from->{'href'}, -class=>"path"}, $file)
                                 : $file);
                }
                $result .= qq!<div class="diff from_file">$line</div>\n!;

        } else {
                # combined diff (merge commit): one "---" line per parent, made
                # of a numbered link to the blobdiff against that parent and a
                # link to the file in that parent
                for my $i (0 .. $nparents - 1) {
                        my $line = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                $line = '--- ' .
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1) .
                                        '/' .
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                        }
                        $result .= qq!<div class="diff from_file">$line</div>\n!;
                }
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        my $line = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($line =~ m!^\+\+\+ "?b/!) {
                my $file = esc_path($to->{'file'});
                $line = '+++ b/' .
                        ($to->{'href'}
                         ? $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $file)
                         : $file);
        }
        $result .= qq!<div class="diff to_file">$line</div>\n!;

        return $result;
}
2314
# create note for patch simplified by combined diff
#
# Returns a "diff --cc <file>" header div followed by a "Simple merge" div.
# The file name links to the blob view unless is_deleted() reports the file
# as deleted, in which case it is shown as plain (escaped) text.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $file = is_deleted($diffinfo)
		? esc_path($diffinfo->{'to_file'})
		: $cgi->a({-href => href(action=>"blob",
		                         hash_base=>$hash,
		                         hash=>$diffinfo->{'to_id'},
		                         file_name=>$diffinfo->{'to_file'}),
		           -class => "path"},
		          esc_path($diffinfo->{'to_file'}));

	return "<div class=\"diff header\">" .
	       "diff --cc " .
	       $file .
	       "</div>\n" . # class="diff header"
	       "<div class=\"diff nodifferences\">" .
	       "Simple merge" .
	       "</div>\n"; # class="diff nodifferences"
}
2339
# return CSS class name for a line of patch body: "chunk_header",
# "incomplete", "ctx", "add" or "rem"; empty string if nothing matches.
#
# For a combined diff ($from->{'href'} is an array reference) the number of
# leading sign columns equals the number of entries in that array;
# an ordinary diff has a single sign column.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
		? scalar @{$from->{'href'}}   # combined diff
		: 1;                          # ordinary diff

	return "chunk_header" if ($line =~ m/^\@\@{$num_sign} /);
	return "incomplete"   if ($line =~ m/^\\/);
	# the test for context must come before the tests for add/rem,
	# because the add/rem patterns also accept all-space sign columns
	return "ctx"          if ($line =~ m/^ {$num_sign}/);
	return "add"          if ($line =~ m/^[+ ]{$num_sign}/);
	return "rem"          if ($line =~ m/^[- ]{$num_sign}/);

	# fallback
	return "";
}
2368
# format chunk header ("@@ -from +to @@ section") of unified diff as HTML
#
# assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for unified diff.
# Each range is turned into a link to its starting line ("#l<start>")
# when the corresponding side has an 'href'.
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# the line counts (3rd and 6th capture) are not needed for the output
	my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	$from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
	                      -class=>"list"}, $from_text)
		if ($from->{'href'});
	$to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
	                      -class=>"list"}, $to_text)
		if ($to->{'href'});

	return "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
	       "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2392
# format chunk header ("@@@ -from1 -from2 +to @@@ section") of combined
# diff as HTML
#
# assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for combined diff.
# The last range belongs to the result ("to") side, all preceding ones to
# the parents; each range links to its starting line when an href exists.
sub format_cc_diff_chunk_header {
	my ($line, $from, $to) = @_;

	my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

	my @range_text  = split(' ', $ranges);
	# start line of each range: text between the sign and the optional ",count"
	my @range_start = map {
		my ($start) = (split(',', substr($_, 1)), 0);
		$start;
	} @range_text;

	# the final range describes the "to" side
	my $to_text  = pop @range_text;
	my $to_start = pop @range_start;

	my $html = "<span class=\"chunk_info\">$prefix ";
	foreach my $n (0 .. $#range_text) {
		my $range = $range_text[$n];
		$range = $cgi->a({-href=>"$from->{'href'}[$n]#l$range_start[$n]",
		                  -class=>"list"}, $range)
			if ($from->{'href'}[$n]);
		$html .= "$range ";
	}

	$to_text = $cgi->a({-href=>"$to->{'href'}#l$to_start",
	                    -class=>"list"}, $to_text)
		if ($to->{'href'});
	$html .= $to_text;

	$html .= " $prefix</span>" .
	         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
	return $html;
}
2431
# process patch (diff) line (not to be used for diff headers),
# returning class and HTML-formatted (but not wrapped) line
#
# Chunk headers get dedicated formatting, but only when both $from and $to
# are given; every other line is untabified and HTML-escaped.
sub process_diff_line {
	my ($line, $from, $to) = @_;

	# classify the raw line, before it is chomped and untabified
	my $diff_class = diff_line_class($line, $from, $to);

	chomp $line;
	$line = untabify($line);

	my $format_header =
		!($from && $to)     ? undef :
		$line =~ m/^\@{2} / ? \&format_unidiff_chunk_header :
		$line =~ m/^\@{3}/  ? \&format_cc_diff_chunk_header :
		                      undef;
	if ($format_header) {
		my $html = $format_header->($line, $from, $to);
		return $diff_class, $html;
	}

	return $diff_class, esc_html($line, -nbsp=>1);
}
2454
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# The set of links is taken from @snapshot_fmts.
sub format_snapshot_links {
	my ($hash) = @_;

	# no snapshot formats: nothing to link to
	return undef unless @snapshot_fmts;

	if (@snapshot_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		# i.e. "_snapshot_"
		my ($fmt) = @snapshot_fmts;
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
			}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	# e.g. "snapshot (_tar.gz_ _zip_)"
	my @links = map {
		$cgi->a({
			-href => href(
				action=>"snapshot",
				hash=>$hash,
				snapshot_format=>$_
			)
		}, $known_snapshot_formats{$_}{'display'})
	} @snapshot_fmts;
	return "snapshot (" . join(' ', @links) . ")";
}
2489
2490## ......................................................................
2491## functions returning values to be passed, perhaps after some
2492## transformation, to other functions; e.g. returning arguments to href()
2493
# returns hash to be passed to href to generate gitweb URL
# in -title key it returns description of link
#
# The optional argument is the feed format (default 'Atom'); its lowercased
# form becomes the 'action'.  Returns nothing when no project is selected
# or when the current action has no specific feed.
sub get_feed_info {
	my $format = shift || 'Atom';

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branches refs uses 'refs/heads/' prefix (fullname) to differentiate
	# from tag links; this also makes possible to detect branch links.
	# $hash_base takes precedence over $hash.
	my $branch;
	foreach my $ref ($hash_base, $hash) {
		next unless defined $ref;
		if ($ref =~ m!^refs/heads/(.*)$!) {
			$branch = $1;
			last;
		}
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} else {
		$type = defined $branch ? "log of $branch" : 'log';
	}

	my %res = (
		action      => lc($format),
		-title      => $type,
		'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
		'file_name' => $file_name,
	);
	return %res;
}
2529
2530## ----------------------------------------------------------------------
2531## git utility subroutines, invoking git commands
2532
# returns path to the core git executable and the --git-dir parameter as list;
# every call is counted in $number_of_git_cmds
sub git_cmd {
	$number_of_git_cmds += 1;
	return ($GIT, "--git-dir=$git_dir");
}
2538
# quote the given arguments for passing them to the shell
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Each argument is wrapped in single quotes; embedded ' and ! are closed
# out of the quotes, backslash-escaped, and the quotes reopened.
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $arg (@_) {
		# work on a copy, so that caller's arguments are left untouched
		(my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$escaped'";
	}
	return join(' ', @quoted);
}
2547
# get HEAD ref of given project as hash
# (whatever git_get_full_hash() returns for 'HEAD')
sub git_get_head_hash {
	my ($project) = @_;
	return git_get_full_hash($project, 'HEAD');
}
2552
# resolve a revision via git_get_hash() with no extra rev-parse options;
# all arguments are passed through unchanged
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2556
# resolve a revision via git_get_hash(), appending '--short=7' to the
# arguments so that rev-parse is asked for an abbreviated hash
sub git_get_short_hash {
	my @args = (@_, '--short=7');
	return git_get_hash(@args);
}
2560
# run "git rev-parse --verify -q [options] <hash>" in given project and
# return the first line of its output (chomped), or undef on failure.
#
# $git_dir is temporarily pointed at "$projectroot/$project"; the previous
# value is restored afterwards only if it was defined.
sub git_get_hash {
	my ($project, $hash, @options) = @_;

	my $saved_git_dir = $git_dir;
	$git_dir = "$projectroot/$project";

	my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
	my $resolved;
	if (open my $fd, '-|', @cmd) {
		$resolved = <$fd>;
		chomp $resolved if defined $resolved;
		close $fd;
	}

	$git_dir = $saved_git_dir if (defined $saved_git_dir);
	return $resolved;
}
2577
# get type of given object, as printed by "git cat-file -t";
# returns nothing if the command cannot be started or exits with failure
sub git_get_type {
	my ($hash) = @_;

	my @cmd = (git_cmd(), "cat-file", '-t', $hash);
	open(my $fd, "-|", @cmd)
		or return;
	my $type = <$fd>;
	# close() on a pipe reports failure of the command itself
	return unless close $fd;

	chomp $type;
	return $type;
}
2588
# repository configuration
# $config_file starts out as the empty string; git_get_project_config()
# compares it against "$git_dir/config" to decide whether %config has to be
# (re)read, and stores that path in it after filling %config.
our $config_file = '';
our %config;
2592
# store multiple values for single key as anonymous array reference
# single values stored directly in the hash, not as [ <value> ]
#
# First value for a key is stored as is, second one turns the entry into
# a two-element array reference, further ones are appended to that array.
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key}) {
		my $current = $hash->{$key};
		if (ref $current) {
			push @$current, $value;
		} else {
			$hash->{$key} = [ $current, $value ];
		}
	} else {
		$hash->{$key} = $value;
	}
}
2606
# return hash of git project configuration
# optionally limited to some section, e.g. 'gitweb'
#
# Runs "git config -z -l" and parses its NUL-separated records, each being
# "<key>\n<value>" (or just "<key>" for a key without value).  Keys that
# occur several times are collected by hash_set_multi().  $section_regexp,
# if given, is a regexp fragment matched against the part of the key
# before the first dot.  Returns nothing if the command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compile the section filter once per call.  The /o modifier must not
	# be used here: it would freeze the pattern of the very first call for
	# the lifetime of the process (mod_perl, FastCGI), silently ignoring
	# a different section passed later.
	my $section_filter = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $section_filter || $key =~ $section_filter);
	}
	close $fh;

	return %config;
}
2629
# convert config value to boolean: true or false value
# no value, number > 0, 'true' and 'yes' values are true
# rest of values are treated as false (never as error)
sub config_to_bool {
	my $val = shift;

	# section.key (key present without any value)
	return 1 unless defined $val;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	# section.key = 1
	my $number = ($val =~ /^\d+$/ && $val);
	return $number if $number;

	# section.key = true
	return $val =~ /^(?:true|yes)$/i;
}
2645
# convert config value to simple decimal number
# an optional value suffix of 'k', 'm', or 'g' will cause the value
# to be multiplied by 1024, 1048576, or 1073741824
#
# A value without recognized suffix is returned as is (after stripping
# surrounding whitespace); an undefined value (key without value) is
# returned as undef.  A bare suffix without digits yields 0.
sub config_to_int {
	my $val = shift;

	# key present without a value: nothing to convert, and the
	# substitutions below would only emit "uninitialized" warnings
	return $val unless defined $val;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
		my %multiplier = (
			'k' =>       1024,
			'm' =>    1048576,
			'g' => 1073741824,
		);
		# bare suffix, e.g. "k": count as 0 without a numeric warning
		$num = 0 if $num eq '';
		return $num * $multiplier{lc($unit)};
	}
	return $val;
}
2665
# convert config value to array reference, if needed:
# a reference is returned unchanged, a defined scalar is wrapped in
# a one-element array, and an undefined value gives an empty array
sub config_to_multi {
	my $val = shift;

	return $val if ref($val);
	return defined($val) ? [ $val ] : [];
}
2672
# get value of gitweb.<key> configuration variable of current repository
#
# $key may be given with or without the 'gitweb.' prefix; $type is
# optionally 'bool' or 'int' (a leading '--' is stripped), any other type
# is ignored.  The parsed 'gitweb' section is cached in %config, and
# re-read whenever $config_file differs from "$git_dir/config".
# Returns nothing if $git_dir is not set, the key is empty or contains
# non-word characters, or the variable does not exist.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
		$key = lc($1) . ".$2." . lc($3);
	} else {
		$key = lc($key);
	}
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);

	# type sanity check
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# get config
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $full_key = "gitweb.$key";
	return unless exists $config{$full_key};
	my $value = $config{$full_key};

	# ensure given type
	return $value unless defined $type;
	if ($type eq 'bool') {
		# backward compatibility: 'git config --bool' returns true/false
		return config_to_bool($value) ? 'true' : 'false';
	}
	# the only type left after sanity check is 'int'
	return config_to_int($value);
}
2718
# get hash of given path at given ref
#
# $base is the tree-ish to look in, $path the path inside it (trailing
# slashes are ignored), and $type optionally the required object type
# as printed by git-ls-tree.  Returns the object id, or undef when the
# path is empty, git-ls-tree fails, there is no such entry, the entry line
# cannot be parsed, or the type does not match.  undef is returned
# explicitly (not an empty list), so the result stays a single element
# when the call is made in list context.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift || return undef;
	my $type = shift;

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# The match result must be checked: on failure the capture variables
	# would still hold values of some earlier, unrelated match.
	# Object id is 40 (SHA-1) or 64 (SHA-256) hexadecimal digits.
	my ($entry_type, $entry_hash) =
		($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40}(?:[0-9a-fA-F]{24})?)\t/)
		or return undef;

	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2745
# get path of entry with given hash at given tree-ish (ref)
# used to get 'from' filename for combined diff (merge commit) for renames
#
# Scans the NUL-separated output of "git ls-tree -r -t -z $base" and
# returns the path of the first entry whose object id equals $hash;
# returns nothing for an empty $base or $hash, and undef if the command
# cannot be started or no entry matches.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;

	#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
	#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
	# $hash is quoted so that it is always matched literally, and /s with
	# \z lets the path part contain newlines, which are legal in file
	# names and are not escaped in -z output.
	my $entry_re = qr/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s;

	my $path;
	while (my $line = <$fd>) {
		chomp $line;

		if ($line =~ $entry_re) {
			$path = $1;
			last;
		}
	}
	close $fd;
	return $path;
}
2769
2770## ......................................................................
2771## git utility functions, directly accessing git repository
2772
# get the value of config variable either from file named as the variable
# itself in the repository ($GIT_DIR/$name file), or from gitweb.$name
# configuration variable in the repository config file.
#
# Sets $git_dir to "$projectroot/$path" as a side effect.  When the file
# can be opened only its first line (chomped) is returned, which is undef
# for an empty file.
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/$name") {
		# no such file: fall back to repository configuration
		return git_get_project_config($name);
	}
	my $first_line = <$fd>;
	close $fd;

	chomp $first_line if (defined $first_line);
	return $first_line;
}
2789
# get project description: 'description' file of the repository,
# or gitweb.description config variable
sub git_get_project_description {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'description');
}
2794
# get project category: 'category' file of the repository,
# or gitweb.category config variable
sub git_get_project_category {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'category');
}
2799
2800
# get content tags of given project, as reference to hash mapping
# tag name to its weight; sets $git_dir as a side effect
#
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			my $val = <$ct>;
			close $ct;

			(my $ctag = $tagfile) =~ s#.*/##;
			# an empty tag file leaves $val undefined; it must count as
			# weight 1 without an "uninitialized value" warning
			# (no chomp needed: '$' matches before a trailing newline)
			if (defined $val && $val =~ /^\d+$/) {
				chomp $val;
				$ctags->{$ctag} = $val;
			} else {
				$ctags->{$ctag} = 1;
			}
		}
		closedir $dh;

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2847
# return hash, where keys are content tags ('ctags'),
# and values are sum of weights of given tag in every project
#
# $projects is a reference to array of project info hashes, each of which
# holds its own tag => weight hash under the 'ctags' key.
sub git_gather_all_ctags {
	my $projects = shift;
	my %total;

	foreach my $pr (@$projects) {
		my @tags = keys %{$pr->{'ctags'}};
		$total{$_} += $pr->{'ctags'}->{$_}
			foreach @tags;
	}

	return \%total;
}
2862
# build tag cloud data out of hash of content tags (tag => weight)
#
# Tags differing only in case are merged; the spelling with the highest
# weight is the one displayed.  Returns an HTML::TagCloud object if that
# module can be loaded, otherwise a hash reference mapping lowercased tag
# to { count => <weight>, ctag => <link HTML> }.  The tag equal to the
# 'ctag' input parameter is wrapped in <span class="match">.
sub git_populate_project_tagcloud {
	my $ctags = shift;

	# First, merge different-cased tags; tags vote on casing
	my %ctags_lc;
	foreach my $name (keys %$ctags) {
		my $weight = $ctags->{$name};
		my $merged = ($ctags_lc{lc $name} ||= {});
		$merged->{count} += $weight;
		if (not $merged->{topcount}
		    or $merged->{topcount} < $weight) {
			$merged->{topcount} = $weight;
			$merged->{topname}  = $name;
		}
	}

	my $matched = $input_params{'ctag'};
	# mark up title of the currently selected tag
	my $highlight = sub {
		my ($ctag, $title) = @_;
		return $title
			unless (defined $matched && $matched eq $ctag);
		return qq(<span class="match">$title</span>);
	};

	my $cloud;
	if (eval { require HTML::TagCloud; 1; }) {
		$cloud = HTML::TagCloud->new;
		foreach my $ctag (sort keys %ctags_lc) {
			# Pad the title with spaces so that the cloud looks
			# less crammed.
			my $title = esc_html($ctags_lc{$ctag}->{topname});
			$title =~ s/ /&nbsp;/g;
			$title =~ s/^/&nbsp;/g;
			$title =~ s/$/&nbsp;/g;
			$title = $highlight->($ctag, $title);
			$cloud->add($title, href(project=>undef, ctag=>$ctag),
			            $ctags_lc{$ctag}->{count});
		}
	} else {
		$cloud = {};
		foreach my $ctag (keys %ctags_lc) {
			my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
			$title = $highlight->($ctag, $title);
			my $entry = ($cloud->{$ctag} ||= {});
			$entry->{count} = $ctags_lc{$ctag}->{count};
			$entry->{ctag} =
				$cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
		}
	}
	return $cloud;
}
2908
# return HTML of tag cloud, limited to $count tags
#
# $cloud is what git_populate_project_tagcloud() built: either an
# HTML::TagCloud object, which renders itself, or a plain hash reference
# mapping tag to { count => ..., ctag => <link HTML> }.  In the latter
# case the $count tags with the highest weight are shown, heaviest first,
# as a comma separated list.
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;

	if (ref $cloud eq 'HTML::TagCloud') {
		return $cloud->html_and_css($count);
	}

	# Sort by descending weight, so that the limit below keeps the most
	# used tags rather than the least used ones; ties are broken by
	# name to get stable output.
	my @tags = sort {
		$cloud->{$b}->{'count'} <=> $cloud->{$a}->{'count'}
			or $a cmp $b
	} keys %$cloud;
	splice(@tags, $count)
		if (defined $count && @tags > $count);

	return
		'<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
		join (', ', map {
			$cloud->{$_}->{'ctag'}
		} @tags) .
		'</div>';
}
2923
# get list of URLs of given project: lines of its 'cloneurl' file,
# or values of gitweb.url config variable if that file cannot be opened.
# Sets $git_dir as a side effect.  Returns a list in list context,
# and an array reference otherwise.
sub git_get_project_url_list {
	my $path = shift;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/cloneurl") {
		# no cloneurl file: use repository configuration
		my $from_config = config_to_multi(git_get_project_config('url'));
		return wantarray ? @$from_config : $from_config;
	}
	my @urls = <$fd>;
	chomp @urls;
	close $fd;

	return wantarray ? @urls : \@urls;
}
2937
# get list of projects, as list of hash references with 'path' key
# (and 'owner' key, when projects are read from a file)
#
# $projects_list is either a directory, which is scanned for repositories
# accepted by check_export_ok(), or a file with one url-encoded
# "<path> <owner>" entry per line.  With nonempty $filter only projects
# whose path begins with "$filter/" are returned.  When scanning
# a directory, $filter normally narrows the scan to that subdirectory;
# if $paranoid is true the whole tree is scanned and the paths found are
# filtered instead.
sub git_get_projects_list {
	my $filter = shift || '';
	my $paranoid = shift;
	my @list;

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list;
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);
		# when filtering, search only given subdirectory
		if ($filter && !$paranoid) {
			$dir .= "/$filter";
			$dir =~ s!/+$!!;
		}

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => sub {
				# global variables
				our $project_maxdepth;
				our $projectroot;
				# skip project-list toplevel, if we get it.
				return if (m!^[/.]$!);
				# only directories can be git repositories
				return unless (-d $_);
				# don't traverse too deep (Find is super slow on os x)
				# $project_maxdepth excludes depth of $projectroot
				if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
					$File::Find::prune = 1;
					return;
				}

				my $path = substr($File::Find::name, $pfxlen + 1);
				# paranoidly only filter here
				if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
					# We are inside a subroutine called by File::Find,
					# not inside a loop of our own: leave with 'return'.
					# 'next' would exit the subroutine via loop control
					# and skip part of File::Find's own loop body.
					return;
				}
				# we check related file in $projectroot
				if (check_export_ok("$projectroot/$path")) {
					push @list, { path => $path };
					$File::Find::prune = 1;
				}
			},
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		open my $fd, '<', $projects_list or return;
	PROJECT:
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			# skip empty lines, before trying to decode anything
			if (!defined $path) {
				next PROJECT;
			}
			$path = unescape($path);
			$owner = unescape($owner);
			# if $filter is provided, check if $path begins with $filter
			if ($filter && $path !~ m!^\Q$filter\E/!) {
				next PROJECT;
			}
			if (check_export_ok("$projectroot/$path")) {
				my $pr = {
					path => $path,
					owner => to_utf8($owner),
				};
				push @list, $pr;
			}
		}
		close $fd;
	}
	return @list;
}
3019
# return list of projects with forks filtered out
#
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
# as side effects it sets 'forks' field to list of forks for forked projects
#
# A project 'repo.git' (or 'repo') may have forks only if the directory
# "$projectroot/repo" exists; any project whose path lies below such
# a directory is taken to be a fork of it.
sub filter_forks_from_projects_list {
	my $projects = shift;

	my %trie; # prefix tree of directories (path components)
	# generate trie out of those directories that might contain forks
	foreach my $pr (@$projects) {
		my $path = $pr->{'path'};
		$path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
		next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
		next unless ($path);      # skip '.git' repository: tests, git-instaweb
		next unless (-d "$projectroot/$path"); # containing directory exists
		$pr->{'forks'} = [];      # there can be 0 or more forks of project

		# add to trie: follow existing nodes, create the missing ones
		my $node = \%trie;
		foreach my $dir (split('/', $path)) {
			$node->{$dir} = {}
				unless (exists $node->{$dir});
			$node = $node->{$dir};
		}
		# create end marker, store $pr as a data
		$node->{''} = $pr
			unless (exists $node->{''});
	}

	# filter out forks, by finding shortest prefix match for paths
	my @filtered;
	foreach my $pr (@$projects) {
		# trie lookup
		my $node = \%trie;
		my $forked_from; # project whose directory contains $pr, if any
		foreach my $dir (split('/', $pr->{'path'})) {
			if (exists $node->{''}) {
				# found [shortest] prefix, is a fork
				$forked_from = $node->{''};
				last;
			}
			# not in trie, cannot have prefix, not a fork
			last unless (exists $node->{$dir});
			# If the dir is there, we just walk one step down the trie.
			$node = $node->{$dir};
		}

		if ($forked_from) {
			# a fork is recorded with its parent and left out of the result
			push @{$forked_from->{'forks'}}, $pr;
		} else {
			# either no match, or we ran out of path components
			push @filtered, $pr;
		}
	}

	return @filtered;
}
3079
# Select projects by content tag and/or by regular expression.
#
# Options: 'tagfilter' (a tag name, compared case-insensitively with the
# keys of the project's 'ctags' hash) and 'search_regexp' (matched against
# 'path' and 'descr_long').  With neither option set the input list is
# returned as is.  Otherwise fill_project_list_info() is called here to
# request the fields the search needs before the projects are examined.
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my $tagfilter = $opts{'tagfilter'};
        my $search_re = $opts{'search_regexp'};

        return @$projlist
                if (!$tagfilter && !$search_re);

        # ask only for the fields that the active criteria look at
        my @wanted_fields;
        push @wanted_fields, 'ctags'         if $tagfilter;
        push @wanted_fields, 'path', 'descr' if $search_re;
        fill_project_list_info($projlist, @wanted_fields);

        my @matching;
        foreach my $candidate (@$projlist) {
                if ($tagfilter) {
                        next if ref($candidate->{'ctags'}) ne 'HASH';
                        my $wanted_tag = lc($tagfilter);
                        next unless
                                grep { lc($_) eq $wanted_tag } keys %{$candidate->{'ctags'}};
                }

                if ($search_re) {
                        next if ($candidate->{'path'} !~ /$search_re/ &&
                                 $candidate->{'descr_long'} !~ /$search_re/);
                }

                push @matching, $candidate;
        }

        return @matching;
}
3115
# Owners read from the $projects_list file, as a hash reference mapping
# project path to owner; stays undef until the file has been looked at.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from $projects_list (done at most once).
#
# The file holds one project per line, url-encoded, followed by its owner:
# 'git%2Fgit.git Linus+Torvalds'
# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
#
# If $projects_list is not a plain file, or cannot be opened, the cache is
# left as an empty hash.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        return unless (-f $projects_list);

        # a file that exists but cannot be opened is treated like a
        # missing one, instead of reading from an unopened handle
        open(my $fd, '<', $projects_list)
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($pr, $ow) = split ' ', $line;
                # blank line: nothing to record (and no undefined hash key)
                next unless defined $pr;
                $pr = unescape($pr);
                $ow = unescape($ow);
                $gitweb_project_owner->{$pr} = to_utf8($ow);
        }
        close $fd;
        return;
}
3138
# Return the owner of a project, or undef if $project is empty or no
# owner can be found.  Sets the global $git_dir to the project directory.
#
# Sources are tried in this order: the entry for the project in
# $gitweb_project_owner (loaded on first use), the 'owner' value from
# git_get_project_config(), and finally get_file_owner() on $git_dir.
sub git_get_project_owner {
        my ($project) = @_;
        return undef unless $project;

        $git_dir = "$projectroot/$project";

        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if exists $gitweb_project_owner->{$project};
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
3162
# Find out how long ago the project at $path (relative to $projectroot)
# was last committed to.  Sets the global $git_dir.
#
# Asks git-for-each-ref for the committer line of the single most
# recently committed ref under refs/heads.  Returns the list
# (age in seconds, age_string of it); (undef, undef) if no timestamp
# could be parsed; an empty list if the command could not be started or
# its handle did not close cleanly.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        open(my $fd, "-|", git_cmd(), 'for-each-ref',
             '--format=%(committer)',
             '--sort=-committerdate',
             '--count=1',
             'refs/heads') or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the committer line ends in "<epoch> <timezone>"
        return (undef, undef)
                unless (defined $most_recent &&
                        $most_recent =~ / (\d+) [-+][01]\d\d\d$/);

        my $age = time - $1;
        return ($age, age_string($age));
}
3183
# Return the remotes listed by 'git remote -v', as a hash (or, in scalar
# context, a hash reference) keyed by remote name.  Each value is a hash
# with a 'heads' entry (initially undef) plus one entry per parenthesised
# word printed after the URL, holding that URL.  If $wanted is given, only
# the remote of that name is returned.  Returns nothing if the command
# cannot be started or its handle does not close cleanly.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find if that
# particular remote is defined is to walk the list provided by 'git remote -v'
# and stop if and when we find what we want.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # check the result of open itself: the lexical handle is defined
        # even when open fails, so testing the handle detects nothing
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # expected shape: name, tab, URL, whitespace, '(word)';
                # cut everything after the name, and skip lines of any
                # other shape so that stale captures are never used
                $remote =~ s!\t(.*?)\s+\((\w+)\)$!!
                        or next;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # explicit undef: a bare () here made an odd-length
                # hash constructor (same value, but with a warning)
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3208
# Takes a reference to a hash of remotes (keyed by remote name) and fills
# it by storing, under each remote's 'heads' key, a reference to the list
# of heads found for that remote.
#
# The heads come from a single git_get_heads_list() call for the
# "remotes/<name>" class of every remote.  A head belongs to a remote
# when its name starts with "<name>/"; that prefix is removed from the
# head's 'name' in the process.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q..\E: the remote name is literal text, not a pattern
                # (names may contain characters such as '.' or '+');
                # the substitution both selects the head and strips the prefix
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3221
# Collect refs by the object id they point to, using
# "git show-ref --dereference".  With a $type, only "refs/$type" is asked
# for and only ref names starting with $type are kept.
#
# Returns a reference to a hash mapping each 40-digit id to a reference
# to the list of ref names (without the leading "refs/") seen for it;
# returns nothing if the command cannot be started or its handle does
# not close cleanly.  Example output lines:
# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
sub git_get_references {
        my $type = shift || "";
        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();

        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        my %refs;
        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                # the list for an id springs into existence on first push
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
3244
# Return the name "git name-rev --tags" gives to $hash, without its
# leading "tags/".  Returns undef if $hash is empty, if the command
# printed nothing, or if the output does not have the form
# "<hash> tags/<name>"; returns nothing if the command cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all: nothing to match against
        return undef unless defined $name_rev;

        # $hash is matched as literal text, not as a pattern
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
3260
3261## ----------------------------------------------------------------------
3262## parse to hash functions
3263
# Break an epoch timestamp down into a hash of date fields.
#
# $epoch is the time in seconds; $tz is a timezone of the form "+HHMM" or
# "-HHMM" (default "-0000").  The returned hash has, for UTC: 'hour',
# 'minute', 'mday', 'day' (weekday name), 'month' (month name),
# 'rfc2822', 'mday-time' and 'iso-8601'; and for the given timezone:
# 'hour_local', 'minute_local', 'tz_local' ($tz as given) and 'iso-tz'.
# A $tz that does not have the expected form is treated as a zero offset.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # offset of the timezone from UTC in seconds; only computed when
        # $tz really matched, so undefined captures are never used
        my $tz_offset = 0;
        if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
                my $tz_sign = ($1 eq '-' ? -1 : +1);
                $tz_offset = $tz_sign*((($2*60) + $3)*60);
        }
        # shifting the epoch and using gmtime gives the wall-clock time
        # in the requested timezone
        ($sec, $min, $hour, $mday, $mon, $year) = gmtime($epoch + $tz_offset);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3297
# Parse the tag object $tag_id, as printed by "git cat-file tag", into a
# hash.
#
# Fields: 'id' (the argument), 'object', 'type', 'name', and from the
# tagger line 'author', 'author_epoch', 'author_tz', 'author_name' and
# (when the author has the "Name <email>" form) 'author_email'.
# 'comment' is a reference to the list of lines that follow the headers.
# Returns nothing if the command cannot be started, if its handle does
# not close cleanly, or if no "tag" header was found.
sub parse_tag {
        my ($tag_id) = @_;
        my %tag = ('id' => $tag_id);
        my @comment;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id
                or return;

        # headers end at the first empty line, or at a '--BEGIN' line,
        # which is kept as the first line of the comment
        while (my $line = <$fd>) {
                chomp $line;
                last if $line eq "";

                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                } elsif ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                } elsif ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        my ($name, $email) = $tag{'author'} =~ m/^([^<]+) <([^>]*)>/;
                        if (defined $name) {
                                $tag{'author_name'}  = $name;
                                $tag{'author_email'} = $email;
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                } elsif ($line =~ m/--BEGIN/) {
                        push @comment, $line;
                        last;
                }
        }
        # whatever is left on the handle is the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
3338
# Parse the text of one commit, in the form read from
# "git rev-list --header" by parse_commit() and parse_commits(), into a
# hash.
#
# The first line holds the commit id, optionally followed by parent ids;
# unless $withparents is defined, parents are also taken from "parent"
# header lines.  Fields set: 'id', 'tree', 'parents', 'parent' (first
# parent), 'author*' and 'committer*' (name, email, epoch, tz), 'title',
# 'title_short', 'comment' (reference to the message lines with the
# 4-space indent removed), 'age', 'age_string', 'age_string_date' and
# 'age_string_age'.  Returns nothing if the text is empty, does not start
# with a 40-digit id, or has no "tree" header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my %co;

        my @commit_lines = split '\n', $commit_text;
        pop @commit_lines; # Remove '\0'
        return unless @commit_lines;

        my $header = shift @commit_lines;
        return unless $header =~ m/^[0-9a-fA-F]{40}/;
        ($co{'id'}, my @parents) = split ' ', $header;

        # header lines; the loop stops at the empty line before the message
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        @co{'author_epoch', 'author_tz'} = ($2, $3);
                        my ($name, $email) = $co{'author'} =~ m/^([^<]+) <([^>]*)>/;
                        if (defined $name) {
                                $co{'author_name'}  = $name;
                                $co{'author_email'} = $email;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        @co{'committer_epoch', 'committer_tz'} = ($2, $3);
                        my ($name, $email) = $co{'committer'} =~ m/^([^<]+) <([^>]*)>/;
                        if (defined $name) {
                                $co{'committer_name'}  = $name;
                                $co{'committer_email'} = $email;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        return unless defined $co{'tree'};
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # The title is the first non-empty message line.  Note that $title
        # aliases the element of @commit_lines, so the edits made to it
        # below are also visible in 'comment'.
        foreach my $title (@commit_lines) {
                $title =~ s/^    //;
                next if $title eq "";

                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        $title =~ s/(http|rsync):\/\/// if length($title) > 50;
                        $title =~ s/(master|www|rsync)\.// if length($title) > 50;
                        $title =~ s/kernel.org:?// if length($title) > 50;
                        $title =~ s/\/pub\/scm// if length($title) > 50;
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        unless (defined $co{'title'} && $co{'title'} ne "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        s/^    // foreach @commit_lines;
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my (undef, undef, undef, $mday, $mon, $year) = gmtime($co{'committer_epoch'});
        my $commit_date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        # commits older than two weeks show the date first, others the age
        @co{'age_string_date', 'age_string_age'} =
                ($age > 60*60*24*7*2)
                ? ($commit_date, $co{'age_string'})
                : ($co{'age_string'}, $commit_date);
        return %co;
}
3436
# Parse the single commit $commit_id into a hash (see parse_commit_text).
#
# Runs "git rev-list --parents --header --max-count=1" and reads its
# NUL-terminated output.  Returns an empty hash when git printed nothing
# or the text could not be parsed; calls die_error() with status 500 if
# the command cannot be started.
sub parse_commit {
        my ($commit_id) = @_;
        my %co;

        # records in --header output are terminated by NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--"
                or die_error(500, "Open git-rev-list failed");
        # read exactly one record, in scalar context: a list-context read
        # that returned nothing would let the flag below slide into the
        # place of the commit text
        my $commit_text = <$fd>;
        close $fd;

        %co = parse_commit_text($commit_text, 1)
                if defined $commit_text;

        return %co;
}
3455
# Parse a range of commits starting at $commit_id into a list of hash
# references (see parse_commit_text), returned as a list or, in scalar
# context, as an array reference.
#
# $maxcount (default 1) and $skip (default 0) are passed to git-rev-list
# as --max-count and --skip; $filename, if given, limits history to that
# path; @args and the global @extra_options are passed through as
# further options.  Calls die_error() with status 500 if the command
# cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount = 1 unless $maxcount;
        $skip     = 0 unless $skip;
        my @path_limit = $filename ? ($filename) : ();

        # records in --header output are terminated by NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--header",
                @args,
                ("--max-count=" . $maxcount),
                ("--skip=" . $skip),
                @extra_options,
                $commit_id,
                "--",
                @path_limit
                or die_error(500, "Open git-rev-list failed");

        my @cos;
        while (my $record = <$fd>) {
                # one fresh hash per record
                push @cos, +{ parse_commit_text($record) };
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3483
# Parse one line of git-diff-tree "raw" output into a hash, returned as a
# list or, in scalar context, as a hash reference.  Three kinds of lines
# are recognized; any other line gives an empty hash.
#
# Ordinary diff: 'from_mode', 'to_mode', 'from_id', 'to_id', 'status',
# 'similarity', 'from_file' and 'to_file' (plus 'file' unless the status
# is R or C, where the two names are given separately):
# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
#
# Combined diff (for merge commit): 'nparents', array references
# 'from_mode', 'from_id' and 'status' (one entry per parent), and scalar
# 'to_mode', 'to_id' and 'to_file':
# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
#
# Commit id alone on a line: 'commit':
# 'c512b523472485aef4fff9e57b229d9d243c967f'
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        if (my @field = $line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{qw(from_mode to_mode from_id to_id status similarity)} = @field[0 .. 5];
                my $names = $field[6];
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $names);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
                }
        }
        elsif (my @merge = $line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
                my ($colons, $modes, $ids, $statuses, $name) = @merge;
                $res{'nparents'}  = length($colons);
                # the last mode and the last id belong to the result
                $res{'from_mode'} = [ split(' ', $modes) ];
                $res{'to_mode'} = pop @{$res{'from_mode'}};
                $res{'from_id'} = [ split(' ', $ids) ];
                $res{'to_id'} = pop @{$res{'from_id'}};
                $res{'status'} = [ split('', $statuses) ];
                $res{'to_file'} = unquote($name);
        }
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3522
# wrapper: return parsed line of git-diff-tree "raw" output
#
# A hash reference is taken to be already parsed (or generated by hand)
# and is returned unchanged; anything else is treated as a raw line and
# handed to parse_difftree_raw_line().
sub parsed_difftree_line {
        my ($line_or_ref) = @_;

        return ref($line_or_ref) eq "HASH"
                ? $line_or_ref
                : parse_difftree_raw_line($line_or_ref);
}
3535
# Parse one line of git-ls-tree output into a hash, returned as a list
# or, in scalar context, as a hash reference.
#
# Options: '-l' - the line has a size column, which is stored as 'size';
# '-z' - the file name is used as is, otherwise it goes through unquote().
# Fields: 'mode', 'type', 'hash', 'name' (and 'size' with '-l').
# A line that does not have the expected form gives an empty hash.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        # the fields are taken from the list returned by the match, so a
        # failed match cannot pick up captures left by an earlier one
        my @fields;
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                @fields = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;
                @res{qw(mode type hash size name)} = @fields
                        if @fields;
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                @fields = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;
                @res{qw(mode type hash name)} = @fields
                        if @fields;
        }

        if (@fields && !$opts{'-z'}) {
                $res{'name'} = unquote($res{'name'});
        }

        return wantarray ? %res : \%res;
}
3571
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# $diffinfo is a parsed difftree line; $from and $to are filled with
# 'file' and 'href' (a "blob" link) for the two sides of the diff.  For
# a combined diff ($diffinfo has 'nparents') the 'file' and 'href' of
# $from are array references with one entry per parent, the parents
# being given in @parents; otherwise the global $hash_parent is used as
# the base of the link.  The link of $to is based on the global $hash.
# No link is given for a side on which the file does not exist.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the name in the result
                        my $parent_file = $diffinfo->{'from_file'}[$i];
                        $from->{'file'}[$i] = defined $parent_file
                                ? $parent_file
                                : $diffinfo->{'to_file'};
                        # no link for a file that is new (added) for this parent
                        $from->{'href'}[$i] = ($diffinfo->{'status'}[$i] ne "A")
                                ? href(action=>"blob",
                                       hash_base=>$parents[$i],
                                       hash=>$diffinfo->{'from_id'}[$i],
                                       file_name=>$from->{'file'}[$i])
                                : undef;
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) { # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3617
3618## ......................................................................
3619## parse to array of hashes functions
3620
# List refs of the given classes (default: 'heads'), most recently
# committed first, using git-for-each-ref on "refs/<class>".
#
# With a $limit, one ref more than the limit is asked for.  Each ref is
# a hash with 'fullname', 'name' (without a leading "refs/heads/" or
# "refs/remotes/"), 'id', 'title' (commit subject, or a placeholder),
# 'epoch' and 'age' ("unknown" when there is no epoch).  Returns a list
# of hash references, or an array reference in scalar context; returns
# nothing if the command cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @count_opt = $limit ? ('--count='.($limit+1)) : ();
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count_opt, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # a NUL separates the ref information from the committer
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($id, $fullname, $title) = split(' ', $refinfo, 3);
                my $epoch = ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/)[1];
                (my $name = $fullname) =~ s!^refs/(?:head|remote)s/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'name'     => $name,
                        'id'       => $id,
                        'title'    => $title || '(no commit message)',
                        'epoch'    => $epoch,
                );
                $ref_item{'age'} = $epoch ? age_string(time - $epoch) : "unknown";

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3659
# List the refs under refs/tags, most recently created first, using
# git-for-each-ref.
#
# With a $limit, one ref more than the limit is asked for.  Each tag is
# a hash with 'fullname', 'name' (without "refs/tags/"), 'type' and 'id'
# of the ref's object, and 'reftype'/'refid': for a tag object these
# (and 'subject') come from the output line, otherwise they repeat
# 'type' and 'id'.  'epoch' and 'age' are set for tag and commit objects
# only.  Returns a list of hash references, or an array reference in
# scalar context; returns nothing if the command cannot be started.
sub git_get_tags_list {
        my $limit = shift;
        my @count_opt = $limit ? ('--count='.($limit+1)) : ();
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count_opt, '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # a NUL separates the ref information from the creator
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $fullname, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my $epoch = ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/)[1];
                (my $name = $fullname) =~ s!^refs/tags/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'type'     => $type,
                        'id'       => $id,
                        'name'     => $name,
                );
                if ($type eq "tag") {
                        @ref_item{'subject', 'reftype', 'refid'} = ($title, $reftype, $refid);
                } else {
                        @ref_item{'reftype', 'refid'} = ($type, $id);
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = $epoch ? age_string(time - $epoch) : "unknown";
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3708
3709## ----------------------------------------------------------------------
3710## filesystem-related functions
3711
# Return the name of the owner of $path: the GECOS field of the passwd
# entry of the file's uid, cut at the first ',' or ';' and converted with
# to_utf8().  Returns undef if the file cannot be stat'ed or no GECOS
# field is available for its uid.
sub get_file_owner {
        my $path = shift;

        # element 4 of stat() is the uid; without this check a failed
        # stat would pass undef on to getpwuid(), which then looks up uid 0
        my $st_uid = (stat($path))[4];
        return undef unless defined $st_uid;

        # element 6 of getpwuid() is the GECOS field
        my $gcos = (getpwuid($st_uid))[6];
        return undef unless defined $gcos;

        (my $owner = $gcos) =~ s/[,;].*$//;
        return to_utf8($owner);
}
3724
# Print the contents of file $filename, each line converted with to_utf8().
# The file is assumed to exist; if it cannot be opened, nothing is printed.
sub insert_file {
        my $filename = shift;

        # do not read from a handle that failed to open
        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3733
3734## ......................................................................
3735## mimetype related functions
3736
# Look up the MIME type for $filename in the map file $mimemap.
#
# Each line of the map file that is not a comment ('#' in the first
# column) holds a MIME type followed by the extensions it applies to,
# separated by whitespace; when an extension is listed more than once the
# last line wins.  The extension of $filename is the text after its last
# '.'.  Returns undef if the map file is not readable, if $filename has
# no '.', or if the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # take the extension from the match itself, so that a name
        # without '.' cannot pick up a capture left by an earlier match
        my ($wanted_ext) = $filename =~ /\.([^.]*)$/;
        return undef unless defined $wanted_ext;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # read into a lexical: a bare while (<$mh>) would overwrite the
        # caller's $_
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/, $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$wanted_ext};
}
3756
# Guess the MIME type of $filename from its extension.
#
# Looks first in $mimetypes_file, if set (a path not starting with '/'
# is taken relative to the current project's directory), and then in
# '/etc/mime.types'.  Returns undef for a name without '.', or when
# neither map gives a type.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # a relative path is relative to project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime = mimetype_guess_file($filename, '/etc/mime.types')
                unless $mime;
        return $mime;
}
3773
# Decide on the MIME type of a blob, given a filehandle $fd to its
# contents and (optionally) its file name.
#
# The type guessed from the file name by mimetype_guess() is preferred.
# Failing that: without a filehandle $default_blob_plain_mimetype is
# returned; contents that pass the -T (text) test are 'text/plain';
# otherwise the type follows the .png, .gif or .jpg/.jpeg extension,
# with 'application/octet-stream' for everything else.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $mime = mimetype_guess($filename);
                return $mime if $mime;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain'               if -T $fd;
        return 'application/octet-stream' unless $filename;
        return 'image/png'                if $filename =~ m/\.png$/i;
        return 'image/gif'                if $filename =~ m/\.gif$/i;
        return 'image/jpeg'               if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3800
# Return the content type to send for a blob: $type if given, otherwise
# the result of blob_mimetype($fd, $file_name).  For 'text/plain' the
# charset from $default_text_plain_charset, if defined, is appended.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name)
                unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return "$type; charset=$default_text_plain_charset";
}
3811
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Nothing is guessed unless $highlight is true and $file_name is defined.
# The base name of the file (with a trailing '.in' removed) is looked up
# in %highlight_basename; failing that, the text after its last '.' is
# looked up in %highlight_ext.  $mimetype is not used.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # take the extension from the match itself: for a name without
        # '.' a capture left by an earlier match must not be used
        my ($ext) = $basename =~ /\.([^.]*)$/;
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3828
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# Highlighting is done only if $highlight is true and $syntax is defined.
# In that case $fd is closed and reopened on a shell pipeline that feeds
# the blob named by the global $hash ("git cat-file blob") into
# $highlight_bin.  Calls die_error() with status 500 if the pipeline
# cannot be started.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight && defined $syntax);

        close $fd;
        # $syntax goes through quote_command() like the other words of the
        # command line, so that it reaches the highlighter as one argument
        my $pipeline =
                quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
                quote_command($highlight_bin).
                " --replace-tabs=8 --fragment --syntax ".
                quote_command($syntax);
        # explicit '-|' mode: the command string is not searched for a
        # mode, as it is by the two-argument form of open
        open $fd, '-|', $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3842
3843## ======================================================================
3844## functions printing HTML: header, footer, error page
3845
# Build the page title from the globals describing the current request.
#
# The title starts with $site_name.  Without a project, " - projects in
# '<filter>'" is added if $project_filter is defined.  With a project,
# the project name is added, then "/<action>" if $action is defined, then
# " - <file name>" if $file_name is defined as well (with a trailing '/'
# for the "tree" action when the name does not already end in one).
sub get_page_title {
        my $title = to_utf8($site_name);

        if (!defined $project) {
                $title .= " - projects in '" . esc_path($project_filter) . "'"
                        if defined $project_filter;
                return $title;
        }
        $title .= " - " . to_utf8($project);

        if (defined $action) {
                $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                if (defined $file_name) {
                        $title .= " - " . esc_path($file_name);
                        $title .= "/"
                                if ($action eq "tree" && $file_name !~ m|/$|);
                }
        }

        return $title;
}
3868
# Choose the content type for generated HTML pages.
sub get_content_type_html {
        # 'application/xhtml+xml' is sent only to user agents that list it
        # explicitly in their Accept header; everybody else gets plain old
        # 'text/html'.  This is needed because MSIE sometimes globs '*/*',
        # pretending to support xhtml+xml but choking when it gets it.
        my $accept = $cgi->http('HTTP_ACCEPT');

        return 'text/html'
                unless defined $accept;
        return 'text/html'
                unless $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/;
        return 'text/html'
                if $cgi->Accept('application/xhtml+xml') == 0;

        return 'application/xhtml+xml';
}
3882
# Print the <link rel="alternate" .../> elements advertising feeds.
# For a project view two links are printed per feed format (RSS, Atom):
# the plain feed and a '--no-merges' variant.  Without a project, links to
# the plain-text projects list and to the OPML list are printed instead.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # %href_params is shared between iterations: clear the
                        # '--no-merges' option left over from the previous
                        # format, or the plain feed link of this format would
                        # point to the "no merges" feed
                        $href_params{'extra_options'} = undef;
                        $href_params{'action'} = $type;
                        $link_attr{'-href'} = href(%href_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        # same feed, but without merge commits
                        $href_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%href_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3927
# Print the <link> elements of the HTML head: stylesheets, feed links
# (only for a '200 OK' page) and the favicon.
sub print_header_links {
        my $status = shift;

        # a $stylesheet defined in a config file takes precedence (backwards
        # compatibility); otherwise every non-empty entry of @stylesheets
        # is linked
        my @sheets = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
                if defined $favicon;
}
3947
# Print breadcrumb links for a list of directory components.
# Every argument is one path component; each one is printed as a link to
# the project list filtered by the path accumulated so far, followed
# by " / ".
sub print_nav_breadcrumbs_path {
        my $dirprefix = undef;
        foreach my $part (@_) {
                # Stop at a missing or empty component, but do accept names
                # such as "0", which are false in boolean context and would
                # otherwise silently cut the breadcrumbs short.
                last unless (defined $part && length $part);

                $dirprefix .= "/" if defined $dirprefix;
                $dirprefix .= $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => $dirprefix,
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
3959
# Print the breadcrumb navigation: home link, then either the project
# (directories, project name, action and the optional -action_extra text)
# or the components of the project filter.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $action_extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                my @dirname = split '/', $project;
                my $projectbasename = pop @dirname;
                print_nav_breadcrumbs_path(@dirname);
                print $cgi->a({-href => href(action=>"summary")}, esc_html($projectbasename));

                if (defined $action) {
                        # the action is a link only when something follows it
                        my $action_print = defined $action_extra
                                ? $cgi->a({-href => href(action=>$action)},
                                          $action)
                                : $action;
                        print " / $action_print";
                }
                print " / $action_extra"
                        if defined $action_extra;
                print "\n";
        } elsif (defined $project_filter) {
                print_nav_breadcrumbs_path(split '/', $project_filter);
        }
}
3985
# Print the search form shown in the page header of project views.
# Sets the global $searchtext to "" when it is undefined.
sub print_search_form {
        $searchtext = "" unless defined $searchtext;

        # search starts from hash_base, else from hash, else from HEAD
        my $search_hash = defined $hash_base ? $hash_base
                        : defined $hash      ? $hash
                        :                      "HEAD";

        my $form_action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        $form_action .= "/".esc_url($project)
                if $use_pathinfo;

        print $cgi->startform(-method => "get", -action => $form_action) .
              "<div class=\"search\">\n" .
              # with path_info the project is part of the form action,
              # otherwise it is passed as hidden 'p' parameter
              ($use_pathinfo
               ? ""
               : $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
              " search:\n",
              $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
4021
# Print the HTTP header (unless the '-no_http_header' option is set) and
# the top of the HTML page: <head>, site header, logo, breadcrumbs and,
# for project views with the 'search' feature enabled, the search form.
# Parameters: HTTP status (defaults to "200 OK"), expires value, and
# options, which are also passed on to print_nav_breadcrumbs().
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}"
                if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # relative URLs (stylesheet, favicon, ...) resolve correctly with
        # path_info only if the base URL is given explicitly
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my $logo_img = $cgi->img({-src => esc_url($logo),
                                          -width => 72, -height => 27,
                                          -alt => "git",
                                          -class => "logo"});
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $logo_img);
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $have_search);
}
4080
# Print the bottom of the HTML page: page footer with feed links, timing
# information (with the 'timed' feature), site footer, the JavaScript
# setup, and the closing </body> and </html> tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                # no project: link to the lists of projects
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                $feed_class .= ' generic'
                        unless %href_params;
                $href_params{'-title'} = 'log'
                        unless $href_params{'-title'};

                for my $format ('RSS', 'Atom') {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;

        my $incremental_blame =
                (defined $action && $action eq 'blame_incremental');
        if (!$incremental_blame) {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # onload handler: fix up links and set up timezone selection,
                # each only when the respective feature is enabled
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!;
                print qq!       fixLinks();\n!
                        if gitweb_check_feature('javascript-actions');
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                print qq!};\n!.
                      qq!</script>\n!;
        } else {
                # 'blame_incremental' view fetches its data via JavaScript
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4159
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# The error message is HTML-escaped; the detailed description is printed
# as-is.  Further arguments are options, passed on to git_header_html();
# with the '-error_handler' option the sub returns after printing the page
# instead of jumping to DONE_GITWEB.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # A status code outside the table must not be passed on as undef:
        # git_header_html() would then fall back to "200 OK" and the error
        # page would be served as a success.  Treat it as a server error.
        my $http_status = exists $http_responses{$status}
                ? $http_responses{$status}
                : $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4203
4204## ----------------------------------------------------------------------
4205## functions printing or outputting HTML: navigation
4206
# Print the page navigation bar: the standard views (minus $suppress),
# plus custom links from the 'actions' feature, with the $current view
# shown as plain text.  $extra (pager or formats) goes on the second line.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters for each view
        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;
        if (defined $head) {
                my @views_with_head = qw(commit commitdiff);
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        push @views_with_head, qw(shortlog log);
                }
                $arg{$_}{'hash'} = $head foreach @views_with_head;
        }

        if (defined $treehead) {
                $arg{'tree'}{'hash'} = $treehead;
        }
        if (defined $treebase) {
                $arg{'tree'}{'hash_base'} = $treebase;
        }

        # custom actions come as a flat list of (label, link, position)
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        for (my $i = 0; $i < @actions; $i += 3) {
                my ($label, $link, $pos) = @actions[$i .. $i + 2];
                # put the new label right after the view named by $pos
                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
                # expand the %-escapes in the link template
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @items;
        foreach my $nav (@navs) {
                push @items, ($nav eq $current
                        ? $nav
                        : $cgi->a({-href => ($arg{$nav}{_href} || href(%{$arg{$nav}}))}, "$nav"));
        }

        print "<div class=\"page_nav\">\n" .
              join(" | ", @items);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4256
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes): the current view is plain text, the others are links, and
# the remotes view is present only if the 'remote_heads' feature is enabled
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @items;
        foreach my $view (@ref_views) {
                push @items, ($view eq $current
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view));
        }

        return join " | ", @items;
}
4269
# Return the "first - prev - next" paging navigation for page number
# $page; entries which do not apply (no previous page, no next page) are
# plain text instead of links.  The first argument is not used.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my $backward = "first &sdot; prev";
        if ($page > 0) {
                $backward =
                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
                        " &sdot; " .
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        my $forward = "next";
        if ($has_next_link) {
                $forward =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return $backward . " &sdot; " . $forward;
}
4295
4296## ......................................................................
4297## functions printing or outputting HTML: div
4298
# Print a "header" div holding a single link to the $action view.
# $hash and $hash_base are added to the link when true; the link text is
# $title, or $action when no title is given.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $text = $title ? $title : $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $text) .
              "\n</div>\n";
}
4312
# Return a "metadata_url" table row with $name in the first cell and
# $url in the second one; both are inserted as given.
sub format_repo_url {
        my ($name, $url) = @_;

        return join('',
                '<tr class="metadata_url">',
                "<td>$name</td>",
                "<td>$url</td>",
                "</tr>\n");
}
4317
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed as *handle, \*handle,
# *handle{IO} or as a filehandle object, or a function reference. In the
# latter case all following parameters will be taken as argument to the
# content function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        # Recognize handles by their underlying type rather than by class
        # name: *handle{IO} is blessed into IO::File by newer perls, a
        # filehandle object is a blessed glob reference, and a bare *handle
        # is not a reference at all (but a reference to it is a GLOB ref).
        require Scalar::Util;
        my $reftype = Scalar::Util::reftype($content);
        my $is_handle =
                (defined $reftype && ($reftype eq 'GLOB' || $reftype eq 'IO'))
                || ref(\$content) eq 'GLOB';

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4355
# Format a parsed date (hash reference) as HTML: the RFC 2822 date,
# wrapped in a span when the 'javascript-timezone' feature provides a
# class name, followed by the local time in parentheses.  Local times
# before 6:00 are marked with the "atnight" class.
sub format_timestamp_html {
        my $date = shift;

        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');
        my $strtime = $datetime_class
                ? qq!<span class="$datetime_class">$date->{'rfc2822'}</span>!
                : $date->{'rfc2822'};

        my $localtime_format = ($date->{'hour_local'} < 6)
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';
        my $localtime = sprintf($localtime_format,
                                $date->{'hour_local'},
                                $date->{'minute_local'},
                                $date->{'tz_local'});

        return $strtime . ' ' . $localtime;
}
4376
# Print the author name (as author search link), the author date and the
# avatar of commit $co, wrapped in an "author_date" element.
# The element is a <div> unless another tag is given with the -tag option.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} ? $opts{-tag} : 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $author_link =
                format_search_author($author, "author", esc_html($author));
        my $timestamp = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_link .
              " [" . $timestamp . "]" .
              $avatar .
              "</$tag>\n";
}
4391
# Print table rows with the full author and/or committer information,
# in the format expected for 'commit' view (& similar).
# The first parameter is a commit hash reference; the remaining ones name
# the people to print ('author', 'committer').  Both are printed, in that
# order, when no names are given.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = qw(author committer) if !@people;

        for my $who (@people) {
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                # name and e-mail both link to a search for that person
                my $name_link =
                        format_search_author($co->{"${who}_name"}, $who,
                                             esc_html($co->{"${who}_name"}));
                my $email_link =
                        format_search_author($co->{"${who}_email"}, $who,
                                             esc_html("<" . $co->{"${who}_email"} . ">"));
                my $avatar =
                        git_get_avatar($co->{"${who}_email"}, -size => 'double');
                my $timestamp = format_timestamp_html(\%wd);

                # the avatar cell spans both the name row and the date row
                print "<tr><td>$who</td><td>" .
                      $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $timestamp .
                      "</td>" .
                      "</tr>\n";
        }
}
4419
# Print the "page_path" div: a link to the tree root followed by the
# path $name, with every leading directory linked to its 'tree' view.
# Parameters:
#   $name - path of the object within the tree (may be undefined)
#   $type - 'blob' or 'tree' to make the last component a link
#           ('blob_plain' or 'tree' view respectively); with any other
#           value the last component is printed as plain text
#   $hb   - hash base used for all generated links
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth value: a leading
                        # directory named "0" must get its separator as well
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # links point to the path given as parameter ($name), so that
                # link target, title and link text always agree
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4457
# Print the lines of a commit message as HTML.
# $log is a reference to the array of lines; note that the title line
# (with -remove_title) and leading empty lines are removed from that
# array itself.
# Options:
#   -remove_title     - drop the first line of the log
#   -remove_signoff   - do not print signoff-like lines
#                       (Signed-off-by, Acked-by, Cc)
#   -final_empty_line - end the output with a single empty line
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $after_signoff = 0; # previous non-skipped line was a signoff
        my $empty = 0;         # previous printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $after_signoff = 1;
                        $empty = 0;
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                        }
                        # signoff lines are either printed above or removed
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                # (the signoff state is deliberately kept until the next
                # non-empty line; resetting it before this check would make
                # the second rule impossible to trigger)
                if ($line eq "") {
                        next if ($empty || $after_signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                }
                $after_signoff = 0;

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4506
# return link target (what link points to), i.e. the whole contents of
# the blob $hash; return nothing if the git command cannot be started or
# closing its pipe fails
sub git_get_link_target {
        my $hash = shift;

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;

        # slurp the complete output at once
        my $link_target = do {
                local $/ = undef;
                <$fd>;
        };

        return unless close $fd;
        return $link_target;
}
4524
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# Empty and '.' path components are dropped and '..' components are
# resolved; a target leading outside of the top directory cannot be
# normalized.  An undefined or empty basedir denotes the top directory.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # basedir is tested by length, so that a directory named "0"
        # is not mistaken for the top directory
        my $path = (defined $basedir && length($basedir))
                ? $basedir . '/' . $link_target
                : $link_target;

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' (but keep names like "0", which are
                # false in boolean context)
                next if ($part eq '' || $part eq '.');

                if ($part ne '..') {
                        push @path_parts, $part;
                        next;
                }
                # handle '..': without a parent to go back to, the link
                # leads outside repository (outside top dir)
                return unless @path_parts;
                pop @path_parts;
        }

        return join('/', @path_parts);
}
4564
# Print one tree entry (a row of git_tree), but without the encompassing
# <tr> element.
#
# $t          - hashref describing the entry; the keys 'mode', 'type', 'name'
#               and 'hash' are read, and 'size' if it exists
# $basedir    - string prepended as-is to the entry name to form the
#               file_name of the generated links
# $hash_base  - passed as hash_base to the generated links; "history" links
#               are printed only if it is defined
# $have_blame - if true, blobs get a "blame" link
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my $path = "$basedir$t->{'name'}";
        # hash_base is passed along to blob/tree/blame links only if we have one
        my @base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
        # action links of the entry; shown in the last cell, joined with " | "
        my @links;

        # The format of a table row is: mode list link.  Where mode is
        # the mode of the entry, list is the name of the entry, an href,
        # and link is the action links of the entry.

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        if ($t->{'type'} eq "blob") {
                my @blob = (action=>"blob", hash=>$t->{'hash'},
                            file_name=>$path, @base_key);

                print "<td class=\"list\">" .
                      $cgi->a({-href => href(@blob), -class => "list"},
                              esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        # symbolic link: show its target, as a link whenever
                        # the target could be normalized to a path
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                print " -> " . (defined($norm_target)
                                        ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                 file_name=>$norm_target),
                                                   -title => $norm_target}, esc_path($link_target))
                                        : esc_path($link_target));
                        }
                }
                print "</td>\n";

                push @links, $cgi->a({-href => href(@blob)}, "blob");
                push @links, $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                    file_name=>$path, @base_key)},
                                     "blame")
                        if $have_blame;
                push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                    hash=>$t->{'hash'}, file_name=>$path)},
                                     "history")
                        if defined $hash_base;
                # the "raw" link is always there, with or without hash_base
                push @links, $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                                    file_name=>$path)},
                                     "raw");

        } elsif ($t->{'type'} eq "tree") {
                my @tree = (action=>"tree", hash=>$t->{'hash'},
                            file_name=>$path, @base_key);

                print "<td class=\"list\">" .
                      $cgi->a({-href => href(@tree)}, esc_path($t->{'name'})) .
                      "</td>\n";

                push @links, $cgi->a({-href => href(@tree)}, "tree");
                push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                    file_name=>$path)},
                                     "history")
                        if defined $hash_base;

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";

                push @links, $cgi->a({-href => href(action=>"history",
                                                    hash_base=>$hash_base,
                                                    file_name=>$path)},
                                     "history")
                        if defined $hash_base;
        }

        print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";
}
4657
4658## ......................................................................
4659## functions printing large fragments of HTML
4660
# Get pre-image filenames for a merge (combined) diff.
#
# $diff    - hashref of a parsed combined raw diff line; its 'nparents',
#            'status' and 'from_id' entries are read, and 'from_file' is
#            replaced by a fresh list
# @parents - per-parent values handed to git_get_path_by_hash(), indexed
#            like 'status' and 'from_id'
#
# The new 'from_file' list has one slot per parent.  Only the slots of
# parents with status R (rename) or C (copy) are looked up; all the others
# stay undefined.  Returns $diff itself.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $from_file = $diff->{'from_file'} = [ ];
        # touch the last slot so that the list has one entry per parent
        $from_file->[$diff->{'nparents'} - 1] = undef;

        foreach my $i (0 .. $diff->{'nparents'} - 1) {
                next unless $diff->{'status'}[$i] =~ m/\A[RC]\z/;

                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4677
# Tell whether a parsed raw difftree line describes a file deletion, i.e.
# whether its post-image object id ('to_id') is the all-zero null id.
#
# $diffinfo - hashref of parsed raw diff format; only 'to_id' is read
#
# Both widths of the null id are recognized: 40 hex digits (SHA-1) and
# 64 hex digits (SHA-256).  Returns a true value for a deletion and a false
# one otherwise.
sub is_deleted {
        my $diffinfo = shift;

        my $to_id = $diffinfo->{'to_id'};
        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4684
# Does the patch correspond to the [previous] difftree raw line?
# (git_patchset_body uses it to recognize the continuation of a split patch.)
#
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
#
# The answer is true only when both hashrefs are defined and their 'to_file'
# entries are equal as strings.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_given = defined($diffinfo) && defined($patchinfo);

        return $both_given
                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4695
4696
# Print the list of files changed by a commit as an HTML table ("difftree").
#
# $difftree - arrayref of raw diff lines; each of them is parsed with
#             parsed_difftree_line()
# $hash     - used as hash_base of links to the post-image side of a change
# @parents  - with more than one element the table is printed as a combined
#             diff; the first element is used as hash_base of links to the
#             pre-image side of an ordinary diff
#
# Uses the globals $cgi and $action.  In the 'commitdiff' view every row gets
# a link to the "patchN" anchor, where N counts the printed rows from 1; in
# other views modified, renamed and copied files get a "diff" link instead
# (unless the contents did not change).
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        my $is_commitdiff = ($action eq 'commitdiff');

        # plain action link: <a href="...">$text</a>
        my $link = sub {
                my ($text, @params) = @_;
                return $cgi->a({-href => href(@params)}, $text);
        };
        # link with (escaped) file name as its text, of "list" class
        my $file_link = sub {
                my ($name, @params) = @_;
                return $cgi->a({-href => href(@params), -class => "list"},
                               esc_path($name));
        };
        # link to the next patch on the page; each call advances the counter
        my $patchno = 0;
        my $patch_link = sub {
                $patchno++;
                return $link->("patch", -anchor=>"patch$patchno");
        };
        # last cell of an ordinary row: action links separated by " | "
        my $print_links = sub {
                print "<td class=\"link\">" . join(" | ", @_) . "</td>\n";
        };

        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $is_commitdiff;
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                foreach my $i (0 .. $#parents) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1;
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        my @to_blob = (action=>"blob", hash=>$diff->{'to_id'},
                                       file_name=>$diff->{'to_file'},
                                       hash_base=>$hash);

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $file_link->($diff->{'to_file'}, @to_blob) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($is_commitdiff) {
                                # link to patch
                                print "<td class=\"link\">" .
                                      $patch_link->() .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent
                        my $has_history = 0;
                        my $not_deleted = 0;
                        foreach my $i (0 .. $diff->{'nparents'} - 1) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $link->("blob" . ($i+1),
                                                      action=>"blob",
                                                      hash_base=>$hash,
                                                      hash=>$from_hash,
                                                      file_name=>$from_path) .
                                              " | </td>\n";
                                } else {
                                        # mark parents the result is identical to
                                        my $class = ($diff->{'to_id'} eq $from_hash)
                                                ? "link nochange" : "link";
                                        print "<td class=\"$class\">" .
                                              $link->("diff" . ($i+1),
                                                      action=>"blobdiff",
                                                      hash=>$diff->{'to_id'},
                                                      hash_parent=>$from_hash,
                                                      hash_base=>$hash,
                                                      hash_parent_base=>$hash_parent,
                                                      file_name=>$diff->{'to_file'},
                                                      file_parent=>$from_path) .
                                              " | </td>\n";
                                }
                        }

                        my @links;
                        push @links, $link->("blob", action=>"blob",
                                             hash=>$diff->{'to_id'},
                                             file_name=>$diff->{'to_file'},
                                             hash_base=>$hash)
                                if $not_deleted;
                        push @links, $link->("history", action=>"history",
                                             file_name=>$diff->{'to_file'},
                                             hash_base=>$hash)
                                if $has_history;
                        $print_links->(@links);

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                my $status = $diff->{'status'};
                my @links;

                if ($status eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";

                        my @blob = (action=>"blob", hash=>$diff->{'to_id'},
                                    hash_base=>$hash, file_name=>$diff->{'file'});

                        print "<td>" . $file_link->($diff->{'file'}, @blob) . "</td>\n";
                        print "<td>$mode_chng</td>\n";

                        push @links, $patch_link->() if $is_commitdiff;
                        push @links, $link->("blob", @blob);
                        $print_links->(@links);

                } elsif ($status eq "D") { # deleted
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";

                        # the file is there only in the parent
                        my @blob = (action=>"blob", hash=>$diff->{'from_id'},
                                    hash_base=>$parent, file_name=>$diff->{'file'});

                        print "<td>" . $file_link->($diff->{'file'}, @blob) . "</td>\n";
                        print "<td>$mode_chng</td>\n";

                        push @links, $patch_link->() if $is_commitdiff;
                        push @links, $link->("blob", @blob);
                        push @links, $link->("blame", action=>"blame", hash_base=>$parent,
                                             file_name=>$diff->{'file'})
                                if $have_blame;
                        push @links, $link->("history", action=>"history", hash_base=>$parent,
                                             file_name=>$diff->{'file'});
                        $print_links->(@links);

                } elsif ($status eq "M" || $status eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }

                        my @blob = (action=>"blob", hash=>$diff->{'to_id'},
                                    hash_base=>$hash, file_name=>$diff->{'file'});

                        print "<td>" . $file_link->($diff->{'file'}, @blob) . "</td>\n";
                        print "<td>$mode_chnge</td>\n";

                        if ($is_commitdiff) {
                                push @links, $patch_link->();
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                push @links, $link->("diff", action=>"blobdiff",
                                                     hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                     hash_base=>$hash, hash_parent_base=>$parent,
                                                     file_name=>$diff->{'file'});
                        }
                        push @links, $link->("blob", @blob);
                        push @links, $link->("blame", action=>"blame", hash_base=>$hash,
                                             file_name=>$diff->{'file'})
                                if $have_blame;
                        push @links, $link->("history", action=>"history", hash_base=>$hash,
                                             file_name=>$diff->{'file'});
                        $print_links->(@links);

                } elsif ($status eq "R" || $status eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$status};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }

                        # The post-image lives under its new name in $hash; it
                        # need not exist under that name in $parent, so every
                        # link to it (the "blob" one included) is based on $hash.
                        my @to_blob = (action=>"blob", hash_base=>$hash,
                                       hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'});
                        my @from_blob = (action=>"blob", hash_base=>$parent,
                                         hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'});

                        print "<td>" .
                              $file_link->($diff->{'to_file'}, @to_blob) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $file_link->($diff->{'from_file'}, @from_blob) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n";

                        if ($is_commitdiff) {
                                push @links, $patch_link->();
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                push @links, $link->("diff", action=>"blobdiff",
                                                     hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                     hash_base=>$hash, hash_parent_base=>$parent,
                                                     file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'});
                        }
                        push @links, $link->("blob", @to_blob);
                        push @links, $link->("blame", action=>"blame", hash_base=>$hash,
                                             file_name=>$diff->{'to_file'})
                                if $have_blame;
                        push @links, $link->("history", action=>"history", hash_base=>$hash,
                                             file_name=>$diff->{'to_file'});
                        $print_links->(@links);

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
5004
# Print context lines and then rem/add lines in a side-by-side manner.
#
# $ctx, $rem, $add - arrayrefs with context, removed and added lines; the
#                    lines are printed as they are
#
# Context lines, if there are any, come first and are shown in both the
# "old" and the "new" column.  Then exactly one block is printed for the
# change itself: "rem" if there are no added lines (even if there are no
# removed lines either), "add" if there are only added lines, and "chg" with
# both columns otherwise.
sub print_sidebyside_diff_lines {
        my ($ctx, $rem, $add) = @_;

        # one column: lines wrapped in <div class="old"> or <div class="new">
        my $column = sub {
                my ($side, $lines) = @_;
                return ("<div class=\"$side\">", @$lines, '</div>');
        };
        # whole block: columns wrapped in <div class="chunk_block KIND">
        my $block = sub {
                my ($kind, @columns) = @_;
                return join('', "<div class=\"chunk_block $kind\">", @columns, '</div>');
        };

        # print context block before add/rem block
        if (@$ctx) {
                my $html = $block->('ctx', $column->('old', $ctx), $column->('new', $ctx));
                print $html;
        }

        my $html;
        if (!@$add) {
                # pure removal
                $html = $block->('rem', $column->('old', $rem));
        } elsif (!@$rem) {
                # pure addition
                $html = $block->('add', $column->('new', $add));
        } else {
                # change: removed lines on the left, added ones on the right
                $html = $block->('chg', $column->('old', $rem), $column->('new', $add));
        }
        print $html;
}
5050
# Print context lines and then rem/add lines in inline manner.
#
# $ctx, $rem, $add - arrayrefs with context, removed and added lines; all the
#                    lines are printed as they are, in exactly that order
sub print_inline_diff_lines {
        my ($ctx, $rem, $add) = @_;

        my @lines = (@$ctx, @$rem, @$add);
        print @lines;
}
5057
# Print context lines and then rem/add lines, in the requested diff style.
#
# $ctx, $rem, $add - arrayrefs of lines, handed over to the chosen printer
# $diff_style      - 'sidebyside' selects the side-by-side printer
# $is_combined     - if true, the inline printer is used whatever the style
#
# The default 'inline' style and unknown styles also use the inline printer.
sub print_diff_lines {
        my ($ctx, $rem, $add, $diff_style, $is_combined) = @_;

        my $printer = ($diff_style eq 'sidebyside' && !$is_combined)
                ? \&print_sidebyside_diff_lines
                : \&print_inline_diff_lines;

        return $printer->($ctx, $rem, $add);
}
5069
# Print one chunk of a diff, given as a list of [ class, line ] pairs.
#
# $diff_style, $is_combined - handed over to print_diff_lines()
# @chunk                    - arrayrefs of the form [ class, line ]
#
# Lines of 'chunk_header' class are printed right away.  'ctx', 'rem' and
# 'add' lines are collected and printed in groups with print_diff_lines();
# lines of any other class are not collected.  An 'incomplete' entry (except
# for the very first one) gets the class of the entry before it; this
# overwrites the class stored in the pair itself.
sub print_diff_chunk {
        my ($diff_style, $is_combined, @chunk) = @_;

        # the class of the previous line
        my $prev_class = '';

        return unless @chunk;

        # accumulated lines, by class
        my %acc = ('ctx' => [], 'rem' => [], 'add' => []);
        my $flush = sub {
                print_diff_lines($acc{'ctx'}, $acc{'rem'}, $acc{'add'},
                                 $diff_style, $is_combined);
                @$_ = () foreach @acc{qw(ctx rem add)};
        };

        # incomplete last line might be among removed or added lines,
        # or both, or among context lines: find which
        foreach my $i (1 .. $#chunk) {
                $chunk[$i][0] = $chunk[$i-1][0]
                        if $chunk[$i][0] eq 'incomplete';
        }

        # the empty pair at the end is a guardian: it flushes whatever
        # is still in the accumulator and then ends the loop
        foreach my $line_info (@chunk, ["", ""]) {
                my ($class, $line) = @$line_info;

                # print chunk headers
                if ($class && $class eq 'chunk_header') {
                        print $line;
                        next;
                }

                ## print from accumulator when have some add/rem lines or end
                # of chunk (flush context lines), or when have add and rem
                # lines and new block is reached (otherwise add/rem lines could
                # be reordered)
                my $have_rem = @{$acc{'rem'}};
                my $have_add = @{$acc{'add'}};
                $flush->()
                        if (!$class
                            || (($have_rem || $have_add) && $class eq 'ctx')
                            || ($have_rem && $have_add && $class ne $prev_class));

                ## adding lines to accumulator
                # guardian value
                last unless $line;
                # rem, add or context line
                push @{$acc{$class}}, $line
                        if exists $acc{$class};

                $prev_class = $class;
        }
}
5127
5128sub git_patchset_body {
5129        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;
5130        my ($hash_parent) = $hash_parents[0];
5131
5132        my $is_combined = (@hash_parents > 1);
5133        my $patch_idx = 0;
5134        my $patch_number = 0;
5135        my $patch_line;
5136        my $diffinfo;
5137        my $to_name;
5138        my (%from, %to);
5139        my @chunk; # for side-by-side diff
5140
5141        print "<div class=\"patchset\">\n";
5142
5143        # skip to first patch
5144        while ($patch_line = <$fd>) {
5145                chomp $patch_line;
5146
5147                last if ($patch_line =~ m/^diff /);
5148        }
5149
5150 PATCH:
5151        while ($patch_line) {
5152
5153                # parse "git diff" header line
5154                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
5155                        # $1 is from_name, which we do not use
5156                        $to_name = unquote($2);
5157                        $to_name =~ s!^b/!!;
5158                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
5159                        # $1 is 'cc' or 'combined', which we do not use
5160                        $to_name = unquote($2);
5161                } else {
5162                        $to_name = undef;
5163                }
5164
5165                # check if current patch belong to current raw line
5166                # and parse raw git-diff line if needed
5167                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
5168                        # this is continuation of a split patch
5169                        print "<div class=\"patch cont\">\n";
5170                } else {
5171                        # advance raw git-diff output if needed
5172                        $patch_idx++ if defined $diffinfo;
5173
5174                        # read and prepare patch information
5175                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5176
5177                        # compact combined diff output can have some patches skipped
5178                        # find which patch (using pathname of result) we are at now;
5179                        if ($is_combined) {
5180                                while ($to_name ne $diffinfo->{'to_file'}) {
5181                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5182                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
5183                                              "</div>\n";  # class="patch"
5184
5185                                        $patch_idx++;
5186                                        $patch_number++;
5187
5188                                        last if $patch_idx > $#$difftree;
5189                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5190                                }
5191                        }
5192
5193                        # modifies %from, %to hashes
5194                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);
5195
5196                        # this is first patch for raw difftree line with $patch_idx index
5197                        # we index @$difftree array from 0, but number patches from 1
5198                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
5199                }
5200
5201                # git diff header
5202                #assert($patch_line =~ m/^diff /) if DEBUG;
5203                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
5204                $patch_number++;
5205                # print "git diff" header
5206                print format_git_diff_header_line($patch_line, $diffinfo,
5207                                                  \%from, \%to);
5208
5209                # print extended diff header
5210                print "<div class=\"diff extended_header\">\n";
5211        EXTENDED_HEADER:
5212                while ($patch_line = <$fd>) {
5213                        chomp $patch_line;
5214
5215                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);
5216
5217                        print format_extended_diff_header_line($patch_line, $diffinfo,
5218                                                               \%from, \%to);
5219                }
5220                print "</div>\n"; # class="diff extended_header"
5221
5222                # from-file/to-file diff header
5223                if (! $patch_line) {
5224                        print "</div>\n"; # class="patch"
5225                        last PATCH;
5226                }
5227                next PATCH if ($patch_line =~ m/^diff /);
5228                #assert($patch_line =~ m/^---/) if DEBUG;
5229
5230                my $last_patch_line = $patch_line;
5231                $patch_line = <$fd>;
5232                chomp $patch_line;
5233                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;
5234
5235                print format_diff_from_to_header($last_patch_line, $patch_line,
5236                                                 $diffinfo, \%from, \%to,
5237                                                 @hash_parents);
5238
5239                # the patch itself
5240        LINE:
5241                while ($patch_line = <$fd>) {
5242                        chomp $patch_line;
5243
5244                        next PATCH if ($patch_line =~ m/^diff /);
5245
5246                        my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
5247                        my $diff_classes = "diff";
5248                        $diff_classes .= " $class" if ($class);
5249                        $line = "<div class=\"$diff_classes\">$line</div>\n";
5250
5251                        if ($class eq 'chunk_header') {
5252                                print_diff_chunk($diff_style, $is_combined, @chunk);
5253                                @chunk = ();
5254                        }
5255
5256                        push @chunk, [ $class, $line ];
5257                }
5258
5259        } continue {
5260                if (@chunk) {
5261                        print_diff_chunk($diff_style, $is_combined, @chunk);
5262                        @chunk = ();
5263                }
5264                print "</div>\n"; # class="patch"
5265        }
5266
5267        # for compact combined (--cc) format, with chunk and patch simplification
5268        # the patchset might be empty, but there might be unprocessed raw lines
5269        for (++$patch_idx if $patch_number > 0;
5270             $patch_idx < @$difftree;
5271             ++$patch_idx) {
5272                # read and prepare patch information
5273                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5274
5275                # generate anchor for "patch" links in difftree / whatchanged part
5276                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5277                      format_diff_cc_simplified($diffinfo, @hash_parents) .
5278                      "</div>\n";  # class="patch"
5279
5280                $patch_number++;
5281        }
5282
5283        if ($patch_number == 0) {
5284                if (@hash_parents > 1) {
5285                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
5286                } else {
5287                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
5288                }
5289        }
5290
5291        print "</div>\n"; # class="patchset"
5292}
5293
5294# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5295
# Print the search form displayed together with the list of projects.
#
# Parameters:
#   $searchtext        - initial contents of the search text field
#   $search_use_regexp - whether the 're' checkbox is rendered checked
#
# Uses the global $project_filter: when it is true, the text field tooltip
# and the "List all projects" link mention the filtered directory; whenever
# it is defined, it is passed along as the hidden 'pf' form parameter.
sub git_project_search_form {
        my ($searchtext, $search_use_regexp) = @_;

        my $limit = '';
        if ($project_filter) {
                $limit = " in '$project_filter/'";
        }

        print "<div class=\"projsearch\">\n";
        # start_form() is the supported name; the old startform() alias is
        # deprecated and not provided by recent CGI.pm releases
        print $cgi->start_form(-method => 'get', -action => $my_uri) .
              $cgi->hidden(-name => 'a', -value => 'project_list')  . "\n";
        print $cgi->hidden(-name => 'pf', -value => $project_filter). "\n"
                if (defined $project_filter);
        print $cgi->textfield(-name => 's', -value => $searchtext,
                              -title => "Search project by name and description$limit",
                              -size => 60) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>\n" .
              $cgi->submit(-name => 'btnS', -value => 'Search') .
              $cgi->end_form() . "\n" .
              # link resetting the search (but keeping the project filter)
              $cgi->a({-href => href(project => undef, searchtext => undef,
                                     project_filter => $project_filter)},
                      esc_html("List all projects$limit")) . "<br />\n";
        print "</div>\n";
}
5323
# Tell whether %$project_info lacks any of the given @keys.
#
# Returns 1 as soon as at least one key does not exist in the hash
# (a key that exists with an undefined value counts as present), and an
# empty list / undef when all keys exist or no keys were given.
sub project_info_needs_filling {
        my ($project_info, @keys) = @_;

        # grep in boolean context: true if any key is absent
        return 1
                if grep { !exists $project_info->{$_} } @keys;
        return;
}
5337
# Fill in missing project information (age, description, owner, ctags,
# category) for each project in @$projlist, and return the list of
# projects that made it through.
#
# With no @wanted_keys every field is considered; otherwise only the
# listed fields are filled.  A field is (re)computed only if its key does
# not exist yet in the project hash.
#
# A project is dropped from the returned list only when 'age' or
# 'age_string' has to be filled and git_get_last_activity() returns
# nothing for it; none of the other fields can cause a project to be
# skipped.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   makes sure that 'descr_long' and 'ctags' are filled
# * @project_list = fill_project_list_info(\@project_list)
#   makes sure that all fields are filled (and invalid projects removed)
#
# NOTE: the project hashes referenced from $projlist are modified in
# place, but no entry is removed from @$projlist itself.
sub fill_project_list_info {
        my ($projlist, @wanted_keys) = @_;

        # $filter_set->(@fields) narrows @fields down to the requested ones;
        # it is the identity when the caller did not restrict the fields
        my %is_wanted = map { $_ => 1 } @wanted_keys;
        my $filter_set = @wanted_keys
                ? sub { return grep { $is_wanted{$_} } @_; }
                : sub { return @_; };

        my $show_ctags = gitweb_check_feature('ctags');
        my @filled;

 PROJECT:
        foreach my $pr (@$projlist) {
                if (project_info_needs_filling($pr, $filter_set->('age', 'age_string'))) {
                        my @activity = git_get_last_activity($pr->{'path'});
                        # nothing returned: leave this project out of the result
                        next PROJECT unless @activity;
                        ($pr->{'age'}, $pr->{'age_string'}) = @activity;
                }

                if (project_info_needs_filling($pr, $filter_set->('descr', 'descr_long'))) {
                        my $descr = to_utf8(git_get_project_description($pr->{'path'}) || "");
                        $pr->{'descr_long'} = $descr;
                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }

                if (project_info_needs_filling($pr, $filter_set->('owner'))) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }

                # ctags are looked up only when the 'ctags' feature is enabled
                if ($show_ctags &&
                    project_info_needs_filling($pr, $filter_set->('ctags'))) {
                        $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
                }

                # category is looked up only when projects are grouped by category
                if ($projects_list_group_categories &&
                    project_info_needs_filling($pr, $filter_set->('category'))) {
                        $pr->{'category'} =
                                to_utf8(git_get_project_category($pr->{'path'}) ||
                                        $project_list_default_category);
                }

                push @filled, $pr;
        }

        return @filled;
}
5398
# Return the projects of @$projlist sorted according to $order.
#
# Parameters:
#   $projlist - reference to list of project hashes
#   $order    - one of 'project', 'descr', 'owner' (string comparison of
#               the 'path', 'descr_long', 'owner' fields respectively)
#               or 'age' (numeric comparison of the 'age' field)
#
# An unknown or undefined $order returns the list in its original order.
# When sorting numerically, projects whose value is undefined are put
# last instead of being compared as if they were 0.
sub sort_projects_list {
        my ($projlist, $order) = @_;
        my @projects;

        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );
        my $oi = defined $order ? $order_info{$order} : undef;
        return @$projlist unless defined $oi;

        my $key = $oi->{'key'};
        if ($oi->{'type'} eq 'str') {
                @projects = sort { $a->{$key} cmp $b->{$key} } @$projlist;
        } else {
                # numeric sort; undefined values would warn under <=> and
                # compare as 0, so handle them explicitly and sort them last
                @projects = sort {
                        my ($x, $y) = ($a->{$key}, $b->{$key});
                          (defined $x && defined $y) ? $x <=> $y
                        : defined $x                 ? -1
                        : defined $y                 ?  1
                        :                               0;
                } @$projlist;
        }

        return @projects;
}
5419
# Group projects $from..$to of @$projlist by their 'category' field.
#
# $from defaults to 0; $to defaults to (and is clamped to) the last index
# of the list.  The result maps each category name to a reference to the
# list of its projects, in the order they appear in @$projlist.  It is
# returned as a hash in list context and as a hash reference otherwise.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#$projlist;
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        my %categories;
        foreach my $idx ($from .. $to) {
                my $project = $projlist->[$idx];
                my $category = $project->{'category'};
                push @{ $categories{$category} }, $project;
        }

        return %categories if wantarray;
        return \%categories;
}
5436
# Print the 'sort by' <th> element produced by format_sort_th() for the
# given column name, current order and (optional) header text.
sub print_sort_th {
        my ($name, $order, $header) = @_;

        print format_sort_th($name, $order, $header);
}
5442
# Return the 'sort by' <th> element for column $name.
#
# $header is the text of the header cell; it defaults to $name with its
# first letter uppercased.  If the list is already ordered by $name the
# cell is plain text, otherwise it holds a link that replays the current
# request with order=$name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header = ucfirst($name) unless $header;

        # this is the active sort column: nothing to link to
        return "<th>$header</th>\n"
                if $order eq $name;

        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
5459
# Print one table row (<tr>) per project for entries $from..$to of
# @$projlist.
#
# $from defaults to 0; $to defaults to (and is clamped to) the last index.
# Rows alternate between the "dark" and "light" classes, starting with
# "dark".  If $check_forks is true each row starts with an extra cell,
# which holds a "+" marker for projects that have a 'forks' entry.
# Uses the global $search_regexp to highlight matches in project path and
# description.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#$projlist;
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        my $dark = 1;
        foreach my $i ($from .. $to) {
                my $pr = $projlist->[$i];
                my $path = $pr->{'path'};

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                if ($check_forks) {
                        print "<td>";
                        if (my $forks = $pr->{'forks'}) {
                                my $nforks = scalar @$forks;
                                my $title = "$nforks forks";
                                if ($nforks > 0) {
                                        # marker links to the list of forks
                                        print $cgi->a({-href => href(project=>$path, action=>"forks"),
                                                       -title => $title}, "+");
                                } else {
                                        print $cgi->span({-title => $title}, "+");
                                }
                        }
                        print "</td>\n";
                }

                # project name, description and owner cells
                print "<td>" . $cgi->a({-href => href(project=>$path, action=>"summary"),
                                        -class => "list"},
                                       esc_html_match_hl($path, $search_regexp)) .
                      "</td>\n" .
                      "<td>" . $cgi->a({-href => href(project=>$path, action=>"summary"),
                                        -class => "list",
                                        -title => $pr->{'descr_long'}},
                                        $search_regexp
                                        ? esc_html_match_hl_chopped($pr->{'descr_long'},
                                                                    $pr->{'descr'}, $search_regexp)
                                        : esc_html($pr->{'descr'})) .
                      "</td>\n" .
                      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";

                # per-project action links; "forks" only if project has 'forks' entry
                my @links;
                foreach my $action (qw(summary shortlog log tree)) {
                        push @links, $cgi->a({-href => href(project=>$path, action=>$action)}, $action);
                }
                if ($pr->{'forks'}) {
                        push @links, $cgi->a({-href => href(project=>$path, action=>"forks")}, "forks");
                }

                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                print "<td class=\"". age_class($pr->{'age'}) . "\">" .
                      $age_text . "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links) .
                      "</td>\n" .
                      "</tr>\n";
        }
}
5515
# Print the table of projects, preceded by the tag cloud when the 'ctags'
# feature is enabled.
#
# Parameters:
#   $projlist  - reference to list of project hashes
#   $order     - sort order, see sort_projects_list();
#                defaults to $default_projects_order
#   $from, $to - inclusive window of entries to show, counted in the
#                filtered and sorted list; defaults to the whole list
#   $extra     - if defined, HTML printed verbatim in an additional last row
#   $no_header - if true, the row with column headers is not printed
#
# Uses the globals $search_regexp and $input_params{'ctag'} to narrow down
# the list; the fork marker column is disabled while either is in effect.
# If nothing is left to show, a "No such projects found" note is printed
# instead of the table.
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
        $check_forks = undef
                if ($tagfilter || $search_regexp);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        # search_projects_list pre-fills required info
        @projects = search_projects_list(\@projects,
                                         'search_regexp' => $search_regexp,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $search_regexp);
        # fill the rest
        @projects = fill_project_list_info(\@projects);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds just the window, re-indexed from 0, so
                # group all of it; passing $from and $to once more would drop
                # the first $from projects of the window
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects in the unnamed category get no category header row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5603
# Print commits $from..$to of @$commitlist in the long ("log") format:
# for each commit a header with age and title, navigation links,
# authorship information and the full commit message.
#
# Parameters:
#   $commitlist - reference to list of parsed commits (hash references)
#   $from, $to  - inclusive window of entries to print; $from defaults
#                 to 0, $to defaults to (and is clamped to) the last index
#   $refs       - passed to format_ref_marker() to decorate commit titles
#   $extra      - if true, HTML printed verbatim in a trailing "page_nav" div
#
# Entries that are empty hashes are skipped.
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from (not at 0), like the other *_body subroutines do
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5642
# Print commits $from..$to of @$commitlist as rows of the "shortlog"
# table: date (with age as tooltip), author, subject with ref markers,
# and commit / commitdiff / tree links plus snapshot links if
# format_snapshot_links() returns any.
#
# $from defaults to 0; $to defaults to (and is clamped to) the last index.
# A defined $extra is printed verbatim in an additional last row.
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#{$commitlist};
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"shortlog\">\n";
        my $dark = 1;
        foreach my $i ($from .. $to) {
                my %co = %{$commitlist->[$i]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between "dark" and "light", starting with "dark"
                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $links = join(" | ",
                        $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
                        $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree"));
                my $snapshot_links = format_snapshot_links($commit);
                $links .= " | " . $snapshot_links
                        if defined $snapshot_links;

                print "</td>\n" .
                      "<td class=\"link\">" .
                      $links .
                      "</td>\n" .
                      "</tr>\n";
        }

        print "<tr>\n" .
              "<td colspan=\"4\">$extra</td>\n" .
              "</tr>\n"
                if defined $extra;
        print "</table>\n";
}
5686
# Print commits $from..$to of @$commitlist as rows of the "history" table
# of a single file or directory.
#
# Parameters:
#   $commitlist - reference to list of parsed commits (hash references)
#   $from, $to  - inclusive window; $from defaults to 0, $to defaults to
#                 (and is clamped to) the last index
#   $refs       - passed to format_ref_marker()
#   $extra      - if defined, HTML printed verbatim in an additional last row
#   $file_name  - path the history is shown for
#   $file_hash  - hash of the current version, used for "diff to current"
#   $ftype      - type of the path; used as action name of the first link
#
# Entries that are empty hashes are skipped.  For blobs a "diff to current"
# link is added when the blob at the given commit differs from $file_hash;
# that link also uses the global $hash_base.
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        $from = 0 unless defined $from;
        if (!defined $to || $to > $#{$commitlist}) {
                $to = $#{$commitlist};
        }

        print "<table class=\"history\">\n";
        my $dark = 1;
        foreach my $i ($from .. $to) {
                my %co = %{$commitlist->[$i]};
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between "dark" and "light", starting with "dark"
                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
        # shortlog:   format_author_html('td', \%co, 10)
                      format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $type_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $type_link . " | " . $diff_link;

                if ($ftype eq 'blob') {
                        my $blob_parent = git_get_hash_by_path($commit, $file_name);
                        # offer a diff only if both versions are known and differ
                        if (defined $file_hash && defined $blob_parent &&
                            $file_hash ne $blob_parent) {
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$file_hash, hash_parent=>$blob_parent,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }

        print "<tr>\n" .
              "<td colspan=\"4\">$extra</td>\n" .
              "</tr>\n"
                if defined $extra;
        print "</table>\n";
}
5746
# Print entries $from..$to of @$taglist as rows of the "tags" table:
# age, tag name (linking to the tagged object), subject of the tag if it
# has one, a "tag" self-link for tag objects, and links depending on the
# type of the tagged object.
#
# $from defaults to 0; $to defaults to (and is clamped to) the last index.
# A defined $extra is printed verbatim in an additional last row.
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#{$taglist};
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"tags\">\n";
        my $dark = 1;
        foreach my $i ($from .. $to) {
                my %tag = %{ $taglist->[$i] };
                my $comment = $tag{'subject'};
                my $comment_short;
                $comment_short = chop_str($comment, 30, 5)
                        if defined $comment;

                # rows alternate between "dark" and "light", starting with "dark"
                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                my $age_cell = defined $tag{'age'}
                        ? "<td><i>$tag{'age'}</i></td>\n"
                        : "<td></td>\n";
                print $age_cell;

                print "<td>" .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                               -class => "list name"}, esc_html($tag{'name'})) .
                      "</td>\n" .
                      "<td>";
                print format_subject_html($comment, $comment_short,
                                          href(action=>"tag", hash=>$tag{'id'}))
                        if defined $comment;
                print "</td>\n" .
                      "<td class=\"selflink\">";

                # only tag objects have a page of their own
                if ($tag{'type'} eq "tag") {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                } else {
                        print "&nbsp;";
                }

                print "</td>\n" .
                      "<td class=\"link\">" . " | " .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
                if ($tag{'reftype'} eq "commit") {
                        print " | " . $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog") .
                              " | " . $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                } elsif ($tag{'reftype'} eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "</tr>";
        }

        print "<tr>\n" .
              "<td colspan=\"5\">$extra</td>\n" .
              "</tr>\n"
                if defined $extra;
        print "</table>\n";
}
5809
# Print entries $from..$to of @$headlist as rows of the "heads" table:
# age, head name (linking to its shortlog) and shortlog / log / tree links.
#
# The name cell of a head whose 'id' equals $head_at (when that is
# defined) gets the "current_head" class.  $from defaults to 0; $to
# defaults to (and is clamped to) the last index.  A defined $extra is
# printed verbatim in an additional last row.
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head_at, $from, $to, $extra) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#{$headlist};
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"heads\">\n";
        my $dark = 1;
        foreach my $i ($from .. $to) {
                my %ref = %{ $headlist->[$i] };
                my $curr = defined $head_at && $ref{'id'} eq $head_at;

                # rows alternate between "dark" and "light", starting with "dark"
                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                my $name_td = $curr ? "<td class=\"current_head\">" : "<td>";
                my $fullname = $ref{'fullname'};
                print "<td><i>$ref{'age'}</i></td>\n" .
                      $name_td .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$fullname),
                               -class => "list name"},esc_html($ref{'name'})) .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$fullname)}, "shortlog") . " | " .
                      $cgi->a({-href => href(action=>"log", hash=>$fullname)}, "log") . " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$fullname, hash_base=>$fullname)}, "tree") .
                      "</td>\n" .
                      "</tr>";
        }

        print "<tr>\n" .
              "<td colspan=\"3\">$extra</td>\n" .
              "</tr>\n"
                if defined $extra;
        print "</table>\n";
}
5847
# Display a single remote block: a table with the URL(s) of the remote,
# followed by the list of its heads.
#
# Parameters:
#   $remote - name of the remote, used in the "..." link to the full list
#   $rdata  - hash reference with 'heads', 'fetch' and 'push' entries
#   $limit  - if defined, passed to git_heads_body() as the last index to
#             show; a "..." link is added when it is smaller than the
#             number of heads
#   $head   - passed to git_heads_body() to mark the current head
#
# A single "URL" row is shown when fetch and push URLs are both defined
# and equal; otherwise each defined URL gets its own row, and
# "No remote URL" is shown when neither is defined.
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # $push may be undefined here; check it before comparing to
                # avoid an "uninitialized value" warning
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        # link to the complete list of heads if not all of them are shown
        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5881
# Display a list of remote names with the respective fetch and push URLs
#
# Parameters:
#   $remotedata - hash ref mapping a remote name to a hash ref whose 'fetch'
#                 and 'push' entries hold the URLs (either may be undefined,
#                 in which case plain text is shown instead of a link)
#   $limit      - when true and smaller than the number of remotes, only the
#                 first $limit remotes (sorted by name) are listed, followed
#                 by a "..." link to the 'remotes' action
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        # truncate the sorted list to its first $limit entries
        $#remotes = $limit - 1 if $limited;

        # Iterate with foreach rather than "while (shift ...)": the latter ends
        # the loop early at a remote whose name is false in boolean context
        # (for example "0"), silently dropping it and everything after it.
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
5925
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
# Parameters:
#   $remotedata - hash ref keyed by remote name; handed to git_remotes_list
#                 or, after fill_remote_heads() has processed it, to
#                 git_remote_block one remote at a time
#   $limit      - when true and smaller than the number of remotes, only the
#                 names are listed; otherwise it is passed to git_remote_block
#   $head       - passed through to git_remote_block
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # Walk the remotes in sorted order (as git_remotes_list does)
                # so that the sections appear in a stable order, and so that
                # the loop does not depend on the hash's each() iterator
                # staying untouched while the section callbacks run.
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
5942
# Print one page of results for a search over commit messages, authors or
# committers (selected by $searchtype), starting from $hash.
#
# Takes the parsed commit as a flattened hash; its 'tree' and 'title'
# entries are used for the navigation bar and the page header.
# 101 commits are requested per page so that the presence of a 101st
# entry tells us whether a "next" link is needed.
sub git_search_message {
        my %co = @_;

        # option prefix for git, selected by the kind of search
        my $greptype =
                $searchtype eq 'commit'    ? "--grep=" :
                $searchtype eq 'author'    ? "--author=" :
                $searchtype eq 'committer' ? "--committer=" :
                                             undef;
        $greptype .= $searchtext;

        my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $match_mode);

        # "first" and "prev" are links only when we are past the first page
        my $paging_nav;
        if ($page > 0) {
                my $first_link =
                        $cgi->a({-href => href(-replay=>1, page=>undef)},
                                "first");
                my $prev_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
                $paging_nav = $first_link . " &sdot; " . $prev_link;
        } else {
                $paging_nav = "first &sdot; prev";
        }

        # "next" is a link only when the extra (101st) commit was returned
        my $has_more = @commitlist > 100;
        my $next_link = '';
        if ($has_more) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        $paging_nav .= $has_more ? " &sdot; $next_link" : " &sdot; next";

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);
        if (@commitlist || $page != 0) {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        } else {
                print "<p>No match.</p>\n";
        }

        git_footer_html();
}
5992
# Print the results of a "pickaxe" search: runs git-log with -S$searchtext
# (adding --pickaxe-regex when $search_use_regexp is set) and prints one
# table row per commit, listing the files reported for that commit.
#
# Takes the parsed commit as a flattened hash; its 'tree' and 'title'
# entries are used for the navigation bar and the page header. After the
# header is printed, %co is reused to hold the commit of the row being built.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                ($search_use_regexp ? '--pickaxe-regex' : ())
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $alternate = 1;
        undef %co;

        # Closes the file list cell of the commit currently held in %co and
        # prints its "commit | tree" links; a no-op before the first commit.
        my $finish_commit_row = sub {
                return unless %co;
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # a new commit starts: finish previous one, open a new row
                        $finish_commit_row->();

                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                      -class => "list subject"},
                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
                } elsif (defined $set{'to_id'}) {
                        # skip entries whose resulting blob is the null id
                        next if ($set{'to_id'} =~ m/^0{40}$/);

                        # The link below is built from 'to_file'; fall back to
                        # it for the label when 'file' is not set (presumably
                        # the case for renamed/copied entries -- the parser is
                        # defined elsewhere), instead of escaping undef.
                        my $shown_name = defined $set{'file'} ? $set{'file'} : $set{'to_file'};

                        print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                     hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                      -class => "list"},
                                      "<span class=\"match\">" . esc_path($shown_name) . "</span>") .
                              "<br/>\n";
                }
        }
        close $fd;

        # finish last commit
        $finish_commit_row->();

        print "</table>\n";

        git_footer_html();
}
6075
# Print the results of a search through file contents: runs git-grep on
# the commit's tree and prints one table row per file, with one line per
# match (or a "Binary file" note).
#
# Takes the parsed commit as a flattened hash; 'tree' selects what is
# searched, 'id' is used as hash_base of the blob links and 'title' for
# the page header. Output processing stops once the hard-coded limit on
# the number of git-grep output lines is exceeded.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $trimmed = 0; # set only when output lines were actually dropped
        my $lastfile = '';
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                if ($matches++ > 1000) {
                        $trimmed = 1;
                        last;
                }
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                }
                # File names are reported as "<tree>:<path>"; strip the prefix
                # for binary files too, so that their links get a usable
                # file_name. \Q..\E keeps the tree id from being read as regex.
                $file =~ s/^\Q$co{'tree'}\E://;

                if ($file ne $lastfile) {
                        # compare against '' so that a file named "0" still
                        # counts as "a row is open"
                        print "</td></tr>\n" if $lastfile ne '';
                        # toggle the flag as the other listings do; the former
                        # post-increment was always true, so rows never alternated
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # highlight the matched part of the line, if we can find it
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile ne '') {
                print "</td></tr>\n";
                if ($trimmed) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
6153
# Print the table of commits found by a commit message / author /
# committer search.
#
# Parameters:
#   $commitlist - array ref of parsed commits (hash refs)
#   $from, $to  - first and last index to print; $from defaults to 0,
#                 $to is clamped to the last index of the list
#   $extra      - optional HTML printed in an additional row at the end
# For each commit, the comment lines matching $search_regexp are shown
# with the match highlighted and a limited amount of context around it.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        my $last_index = $#{$commitlist};
        $to = $last_index unless (defined $to && $to <= $last_index);

        print "<table class=\"commit_search\">\n";
        my $alternate = 1;
        foreach my $i ($from .. $to) {
                my %co = %{$commitlist->[$i]};
                next unless %co;

                my $commit = $co{'id'};
                print $alternate ? "<tr class=\"dark\">\n" : "<tr class=\"light\">\n";
                $alternate ^= 1;

                # age, author and (linked) subject of the commit
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                # matching lines of the commit message, match highlighted
                my $comment = $co{'comment'};
                foreach my $line (@$comment) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;

                        my ($lead, $match, $trail) = ($1, $2, $3);
                        $match = chop_str($match, 70, 5, 'center');

                        # share what is left of 80 columns between both sides,
                        # but never more than 30 characters per side
                        my $contextlen = int((80 - length($match))/2);
                        if ($contextlen > 30) {
                                $contextlen = 30;
                        }
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        print esc_html($lead) .
                              "<span class=\"match\">" . esc_html($match) . "</span>" .
                              esc_html($trail) . "<br />";
                }

                # links column
                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
                my $commitdiff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$commit)}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $commit_link . " | " . $commitdiff_link . " | " . $tree_link;
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
6213
6214## ======================================================================
6215## ======================================================================
6216## actions
6217
# 'project_list' action: print the page listing the projects returned by
# git_get_projects_list(), optionally preceded by the contents of the
# $home_text file, together with the project search form.
#
# Fails with 400 for an unknown 'order' parameter and with 404 when no
# projects are found.
sub git_project_list {
        my $order = $input_params{'order'};
        # The pattern is anchored so that only the exact known names are
        # accepted; unanchored, any value merely containing one of them
        # (e.g. "xagex") would pass the check.
        if (defined $order && $order !~ m/^(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }

        git_project_search_form($searchtext, $search_use_regexp);
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6240
# 'forks' action: print the page listing the projects that
# git_get_projects_list() returns for the current project's name with a
# trailing ".git" removed.
#
# Fails with 400 for an unknown 'order' parameter and with 404 when the
# list is empty.
sub git_forks {
        my $order = $input_params{'order'};
        # The pattern is anchored so that only the exact known names are
        # accepted; unanchored, any value merely containing one of them
        # (e.g. "xagex") would pass the check.
        if (defined $order && $order !~ m/^(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        # Escape the title like the other callers of git_print_header_div do;
        # NOTE(review): this assumes the title is emitted as HTML without
        # further escaping -- confirm against git_print_header_div.
        git_print_header_div('summary', esc_html("$project forks"));
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6260
# 'project_index' action: print the list of projects as plain text, one
# "<path> <owner>" pair per line, both fields URL-quoted.
#
# Fails with 404 when no projects are found. The owner is looked up (and
# stored in the project entry) when the entry does not have one yet.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
        my $quote_field = sub {
                my ($text) = @_;
                $text =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                $text =~ s/ /\+/g;
                return $text;
        };

        foreach my $pr (@projects) {
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                my $path  = $quote_field->($pr->{'path'});
                my $owner = $quote_field->($pr->{'owner'});

                print "$path $owner\n";
        }
}
6287
# 'summary' action: print the summary page of the current project.
#
# The page consists of a metadata table (description, owner, last change,
# repository URLs and, if the 'ctags' feature is on, content tags), the
# README.html of the project (unless $prevent_xss is set), and shortened
# lists of commits, tags, heads, remotes (with the 'remote_heads' feature)
# and forks (with the 'forks' feature). Each shortened list ends with a
# "..." link to the full view when there are more entries than shown.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata;
        %remotedata = git_get_remotes_list() if $remote_heads;

        my @forklist;
        my $forks_enabled = gitweb_check_feature('forks');
        if ($forks_enabled) {
                # find forks of a project
                (my $fork_filter = $project) =~ s/\.git$//;
                @forklist = git_get_projects_list($fork_filter);
                # filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        # metadata table
        print "<div class=\"title\">&nbsp;</div>\n";
        my $desc_row  = "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
        my $owner_row = "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        print "<table class=\"projects_list\">\n" . $desc_row . $owner_row;
        if (defined $cd{'rfc2822'}) {
                my $last_change = format_timestamp_html(\%cd);
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>" . $last_change . "</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        unless (@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        # only the first printed URL gets the "URL" label
        my $url_tag = "URL";
        foreach my $git_url (@url_list) {
                if ($git_url) {
                        print format_repo_url($url_tag, $git_url);
                        $url_tag = "";
                }
        }

        # Tag cloud
        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        my $cloud_html = git_show_project_tagcloud($cloud, 48);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>" . $cloud_html . "</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file("$projectroot/$project/README.html");
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                my $more = @commitlist > 16
                        ? $cgi->a({-href => href(action=>"shortlog")}, "...")
                        : undef;
                git_shortlog_body(\@commitlist, 0, 15, $refs, $more);
        }

        if (@taglist) {
                git_print_header_div('tags');
                my $more = @taglist > 16
                        ? $cgi->a({-href => href(action=>"tags")}, "...")
                        : undef;
                git_tags_body(\@taglist, 0, 15, $more);
        }

        if (@headlist) {
                git_print_header_div('heads');
                my $more = @headlist > 16
                        ? $cgi->a({-href => href(action=>"heads")}, "...")
                        : undef;
                git_heads_body(\@headlist, $head, 0, 15, $more);
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                my $more = @forklist > 16
                        ? $cgi->a({-href => href(action=>"forks")}, "...")
                        : undef;
                git_project_list_body(\@forklist, 'age', 0, 15, $more, 'no_header');
        }

        git_footer_html();
}
6403
# 'tag' action: print the page for the tag object named by $hash.
#
# Shows a link to the tagged object (using the object's type as the
# action), the authorship rows when the tag has an author, and the tag
# message. Fails with 404 when parse_tag() returns nothing.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both links of the "object" row lead to the tagged object
        my $object_href = href(action=>$tag{'type'}, hash=>$tag{'object'});
        my $object_link = $cgi->a({-class => "list", -href => $object_href},
                                  $tag{'object'});
        my $type_link   = $cgi->a({-href => $object_href}, $tag{'type'});
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $object_link . "</td>\n" .
              "<td class=\"link\">" . $type_link . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n";

        # tag message, one line at a time
        print "<div class=\"page_body\">";
        my $comment = $tag{'comment'};
        for my $line (@$comment) {
                chomp $line;
                my $escaped = esc_html($line, -nbsp=>1);
                print $escaped . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6438
6439sub git_blame_common {
6440        my $format = shift || 'porcelain';
6441        if ($format eq 'porcelain' && $input_params{'javascript'}) {
6442                $format = 'incremental';
6443                $action = 'blame_incremental'; # for page title etc
6444        }
6445
6446        # permissions
6447        gitweb_check_feature('blame')
6448                or die_error(403, "Blame view not allowed");
6449
6450        # error checking
6451        die_error(400, "No file name given") unless $file_name;
6452        $hash_base ||= git_get_head_hash($project);
6453        die_error(404, "Couldn't find base commit") unless $hash_base;
6454        my %co = parse_commit($hash_base)
6455                or die_error(404, "Commit not found");
6456        my $ftype = "blob";
6457        if (!defined $hash) {
6458                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
6459                        or die_error(404, "Error looking up file");
6460        } else {
6461                $ftype = git_get_type($hash);
6462                if ($ftype !~ "blob") {
6463                        die_error(400, "Object is not a blob");
6464                }
6465        }
6466
6467        my $fd;
6468        if ($format eq 'incremental') {
6469                # get file contents (as base)
6470                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
6471                        or die_error(500, "Open git-cat-file failed");
6472        } elsif ($format eq 'data') {
6473                # run git-blame --incremental
6474                open $fd, "-|", git_cmd(), "blame", "--incremental",
6475                        $hash_base, "--", $file_name
6476                        or die_error(500, "Open git-blame --incremental failed");
6477        } else {
6478                # run git-blame --porcelain
6479                open $fd, "-|", git_cmd(), "blame", '-p',
6480                        $hash_base, '--', $file_name
6481                        or die_error(500, "Open git-blame --porcelain failed");
6482        }
6483
6484        # incremental blame data returns early
6485        if ($format eq 'data') {
6486                print $cgi->header(
6487                        -type=>"text/plain", -charset => "utf-8",
6488                        -status=> "200 OK");
6489                local $| = 1; # output autoflush
6490                while (my $line = <$fd>) {
6491                        print to_utf8($line);
6492                }
6493                close $fd
6494                        or print "ERROR $!\n";
6495
6496                print 'END';
6497                if (defined $t0 && gitweb_check_feature('timed')) {
6498                        print ' '.
6499                              tv_interval($t0, [ gettimeofday() ]).
6500                              ' '.$number_of_git_cmds;
6501                }
6502                print "\n";
6503
6504                return;
6505        }
6506
6507        # page header
6508        git_header_html();
6509        my $formats_nav =
6510                $cgi->a({-href => href(action=>"blob", -replay=>1)},
6511                        "blob") .
6512                " | ";
6513        if ($format eq 'incremental') {
6514                $formats_nav .=
6515                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
6516                                "blame") . " (non-incremental)";
6517        } else {
6518                $formats_nav .=
6519                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
6520                                "blame") . " (incremental)";
6521        }
6522        $formats_nav .=
6523                " | " .
6524                $cgi->a({-href => href(action=>"history", -replay=>1)},
6525                        "history") .
6526                " | " .
6527                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
6528                        "HEAD");
6529        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
6530        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
6531        git_print_page_path($file_name, $ftype, $hash_base);
6532
6533        # page body
6534        if ($format eq 'incremental') {
6535                print "<noscript>\n<div class=\"error\"><center><b>\n".
6536                      "This page requires JavaScript to run.\n Use ".
6537                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
6538                              'this page').
6539                      " instead.\n".
6540                      "</b></center></div>\n</noscript>\n";
6541
6542                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
6543        }
6544
6545        print qq!<div class="page_body">\n!;
6546        print qq!<div id="progress_info">... / ...</div>\n!
6547                if ($format eq 'incremental');
6548        print qq!<table id="blame_table" class="blame" width="100%">\n!.
6549              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
6550              qq!<thead>\n!.
6551              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
6552              qq!</thead>\n!.
6553              qq!<tbody>\n!;
6554
6555        my @rev_color = qw(light dark);
6556        my $num_colors = scalar(@rev_color);
6557        my $current_color = 0;
6558
6559        if ($format eq 'incremental') {
6560                my $color_class = $rev_color[$current_color];
6561
6562                #contents of a file
6563                my $linenr = 0;
6564        LINE:
6565                while (my $line = <$fd>) {
6566                        chomp $line;
6567                        $linenr++;
6568
6569                        print qq!<tr id="l$linenr" class="$color_class">!.
6570                              qq!<td class="sha1"><a href=""> </a></td>!.
6571                              qq!<td class="linenr">!.
6572                              qq!<a class="linenr" href="">$linenr</a></td>!;
6573                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
6574                        print qq!</tr>\n!;
6575                }
6576
6577        } else { # porcelain, i.e. ordinary blame
6578                my %metainfo = (); # saves information about commits
6579
6580                # blame data
6581        LINE:
6582                while (my $line = <$fd>) {
6583                        chomp $line;
6584                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
6585                        # no <lines in group> for subsequent lines in group of lines
6586                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
6587                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
6588                        if (!exists $metainfo{$full_rev}) {
6589                                $metainfo{$full_rev} = { 'nprevious' => 0 };
6590                        }
6591                        my $meta = $metainfo{$full_rev};
6592                        my $data;
6593                        while ($data = <$fd>) {
6594                                chomp $data;
6595                                last if ($data =~ s/^\t//); # contents of line
6596                                if ($data =~ /^(\S+)(?: (.*))?$/) {
6597                                        $meta->{$1} = $2 unless exists $meta->{$1};
6598                                }
6599                                if ($data =~ /^previous /) {
6600                                        $meta->{'nprevious'}++;
6601                                }
6602                        }
6603                        my $short_rev = substr($full_rev, 0, 8);
6604                        my $author = $meta->{'author'};
6605                        my %date =
6606                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
6607                        my $date = $date{'iso-tz'};
6608                        if ($group_size) {
6609                                $current_color = ($current_color + 1) % $num_colors;
6610                        }
6611                        my $tr_class = $rev_color[$current_color];
6612                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
6613                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
6614                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
6615                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
6616                        if ($group_size) {
6617                                print "<td class=\"sha1\"";
6618                                print " title=\"". esc_html($author) . ", $date\"";
6619                                print " rowspan=\"$group_size\"" if ($group_size > 1);
6620                                print ">";
6621                                print $cgi->a({-href => href(action=>"commit",
6622                                                             hash=>$full_rev,
6623                                                             file_name=>$file_name)},
6624                                              esc_html($short_rev));
6625                                if ($group_size >= 2) {
6626                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
6627                                        if (@author_initials) {
6628                                                print "<br />" .
6629                                                      esc_html(join('', @author_initials));
6630                                                #           or join('.', ...)
6631                                        }
6632                                }
6633                                print "</td>\n";
6634                        }
6635                        # 'previous' <sha1 of parent commit> <filename at commit>
6636                        if (exists $meta->{'previous'} &&
6637                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
6638                                $meta->{'parent'} = $1;
6639                                $meta->{'file_parent'} = unquote($2);
6640                        }
6641                        my $linenr_commit =
6642                                exists($meta->{'parent'}) ?
6643                                $meta->{'parent'} : $full_rev;
6644                        my $linenr_filename =
6645                                exists($meta->{'file_parent'}) ?
6646                                $meta->{'file_parent'} : unquote($meta->{'filename'});
6647                        my $blamed = href(action => 'blame',
6648                                          file_name => $linenr_filename,
6649                                          hash_base => $linenr_commit);
6650                        print "<td class=\"linenr\">";
6651                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
6652                                        -class => "linenr" },
6653                                      esc_html($lineno));
6654                        print "</td>";
6655                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
6656                        print "</tr>\n";
6657                } # end while
6658
6659        }
6660
6661        # footer
6662        print "</tbody>\n".
6663              "</table>\n"; # class="blame"
6664        print "</div>\n";   # class="blame_body"
6665        close $fd
6666                or print "Reading blob failed\n";
6667
6668        git_footer_html();
6669}
6670
# Entry point that runs git_blame_common() without a format argument.
sub git_blame {
        return git_blame_common();
}
6674
# Entry point that runs git_blame_common() with the 'incremental' format.
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6678
# Entry point that runs git_blame_common() with the 'data' format.
sub git_blame_data {
        return git_blame_common('data');
}
6682
# Print the tags page for the current project: header, navigation bar,
# 'summary' header div, the tag list (when there is one) and the footer.
sub git_tags {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                           format_ref_views('tags'));
        git_print_header_div('summary', $project);

        # the list body is emitted only when at least one tag was found
        my @tags = git_get_tags_list();
        git_tags_body(\@tags) if @tags;

        git_footer_html();
}
6695
# Print the heads page for the current project: header, navigation bar,
# 'summary' header div, the head list (when there is one) and the footer.
sub git_heads {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                           format_ref_views('heads'));
        git_print_header_div('summary', $project);

        # the list body is emitted only when at least one head was found;
        # the hash of HEAD is handed on to the body printer
        my @heads = git_get_heads_list();
        git_heads_body(\@heads, $head_hash) if @heads;

        git_footer_html();
}
6708
# Handler shared by the single-remote view and the list of all remotes.
# The remote name is read from the 'hash' input parameter; when it is not
# defined, every remote is listed.
#
# Dies via die_error() with 403 if the 'remote_heads' feature is off, with
# 500 if no remote data could be obtained, and with 404 if the data is empty.
sub git_remotes {
        die_error(403, "Remote heads view is disabled")
                unless gitweb_check_feature('remote_heads');

        my $head_hash   = git_get_head_hash($project);
        my $remote_name = $input_params{'hash'};

        my $remotes = git_get_remotes_list($remote_name);
        defined $remotes
                or die_error(500, "Unable to get remote information");

        if (!%$remotes) {
                if (defined $remote_name) {
                        die_error(404, "Remote $remote_name not found");
                } else {
                        die_error(404, "No remotes found");
                }
        }

        git_header_html(undef, undef, -action_extra => $remote_name);
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                           format_ref_views($remote_name ? '' : 'remotes'));

        fill_remote_heads($remotes);
        if (!defined $remote_name) {
                # list of all remotes
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotes, undef, $head_hash);
        } else {
                # a single remote
                git_print_header_div('remotes', "$remote_name remote for $project");
                git_remote_block($remote_name, $remotes->{$remote_name},
                                 undef, $head_hash);
        }

        git_footer_html();
}
6741
# Send one blob as the raw body of the HTTP response.
#
# Parameters:
#   $type - optional content type; it is passed through blob_contenttype(),
#           which returns the type actually used (may include a charset).
#
# The blob is identified by the global $hash.  When $hash is not defined it
# is looked up from $file_name relative to $hash_base (or, failing that, the
# head of the project).  Errors are reported through die_error(): 400 when
# neither hash nor file name is known, 404 when the path cannot be resolved,
# 500 when git-cat-file cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain; the same goes for */*+xml types whose
        # content looks like text.  The subtype prefix before "+xml" may be
        # any number of letters (svg+xml, xhtml+xml, ...), hence "[a-z]+".
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                # $1 holds whatever followed the media type (e.g. charset)
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        # The file name ends up inside a quoted string in the header, so
        # double quotes and backslashes have to be backslash-escaped (the
        # same escaping git_snapshot applies to its file name).  This is done
        # only after $1 from the content-type match above has been consumed.
        my $quoted_name = $save_as;
        $quoted_name =~ s/(["\\])/\\$1/g;

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $quoted_name . '"');
        # slurp the blob and send it out unmodified
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6803
# Show one blob as an HTML page: either as an <img> referring to the
# blob_plain view (image mimetypes) or as numbered, escaped text lines.
#
# The blob is identified by the global $hash; when it is not defined it is
# looked up from $file_name relative to $hash_base (or the project head).
# Content that is neither text/* nor gif/png/jpeg and tests as binary is
# handed over to git_blob_plain() instead.
sub git_blob {
        my $expires;

        if (defined $hash) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d" if $hash =~ m/^[0-9a-fA-F]{40}$/;
        } elsif (defined $file_name) {
                my $base = $hash_base || git_get_head_hash($project);
                $hash = git_get_hash_by_path($base, $file_name, "blob")
                        or die_error(404, "Cannot find file");
        } else {
                die_error(400, "No file name defined");
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);

        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        my $displayable = ($mimetype =~ m!^(?:text/|image/(?:gif|png|jpeg)$)!);
        if (!$displayable && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }

        # we can have blame only for text/* mimetype
        if ($have_blame) {
                $have_blame = ($mimetype =~ m!^text/!);
        }

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        if ($syntax) {
                # from here on the lines are read from the highlighter output
                $fd = run_highlighter($fd, $highlight, $syntax);
        }

        git_header_html(undef, $expires);

        my %co;
        %co = parse_commit($hash_base) if defined $hash_base;
        if (%co) {
                # links to the alternative views of this blob
                my @views;
                if (defined $file_name) {
                        push @views,
                                $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                        "blame")
                                if $have_blame;
                        push @views,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history");
                        push @views,
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                        push @views,
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD",
                                                       file_name=>$file_name)},
                                        "HEAD");
                } else {
                        push @views,
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                my $formats_nav = join(" | ", @views);

                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable commit: empty navigation, title is the blob hash
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }

        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";

        if ($mimetype !~ m!^image/!) {
                # text: one <div> per line, each with a self-referencing anchor
                my $line_no = 0;
                while (my $text = <$fd>) {
                        chomp $text;
                        ++$line_no;
                        $text = untabify($text);
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $line_no, esc_attr(href(-replay => 1)), $line_no, $line_no,
                               $syntax ? sanitize($text) : esc_html($text, -nbsp=>1);
                }
        } else {
                # image: let the browser fetch it through the blob_plain view
                my $img = qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        $img .= qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                $img .= qq! src="! .
                        href(action=>"blob_plain", hash=>$hash,
                             hash_base=>$hash_base, file_name=>$file_name) .
                        qq!" />\n!;
                print $img;
        }

        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
6896
# Show a tree object as an HTML table with one row per ls-tree entry.
#
# Works on the globals $hash, $hash_base and $file_name: $hash_base defaults
# to "HEAD"; a missing $hash is looked up from $file_name, or else taken to
# be $hash_base itself.  Dies with 404 when no tree hash can be determined
# or when reading git-ls-tree output fails.
sub git_tree {
        $hash_base = "HEAD" unless defined $hash_base;
        unless (defined $hash) {
                $hash = defined $file_name
                        ? git_get_hash_by_path($hash_base, $file_name, "tree")
                        : $hash_base;
        }
        defined($hash)
                or die_error(404, "No such tree");

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        # ls-tree is run with -z, so records are NUL-terminated
        my @entries;
        {
                local $/ = "\0";
                my @size_opt = $show_sizes ? ('-l') : ();
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        @size_opt, @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = <$fd>;
                chomp @entries; # strips the trailing NUL of every record
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();

        my %co;
        %co = parse_commit($hash_base) if defined $hash_base;
        if (%co) {
                my @views_nav;
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history");
                        push @views_nav,
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD",
                                                       file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                # FIXME: Should be available when we have no hash base as well.
                push @views_nav, $snapshot_links
                        if defined $snapshot_links;
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base does not name a commit we can parse: forget it
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }

        # directory prefix handed to the entry printer, always '/'-terminated
        my $basedir = '';
        if (defined $file_name) {
                $basedir = $file_name;
                $basedir .= '/'
                        if $basedir ne '' && substr($basedir, -1) ne '/';
                git_print_page_path($file_name, 'tree', $hash_base);
        }

        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";

        # rows alternate between the "dark" and "light" classes, dark first
        my $alternate = 1;

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                my $row_open = $alternate
                        ? "<tr class=\"dark\">\n"
                        : "<tr class=\"light\">\n";
                print $row_open;
                $alternate = $alternate ? 0 : 1;

                # parent directory: drop the last path component
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                $up = undef unless $up;

                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                if ($show_sizes) {
                        print '<td class="size">&nbsp;</td>'."\n";
                }
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }

        for my $entry (@entries) {
                my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

                my $row_open = $alternate
                        ? "<tr class=\"dark\">\n"
                        : "<tr class=\"light\">\n";
                print $row_open;
                $alternate = $alternate ? 0 : 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }

        print "</table>\n" .
              "</div>";
        git_footer_html();
}
7006
# Build the base name "<project>-<version>" used for a snapshot.
#
# Parameters:
#   $project - project path, e.g. path/to/project.git
#   $hash    - object name the snapshot is made of (hex id or ref name)
#
# Returns the name; in list context the same name is returned twice.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $base_name = to_utf8($project);
        $base_name =~ s,([^/])/*\.git$,$1,;
        $base_name = basename($base_name);
        # sanitize name
        $base_name =~ s/[[:cntrl:]]/?/g;

        my $ver = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                my $full_hash = git_get_full_hash($project, $hash);
                $ver = git_get_short_hash($project, $hash)
                        if ($full_hash =~ /^$hash/ && length($hash) > 7);
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $ver = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                my ($branch) = ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!);
                $ver = $branch if defined $branch;
                $ver = $ver . '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $ver =~ s!/!.!g;

        # name = project-version_string
        my $snapshot = join('-', $base_name, $ver);

        return ($snapshot, $snapshot) if wantarray;
        return $snapshot;
}
7043
# Send a snapshot (archive) of the tree-ish named by the global $hash.
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  Errors are reported via
# die_error(): 403 when snapshots or the chosen format are not allowed,
# 400 for a malformed/unknown format or a blob object, 404 when the object
# does not exist, 500 when the archive command cannot be started.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # the file name goes into a quoted string: escape '"' and '\'
        $filename =~ s/(["\\])/\\$1/g;

        # Start the archive command before anything is sent to the client:
        # if it cannot be started, die_error() can still produce a proper
        # error response instead of writing into a "200 OK" archive reply.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        {
                # The archive is binary data, so reading it "by line" is
                # meaningless; copy it in fixed-size records instead of
                # holding the whole archive in memory.
                local $/ = \65536;
                while (defined(my $chunk = <$fd>)) {
                        print $chunk;
                }
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7091
# Common driver for log-like pages (100 commits per page).
#
# Parameters:
#   $fmt_name  - name of the view, passed to the paging/page navigation
#   $body_subr - code reference that prints the list of commits
#   $base      - commit to start from (defaults to the project head)
#   $parent    - optional; when defined the range "$parent..$base" is shown
#   $file_name - optional path to limit the log to
#   $file_hash - optional hash of the object at that path
#
# Dies via die_error() with 500 when a path is given but its object type
# cannot be determined, and with 404 when $base cannot be parsed as a commit
# (the latter is checked only when a path is given).
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0     unless defined $page;
        my $refs = git_get_references();

        my $commit_hash = defined $parent ? "$parent..$base" : $base;
        my @path_limit = defined $file_name ? ($file_name, "--full-history") : ();
        # one commit more than a page holds is requested, so that we can
        # tell whether there is a next page
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page), @path_limit);

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        $ftype = git_get_type($file_hash)
                if defined $file_hash;
        die_error(500, "Unknown type of object")
                if (defined $file_name && !defined $ftype);

        my %co;
        if (defined $file_name) {
                %co = parse_commit($base);
                die_error(404, "Unknown commit object") unless %co;
        }

        my $has_next_page = ($#commitlist >= 100);
        my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
        my $next_link = '';
        if ($has_next_page) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        # "patches" link: only for whole-project logs, and only when the
        # 'patches' feature value is negative or not below the commit count
        my $patch_max = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name &&
            ($patch_max < 0 || @commitlist <= $patch_max)) {
                $paging_nav .= " &sdot; " .
                        $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                "patches");
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (!defined $file_name) {
                git_print_header_div('summary', $project);
        } else {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
                git_print_page_path($file_name, $ftype, $hash_base);
        }

        # the body printer gets the commits of this page (indices 0..99)
        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
7165
# 'log' view: git_log_generic() with git_log_body as the body printer,
# starting at the global $hash and bounded by the global $hash_parent.
sub git_log {
        return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
7170
# Show a single commit: authorship, tree and parent links, the commit
# message and the list of changed files (git-diff-tree output).
#
# The commit is named by the global $hash, falling back to $hash_base and
# then to "HEAD".  Dies via die_error() with 404 when the commit cannot be
# parsed or reading diff-tree output fails, 500 when diff-tree cannot start.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash);
        %co or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                my $parent_link =
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$parent)},
                                esc_html(substr($parent, 0, 7)));
                $formats_nav = '(parent: ' . $parent_link . ')';
        } else {
                # merge commit
                my @parent_links;
                foreach my $par (@$parents) {
                        push @parent_links,
                                $cgi->a({-href => href(action=>"commit",
                                                       hash=>$par)},
                                        esc_html(substr($par, 0, 7)));
                }
                $formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # a commit without parent is compared against the empty tree
        $parent = "--root" unless defined $parent;

        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        if (!defined $co{'parent'}) {
                git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
        } else {
                git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
        }

        # header table: authorship, commit id, tree and parents
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

        # tree row; its link cell is closed only after the snapshot links
        print join('',
                "<tr>",
                "<td>tree</td>",
                "<td class=\"sha1\">",
                $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                         class => "list"}, $co{'tree'}),
                "</td>",
                "<td class=\"link\">",
                $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                        "tree"));
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td>" .
              "</tr>\n";

        # one row per parent, with links to the parent and to the diff
        foreach my $par (@$parents) {
                print join('',
                        "<tr>",
                        "<td>parent</td>",
                        "<td class=\"sha1\">",
                        $cgi->a({-href => href(action=>"commit", hash=>$par),
                                 class => "list"}, $par),
                        "</td>",
                        "<td class=\"link\">",
                        $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit"),
                        " | ",
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff"),
                        "</td>",
                        "</tr>\n");
        }
        print "</table>".
              "</div>\n";

        # commit message
        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7284
# Find out what kind of object the request refers to and redirect (302) to
# the view named after that type.
#
# The object is defined by:
# - hash or hash_base alone
# - hash_base and file_name
#
# Dies via die_error() with 404 when the object, the base object or the
# path cannot be found, 500 when git-ls-tree cannot be started, and 400
# when the request does not carry enough information.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the command printed no type; skip
                # chomp then, so that the 404 below is not preceded by an
                # "uninitialized value" warning
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                # second field is the object type, third one its hash
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7331
# Show the difference between two versions of a single blob (file).
#
# $format (first positional argument, default 'html') selects the output:
#   'html'  - full page, patch rendered through git_patchset_body()
#   'plain' - text/plain patch preceded by an "X-Git-Url:" line
# Any other value ends in a 400 error.
#
# The pair of blobs is selected by the request parameters $hash_base and
# $hash_parent_base (the two trees to compare) together with either
# $file_name (and optionally $file_parent for the name on the parent side)
# or $hash, the id of the blob on the $hash_base side, from which the file
# name is looked up. Requests lacking $hash_base / $hash_parent_base are
# rejected with 404.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ m/^[0-9a-fA-F]{40}$/) {
                        # try to find filename from $hash
                        #
                        # $hash is interpolated into the pattern below, so it
                        # has to be a full object id and nothing else; the
                        # match is anchored for that reason

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                # more than one raw line means the parameters did not
                # single out one file
                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        # (status is given as a plain number, like in every other
        # die_error() call)
        if (!%diffinfo) {
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # up to and including the '+++' line, replace object ids
                # used as a/... and b/... names by the real file names
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7466
# 'plain' flavour of the blob diff: delegates to git_blobdiff() asking for
# its text/plain output.
sub git_blobdiff_plain {
        return git_blobdiff('plain');
}
7470
# Returns the navigation fragment for switching between diff styles.
#
# The fragment is meant to be appended to navigation that already exists,
# hence every entry is preceded by " | " (the result reads " | foo | bar",
# not "foo | bar").
#
# $diff_style  - currently selected style (defaults to 'inline'); it is shown
#                as plain text, the other styles as links
# $is_combined - when true no style switcher is offered at all and an empty
#                string is returned
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;

        return "" if ($is_combined);

        $diff_style ||= 'inline';

        # style names in the order they are displayed, and their labels
        my @style_order = ('inline', 'sidebyside');
        my %label_of = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my @entries;
        foreach my $style (@style_order) {
                push @entries, ($style eq $diff_style)
                        ? $label_of{$style}
                        : $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                  $label_of{$style});
        }

        return join '', map { " | ".$_ } @entries;
}
7491
# Show the changes introduced by a commit, or the changes between two commits.
#
# Named parameters (flat key/value list):
#   -format => 'html' (default), 'plain' or 'patch'; anything else is
#              answered with a 400 error
#   -single => when true and no parent is given, 'patch' output is limited
#              to the single commit $hash
#
# The commit comes from $hash (falling back to $hash_base, then "HEAD"); an
# unknown commit is answered with 404. $hash_parent, when set, names the
# commit to compare against; for a merge commit without explicit parent it
# is set to '--cc' (combined diff). The 'patch' format is answered with 403
# unless the 'patches' feature yields a true value.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                # the patch link is offered for non-merge commits only
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of them
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                #
                # '-c' and '--cc' only select the kind of combined diff; they
                # are not commits and cannot start a revision range, so they
                # are handled like a missing parent here (a merge commit
                # without explicit parent got '--cc' assigned above).
                my $range_start = $hash_parent;
                if (defined $range_start &&
                    ($range_start eq '-c' || $range_start eq '--cc')) {
                        $range_start = undef;
                }
                my @commit_spec = ();
                if ($range_start) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$range_start..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                # a one line comment is just the title, which is shown already
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                # mail-like preamble in front of the diff
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit parent commit the diff is relative to
                # all parents of the commit
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # headers are out already, so a failure can only be noted
                # at the end of the output
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7719
# 'plain' flavour of the commit diff: delegates to git_commitdiff() with the
# format fixed to 'plain'.
sub git_commitdiff_plain {
        my @diff_params = (-format => 'plain');
        return git_commitdiff(@diff_params);
}
7723
7724# format-patch-style patches
# Single commit in 'patch' format: git_commitdiff() is asked for the 'patch'
# format with the -single flag set.
sub git_patch {
        my @diff_params = (
                -format => 'patch',
                -single => 1,
        );
        return git_commitdiff(@diff_params);
}
7728
# Several commits in 'patch' format: same as git_patch(), but without the
# -single flag.
sub git_patches {
        my @diff_params = (-format => 'patch');
        return git_commitdiff(@diff_params);
}
7732
# 'history' view: handled by the generic log code, with git_history_body()
# producing the body and $file_name / $hash passed along in addition to the
# two base commits.
sub git_history {
        return git_log_generic(
                'history',
                \&git_history_body,
                $hash_base,
                $hash_parent_base,
                $file_name,
                $hash,
        );
}
7738
# Entry point of the search action.
#
# Checks that the requested kind of search ($searchtype, 'commit' when not
# given) is enabled, fills in defaults for $hash and $page, and then hands
# the parsed commit over to the routine implementing that kind of search.
# Problems are reported through die_error(): 403 for a disabled feature,
# 400 for missing search text or an unknown search type, 404 for an unknown
# commit.
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');

        # pickaxe may take all resources of your box and run for several minutes
        # with every query - so decide by yourself how public you make this feature
        if ($searchtype eq 'pickaxe' && !gitweb_check_feature('pickaxe')) {
                die_error(403, "Pickaxe search is disabled");
        }

        # grep search might be potentially CPU-intensive, too
        if ($searchtype eq 'grep' && !gitweb_check_feature('grep')) {
                die_error(403, "Grep search is disabled");
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        # search starts at the head of the project unless told otherwise
        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # which routine implements which kind of search
        my %search_sub_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );

        my $search_sub = $search_sub_for{$searchtype};
        if (defined $search_sub) {
                $search_sub->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
7783
# Print the help page of the search feature: an explanation of the accepted
# patterns followed by one entry per search type. The entries for 'grep' and
# 'pickaxe' appear only when the respective feature is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # pattern syntax and the 'commit' search
        print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        # 'grep' search, optional
        print <<HELP_GREP if gitweb_check_feature('grep');
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP

        # 'author' and 'committer' searches
        print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        # 'pickaxe' search, optional
        print <<HELP_PICKAXE if gitweb_check_feature('pickaxe');
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE

        print "</dl>\n";
        git_footer_html();
}
7827
# 'shortlog' view: handled by the generic log code, with git_shortlog_body()
# producing the body for the commits selected by $hash / $hash_parent.
sub git_shortlog {
        return git_log_generic(
                'shortlog',
                \&git_shortlog_body,
                $hash,
                $hash_parent,
        );
}
7832
7833## ......................................................................
7834## feeds (RSS, Atom; OPML)
7835
7836sub git_feed {
7837        my $format = shift || 'atom';
7838        my $have_blame = gitweb_check_feature('blame');
7839
7840        # Atom: http://www.atomenabled.org/developers/syndication/
7841        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
7842        if ($format ne 'rss' && $format ne 'atom') {
7843                die_error(400, "Unknown web feed format");
7844        }
7845
7846        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
7847        my $head = $hash || 'HEAD';
7848        my @commitlist = parse_commits($head, 150, 0, $file_name);
7849
7850        my %latest_commit;
7851        my %latest_date;
7852        my $content_type = "application/$format+xml";
7853        if (defined $cgi->http('HTTP_ACCEPT') &&
7854                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
7855                # browser (feed reader) prefers text/xml
7856                $content_type = 'text/xml';
7857        }
7858        if (defined($commitlist[0])) {
7859                %latest_commit = %{$commitlist[0]};
7860                my $latest_epoch = $latest_commit{'committer_epoch'};
7861                %latest_date   = parse_date($latest_epoch, $latest_commit{'comitter_tz'});
7862                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
7863                if (defined $if_modified) {
7864                        my $since;
7865                        if (eval { require HTTP::Date; 1; }) {
7866                                $since = HTTP::Date::str2time($if_modified);
7867                        } elsif (eval { require Time::ParseDate; 1; }) {
7868                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
7869                        }
7870                        if (defined $since && $latest_epoch <= $since) {
7871                                print $cgi->header(
7872                                        -type => $content_type,
7873                                        -charset => 'utf-8',
7874                                        -last_modified => $latest_date{'rfc2822'},
7875                                        -status => '304 Not Modified');
7876                                return;
7877                        }
7878                }
7879                print $cgi->header(
7880                        -type => $content_type,
7881                        -charset => 'utf-8',
7882                        -last_modified => $latest_date{'rfc2822'});
7883        } else {
7884                print $cgi->header(
7885                        -type => $content_type,
7886                        -charset => 'utf-8');
7887        }
7888
7889        # Optimization: skip generating the body if client asks only
7890        # for Last-Modified date.
7891        return if ($cgi->request_method() eq 'HEAD');
7892
7893        # header variables
7894        my $title = "$site_name - $project/$action";
7895        my $feed_type = 'log';
7896        if (defined $hash) {
7897                $title .= " - '$hash'";
7898                $feed_type = 'branch log';
7899                if (defined $file_name) {
7900                        $title .= " :: $file_name";
7901                        $feed_type = 'history';
7902                }
7903        } elsif (defined $file_name) {
7904                $title .= " - $file_name";
7905                $feed_type = 'history';
7906        }
7907        $title .= " $feed_type";
7908        my $descr = git_get_project_description($project);
7909        if (defined $descr) {
7910                $descr = esc_html($descr);
7911        } else {
7912                $descr = "$project " .
7913                         ($format eq 'rss' ? 'RSS' : 'Atom') .
7914                         " feed";
7915        }
7916        my $owner = git_get_project_owner($project);
7917        $owner = esc_html($owner);
7918
7919        #header
7920        my $alt_url;
7921        if (defined $file_name) {
7922                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
7923        } elsif (defined $hash) {
7924                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
7925        } else {
7926                $alt_url = href(-full=>1, action=>"summary");
7927        }
7928        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
7929        if ($format eq 'rss') {
7930                print <<XML;
7931<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
7932<channel>
7933XML
7934                print "<title>$title</title>\n" .
7935                      "<link>$alt_url</link>\n" .
7936                      "<description>$descr</description>\n" .
7937                      "<language>en</language>\n" .
7938                      # project owner is responsible for 'editorial' content
7939                      "<managingEditor>$owner</managingEditor>\n";
7940                if (defined $logo || defined $favicon) {
7941                        # prefer the logo to the favicon, since RSS
7942                        # doesn't allow both
7943                        my $img = esc_url($logo || $favicon);
7944                        print "<image>\n" .
7945                              "<url>$img</url>\n" .
7946                              "<title>$title</title>\n" .
7947                              "<link>$alt_url</link>\n" .
7948                              "</image>\n";
7949                }
7950                if (%latest_date) {
7951                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
7952                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
7953                }
7954                print "<generator>gitweb v.$version/$git_version</generator>\n";
7955        } elsif ($format eq 'atom') {
7956                print <<XML;
7957<feed xmlns="http://www.w3.org/2005/Atom">
7958XML
7959                print "<title>$title</title>\n" .
7960                      "<subtitle>$descr</subtitle>\n" .
7961                      '<link rel="alternate" type="text/html" href="' .
7962                      $alt_url . '" />' . "\n" .
7963                      '<link rel="self" type="' . $content_type . '" href="' .
7964                      $cgi->self_url() . '" />' . "\n" .
7965                      "<id>" . href(-full=>1) . "</id>\n" .
7966                      # use project owner for feed author
7967                      "<author><name>$owner</name></author>\n";
7968                if (defined $favicon) {
7969                        print "<icon>" . esc_url($favicon) . "</icon>\n";
7970                }
7971                if (defined $logo) {
7972                        # not twice as wide as tall: 72 x 27 pixels
7973                        print "<logo>" . esc_url($logo) . "</logo>\n";
7974                }
7975                if (! %latest_date) {
7976                        # dummy date to keep the feed valid until commits trickle in:
7977                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
7978                } else {
7979                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
7980                }
7981                print "<generator version='$version/$git_version'>gitweb</generator>\n";
7982        }
7983
7984        # contents
7985        for (my $i = 0; $i <= $#commitlist; $i++) {
7986                my %co = %{$commitlist[$i]};
7987                my $commit = $co{'id'};
7988                # we read 150, we always show 30 and the ones more recent than 48 hours
7989                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
7990                        last;
7991                }
7992                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});
7993
7994                # get list of changed files
7995                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7996                        $co{'parent'} || "--root",
7997                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
7998                        or next;
7999                my @difftree = map { chomp; $_ } <$fd>;
8000                close $fd
8001                        or next;
8002
8003                # print element (entry, item)
8004                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
8005                if ($format eq 'rss') {
8006                        print "<item>\n" .
8007                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
8008                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
8009                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
8010                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
8011                              "<link>$co_url</link>\n" .
8012                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
8013                              "<content:encoded>" .
8014                              "<![CDATA[\n";
8015                } elsif ($format eq 'atom') {
8016                        print "<entry>\n" .
8017                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
8018                              "<updated>$cd{'iso-8601'}</updated>\n" .
8019                              "<author>\n" .
8020                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
8021                        if ($co{'author_email'}) {
8022                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
8023                        }
8024                        print "</author>\n" .
8025                              # use committer for contributor
8026                              "<contributor>\n" .
8027                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
8028                        if ($co{'committer_email'}) {
8029                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
8030                        }
8031                        print "</contributor>\n" .
8032                              "<published>$cd{'iso-8601'}</published>\n" .
8033                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
8034                              "<id>$co_url</id>\n" .
8035                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
8036                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
8037                }
8038                my $comment = $co{'comment'};
8039                print "<pre>\n";
8040                foreach my $line (@$comment) {
8041                        $line = esc_html($line);
8042                        print "$line\n";
8043                }
8044                print "</pre><ul>\n";
8045                foreach my $difftree_line (@difftree) {
8046                        my %difftree = parse_difftree_raw_line($difftree_line);
8047                        next if !$difftree{'from_id'};
8048
8049                        my $file = $difftree{'file'} || $difftree{'to_file'};
8050
8051                        print "<li>" .
8052                              "[" .
8053                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
8054                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
8055                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
8056                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
8057                                      -title => "diff"}, 'D');
8058                        if ($have_blame) {
8059                                print $cgi->a({-href => href(-full=>1, action=>"blame",
8060                                                             file_name=>$file, hash_base=>$commit),
8061                                              -title => "blame"}, 'B');
8062                        }
8063                        # if this is not a feed of a file history
8064                        if (!defined $file_name || $file_name ne $file) {
8065                                print $cgi->a({-href => href(-full=>1, action=>"history",
8066                                                             file_name=>$file, hash=>$commit),
8067                                              -title => "history"}, 'H');
8068                        }
8069                        $file = esc_path($file);
8070                        print "] ".
8071                              "$file</li>\n";
8072                }
8073                if ($format eq 'rss') {
8074                        print "</ul>]]>\n" .
8075                              "</content:encoded>\n" .
8076                              "</item>\n";
8077                } elsif ($format eq 'atom') {
8078                        print "</ul>\n</div>\n" .
8079                              "</content>\n" .
8080                              "</entry>\n";
8081                }
8082        }
8083
8084        # end of feed
8085        if ($format eq 'rss') {
8086                print "</channel>\n</rss>\n";
8087        } elsif ($format eq 'atom') {
8088                print "</feed>\n";
8089        }
8090}
8091
# Thin wrapper: delegates to git_feed() asking for the 'rss' format and
# hands back whatever git_feed() returns.
sub git_rss {
        my $format = 'rss';
        return git_feed($format);
}
8095
# Thin wrapper: delegates to git_feed() asking for the 'atom' format and
# hands back whatever git_feed() returns.
sub git_atom {
        my $format = 'atom';
        return git_feed($format);
}
8099
# Print an OPML 1.0 document with one <outline type="rss"> element per
# project, pointing at the project's RSS feed and its summary page.
#
# The projects come from git_get_projects_list($project_filter, $strict_export);
# an empty list is reported as a 404 through die_error().  Projects whose
# HEAD hash is undefined, or for which parse_commit() yields nothing, are
# left out of the listing.
#
# Side effect: the global $git_dir is overwritten for every project that
# has a HEAD and is not restored afterwards.
sub git_opml {
        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                # NOTE(review): the code below assumes die_error() does not
                # return -- confirm against its definition
                die_error(404, "No projects found");
        }

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # the title mentions the subdirectory only when a project filter is set
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;
                my $head = git_get_head_hash($proj{'path'});
                next if !defined $head;

                # NOTE(review): parse_commit() presumably works on the
                # repository named by the global $git_dir -- confirm
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                next if !%co;

                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                my $rss_url  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
                my $html_url = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);

                # Every value below lands inside a double-quoted XML attribute,
                # so the URLs get the same escaping as $path; a raw '&', '"'
                # or '<' in a URL would otherwise break the document.
                print '<outline type="rss"' .
                      ' text="' . $path . '"' .
                      ' title="' . $path . '"' .
                      ' xmlUrl="' . esc_html($rss_url) . '"' .
                      ' htmlUrl="' . esc_html($html_url) . '"' .
                      "/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}