gitweb / gitweb.perlon commit utf8: release strbuf on error return in strbuf_utf8_replace() (9a012bf)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
# Compatibility shim: when $CGI::VERSION is undefined or older than 4.08,
# define CGI::multi_param() as a thin wrapper that forwards to CGI::param(),
# so the rest of the script can call multi_param() unconditionally.
if (!defined($CGI::VERSION) || $CGI::VERSION < 4.08) {
        eval 'sub CGI::multi_param { CGI::param(@_) }'
}

# Timestamp taken when the script starts, and a counter of git commands run
# (presumably reported by the 'timed' feature -- confirm against its users).
our $t0 = [ gettimeofday() ];
our $number_of_git_cmds = 0;

# When the MOD_PERL environment variable is set, call CGI->compile()
# at compile time.
BEGIN {
        CGI->compile() if $ENV{'MOD_PERL'};
}
  33
  34our $version = "++GIT_VERSION++";
  35
  36our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  37sub evaluate_uri {
  38        our $cgi;
  39
  40        our $my_url = $cgi->url();
  41        our $my_uri = $cgi->url(-absolute => 1);
  42
  43        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  44        # needed and used only for URLs with nonempty PATH_INFO
  45        our $base_url = $my_url;
  46
  47        # When the script is used as DirectoryIndex, the URL does not contain the name
  48        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  49        # have to do it ourselves. We make $path_info global because it's also used
  50        # later on.
  51        #
  52        # Another issue with the script being the DirectoryIndex is that the resulting
  53        # $my_url data is not the full script URL: this is good, because we want
  54        # generated links to keep implying the script name if it wasn't explicitly
  55        # indicated in the URL we're handling, but it means that $my_url cannot be used
  56        # as base URL.
  57        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  58        # to build the base URL ourselves:
  59        our $path_info = decode_utf8($ENV{"PATH_INFO"});
  60        if ($path_info) {
  61                # $path_info has already been URL-decoded by the web server, but
  62                # $my_url and $my_uri have not. URL-decode them so we can properly
  63                # strip $path_info.
  64                $my_url = unescape($my_url);
  65                $my_uri = unescape($my_uri);
  66                if ($my_url =~ s,\Q$path_info\E$,, &&
  67                    $my_uri =~ s,\Q$path_info\E$,, &&
  68                    defined $ENV{'SCRIPT_NAME'}) {
  69                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  70                }
  71        }
  72
  73        # target of the home link on top of all pages
  74        our $home_link = $my_uri || "/";
  75}
  76
  77# core git executable to use
  78# this can just be "git" if your webserver has a sensible PATH
  79our $GIT = "++GIT_BINDIR++/git";
  80
  81# absolute fs-path which will be prepended to the project path
  82#our $projectroot = "/pub/scm";
  83our $projectroot = "++GITWEB_PROJECTROOT++";
  84
  85# fs traversing limit for getting project list
  86# the number is relative to the projectroot
  87our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  88
  89# string of the home link on top of all pages
  90our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  91
  92# extra breadcrumbs preceding the home link
  93our @extra_breadcrumbs = ();
  94
  95# name of your site or organization to appear in page titles
  96# replace this with something more descriptive for clearer bookmarks
  97our $site_name = "++GITWEB_SITENAME++"
  98                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  99
 100# html snippet to include in the <head> section of each page
 101our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
 102# filename of html text to include at top of each page
 103our $site_header = "++GITWEB_SITE_HEADER++";
 104# html text to include at home page
 105our $home_text = "++GITWEB_HOMETEXT++";
 106# filename of html text to include at bottom of each page
 107our $site_footer = "++GITWEB_SITE_FOOTER++";
 108
 109# URI of stylesheets
 110our @stylesheets = ("++GITWEB_CSS++");
 111# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 112our $stylesheet = undef;
 113# URI of GIT logo (72x27 size)
 114our $logo = "++GITWEB_LOGO++";
 115# URI of GIT favicon, assumed to be image/png type
 116our $favicon = "++GITWEB_FAVICON++";
 117# URI of gitweb.js (JavaScript code for gitweb)
 118our $javascript = "++GITWEB_JS++";
 119
 120# URI and label (title) of GIT logo link
 121#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 122#our $logo_label = "git documentation";
 123our $logo_url = "http://git-scm.com/";
 124our $logo_label = "git homepage";
 125
 126# source of projects list
 127our $projects_list = "++GITWEB_LIST++";
 128
 129# the width (in characters) of the projects list "Description" column
 130our $projects_list_description_width = 25;
 131
 132# group projects by category on the projects list
 133# (enabled if this variable evaluates to true)
 134our $projects_list_group_categories = 0;
 135
 136# default category if none specified
 137# (leave the empty string for no category)
 138our $project_list_default_category = "";
 139
 140# default order of projects list
 141# valid values are none, project, descr, owner, and age
 142our $default_projects_order = "project";
 143
 144# show repository only if this file exists
 145# (only effective if this variable evaluates to true)
 146our $export_ok = "++GITWEB_EXPORT_OK++";
 147
 148# don't generate age column on the projects list page
 149our $omit_age_column = 0;
 150
 151# don't generate information about owners of repositories
 152our $omit_owner=0;
 153
 154# show repository only if this subroutine returns true
 155# when given the path to the project, for example:
 156#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 157our $export_auth_hook = undef;
 158
 159# only allow viewing of repositories also shown on the overview page
 160our $strict_export = "++GITWEB_STRICT_EXPORT++";
 161
 162# list of git base URLs used for URL to where fetch project from,
 163# i.e. full URL is "$git_base_url/$project"
 164our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 165
 166# default blob_plain mimetype and default charset for text/plain blob
 167our $default_blob_plain_mimetype = 'text/plain';
 168our $default_text_plain_charset  = undef;
 169
 170# file to use for guessing MIME types before trying /etc/mime.types
 171# (relative to the current git repository)
 172our $mimetypes_file = undef;
 173
# assume this charset if a line contains non-UTF-8 characters;
# it should be a valid encoding (see Encode::Supported(3pm) for the list)
# in which every byte sequence is valid, for example
# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
# could even be 'utf-8' for the old behavior)
 179our $fallback_encoding = 'latin1';
 180
 181# rename detection options for git-diff and git-diff-tree
 182# - default is '-M', with the cost proportional to
 183#   (number of removed files) * (number of new files).
 184# - more costly is '-C' (which implies '-M'), with the cost proportional to
 185#   (number of changed files + number of removed files) * (number of new files)
 186# - even more costly is '-C', '--find-copies-harder' with cost
 187#   (number of files in the original tree) * (number of new files)
 188# - one might want to include '-B' option, e.g. '-B', '-M'
 189our @diff_opts = ('-M'); # taken from git_commit
 190
 191# Disables features that would allow repository owners to inject script into
 192# the gitweb domain.
 193our $prevent_xss = 0;
 194
 195# Path to the highlight executable to use (must be the one from
 196# http://www.andre-simon.de due to assumptions about parameters and output).
 197# Useful if highlight is not installed on your webserver's PATH.
 198# [Default: highlight]
 199our $highlight_bin = "++HIGHLIGHT_BIN++";
 200
 201# information about snapshot formats that gitweb is capable of serving
 202our %known_snapshot_formats = (
 203        # name => {
 204        #       'display' => display name,
 205        #       'type' => mime type,
 206        #       'suffix' => filename suffix,
 207        #       'format' => --format for git-archive,
 208        #       'compressor' => [compressor command and arguments]
 209        #                       (array reference, optional)
 210        #       'disabled' => boolean (optional)}
 211        #
 212        'tgz' => {
 213                'display' => 'tar.gz',
 214                'type' => 'application/x-gzip',
 215                'suffix' => '.tar.gz',
 216                'format' => 'tar',
 217                'compressor' => ['gzip', '-n']},
 218
 219        'tbz2' => {
 220                'display' => 'tar.bz2',
 221                'type' => 'application/x-bzip2',
 222                'suffix' => '.tar.bz2',
 223                'format' => 'tar',
 224                'compressor' => ['bzip2']},
 225
 226        'txz' => {
 227                'display' => 'tar.xz',
 228                'type' => 'application/x-xz',
 229                'suffix' => '.tar.xz',
 230                'format' => 'tar',
 231                'compressor' => ['xz'],
 232                'disabled' => 1},
 233
 234        'zip' => {
 235                'display' => 'zip',
 236                'type' => 'application/x-zip',
 237                'suffix' => '.zip',
 238                'format' => 'zip'},
 239);
 240
 241# Aliases so we understand old gitweb.snapshot values in repository
 242# configuration.
 243our %known_snapshot_format_aliases = (
 244        'gzip'  => 'tgz',
 245        'bzip2' => 'tbz2',
 246        'xz'    => 'txz',
 247
 248        # backward compatibility: legacy gitweb config support
 249        'x-gzip' => undef, 'gz' => undef,
 250        'x-bzip2' => undef, 'bz2' => undef,
 251        'x-zip' => undef, '' => undef,
 252);
 253
 254# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 255# are changed, it may be appropriate to change these values too via
 256# $GITWEB_CONFIG.
 257our %avatar_size = (
 258        'default' => 16,
 259        'double'  => 32
 260);
 261
# Used to set the maximum load that we will still respond to gitweb queries.
# If the server load exceeds this value then return "503 server busy" error.
# If gitweb cannot determine the server load, it is taken to be 0.
# Leave it undefined (or set to 'undef') to turn off load checking.
 266our $maxload = 300;
 267
 268# configuration for 'highlight' (http://www.andre-simon.de/)
 269# match by basename
 270our %highlight_basename = (
 271        #'Program' => 'py',
 272        #'Library' => 'py',
 273        'SConstruct' => 'py', # SCons equivalent of Makefile
 274        'Makefile' => 'make',
 275);
 276# match by extension
 277our %highlight_ext = (
 278        # main extensions, defining name of syntax;
 279        # see files in /usr/share/highlight/langDefs/ directory
 280        (map { $_ => $_ } qw(py rb java css js tex bib xml awk bat ini spec tcl sql)),
 281        # alternate extensions, see /etc/highlight/filetypes.conf
 282        (map { $_ => 'c'   } qw(c h)),
 283        (map { $_ => 'sh'  } qw(sh bash zsh ksh)),
 284        (map { $_ => 'cpp' } qw(cpp cxx c++ cc)),
 285        (map { $_ => 'php' } qw(php php3 php4 php5 phps)),
 286        (map { $_ => 'pl'  } qw(pl perl pm)), # perhaps also 'cgi'
 287        (map { $_ => 'make'} qw(make mak mk)),
 288        (map { $_ => 'xml' } qw(xml xhtml html htm)),
 289);
 290
 291# You define site-wide feature defaults here; override them with
 292# $GITWEB_CONFIG as necessary.
 293our %feature = (
 294        # feature => {
 295        #       'sub' => feature-sub (subroutine),
 296        #       'override' => allow-override (boolean),
 297        #       'default' => [ default options...] (array reference)}
 298        #
 299        # if feature is overridable (it means that allow-override has true value),
 300        # then feature-sub will be called with default options as parameters;
 301        # return value of feature-sub indicates if to enable specified feature
 302        #
 303        # if there is no 'sub' key (no feature-sub), then feature cannot be
 304        # overridden
 305        #
 306        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 307        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 308        # is enabled
 309
 310        # Enable the 'blame' blob view, showing the last commit that modified
 311        # each line in the file. This can be very CPU-intensive.
 312
 313        # To enable system wide have in $GITWEB_CONFIG
 314        # $feature{'blame'}{'default'} = [1];
 315        # To have project specific config enable override in $GITWEB_CONFIG
 316        # $feature{'blame'}{'override'} = 1;
 317        # and in project config gitweb.blame = 0|1;
 318        'blame' => {
 319                'sub' => sub { feature_bool('blame', @_) },
 320                'override' => 0,
 321                'default' => [0]},
 322
 323        # Enable the 'snapshot' link, providing a compressed archive of any
 324        # tree. This can potentially generate high traffic if you have large
 325        # project.
 326
 327        # Value is a list of formats defined in %known_snapshot_formats that
 328        # you wish to offer.
 329        # To disable system wide have in $GITWEB_CONFIG
 330        # $feature{'snapshot'}{'default'} = [];
 331        # To have project specific config enable override in $GITWEB_CONFIG
 332        # $feature{'snapshot'}{'override'} = 1;
 333        # and in project config, a comma-separated list of formats or "none"
 334        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 335        'snapshot' => {
 336                'sub' => \&feature_snapshot,
 337                'override' => 0,
 338                'default' => ['tgz']},
 339
 340        # Enable text search, which will list the commits which match author,
 341        # committer or commit text to a given string.  Enabled by default.
 342        # Project specific override is not supported.
 343        #
 344        # Note that this controls all search features, which means that if
 345        # it is disabled, then 'grep' and 'pickaxe' search would also be
 346        # disabled.
 347        'search' => {
 348                'override' => 0,
 349                'default' => [1]},
 350
 351        # Enable grep search, which will list the files in currently selected
 352        # tree containing the given string. Enabled by default. This can be
 353        # potentially CPU-intensive, of course.
 354        # Note that you need to have 'search' feature enabled too.
 355
 356        # To enable system wide have in $GITWEB_CONFIG
 357        # $feature{'grep'}{'default'} = [1];
 358        # To have project specific config enable override in $GITWEB_CONFIG
 359        # $feature{'grep'}{'override'} = 1;
 360        # and in project config gitweb.grep = 0|1;
 361        'grep' => {
 362                'sub' => sub { feature_bool('grep', @_) },
 363                'override' => 0,
 364                'default' => [1]},
 365
 366        # Enable the pickaxe search, which will list the commits that modified
 367        # a given string in a file. This can be practical and quite faster
 368        # alternative to 'blame', but still potentially CPU-intensive.
 369        # Note that you need to have 'search' feature enabled too.
 370
 371        # To enable system wide have in $GITWEB_CONFIG
 372        # $feature{'pickaxe'}{'default'} = [1];
 373        # To have project specific config enable override in $GITWEB_CONFIG
 374        # $feature{'pickaxe'}{'override'} = 1;
 375        # and in project config gitweb.pickaxe = 0|1;
 376        'pickaxe' => {
 377                'sub' => sub { feature_bool('pickaxe', @_) },
 378                'override' => 0,
 379                'default' => [1]},
 380
 381        # Enable showing size of blobs in a 'tree' view, in a separate
 382        # column, similar to what 'ls -l' does.  This cost a bit of IO.
 383
 384        # To disable system wide have in $GITWEB_CONFIG
 385        # $feature{'show-sizes'}{'default'} = [0];
 386        # To have project specific config enable override in $GITWEB_CONFIG
 387        # $feature{'show-sizes'}{'override'} = 1;
 388        # and in project config gitweb.showsizes = 0|1;
 389        'show-sizes' => {
 390                'sub' => sub { feature_bool('showsizes', @_) },
 391                'override' => 0,
 392                'default' => [1]},
 393
 394        # Make gitweb use an alternative format of the URLs which can be
 395        # more readable and natural-looking: project name is embedded
 396        # directly in the path and the query string contains other
 397        # auxiliary information. All gitweb installations recognize
 398        # URL in either format; this configures in which formats gitweb
 399        # generates links.
 400
 401        # To enable system wide have in $GITWEB_CONFIG
 402        # $feature{'pathinfo'}{'default'} = [1];
 403        # Project specific override is not supported.
 404
 405        # Note that you will need to change the default location of CSS,
 406        # favicon, logo and possibly other files to an absolute URL. Also,
 407        # if gitweb.cgi serves as your indexfile, you will need to force
 408        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 409        'pathinfo' => {
 410                'override' => 0,
 411                'default' => [0]},
 412
 413        # Make gitweb consider projects in project root subdirectories
 414        # to be forks of existing projects. Given project $projname.git,
 415        # projects matching $projname/*.git will not be shown in the main
 416        # projects list, instead a '+' mark will be added to $projname
 417        # there and a 'forks' view will be enabled for the project, listing
 418        # all the forks. If project list is taken from a file, forks have
 419        # to be listed after the main project.
 420
 421        # To enable system wide have in $GITWEB_CONFIG
 422        # $feature{'forks'}{'default'} = [1];
 423        # Project specific override is not supported.
 424        'forks' => {
 425                'override' => 0,
 426                'default' => [0]},
 427
 428        # Insert custom links to the action bar of all project pages.
 429        # This enables you mainly to link to third-party scripts integrating
 430        # into gitweb; e.g. git-browser for graphical history representation
 431        # or custom web-based repository administration interface.
 432
 433        # The 'default' value consists of a list of triplets in the form
 434        # (label, link, position) where position is the label after which
 435        # to insert the link and link is a format string where %n expands
 436        # to the project name, %f to the project path within the filesystem,
 437        # %h to the current hash (h gitweb parameter) and %b to the current
 438        # hash base (hb gitweb parameter); %% expands to %.
 439
 440        # To enable system wide have in $GITWEB_CONFIG e.g.
 441        # $feature{'actions'}{'default'} = [('graphiclog',
 442        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 443        # Project specific override is not supported.
 444        'actions' => {
 445                'override' => 0,
 446                'default' => []},
 447
 448        # Allow gitweb scan project content tags of project repository,
 449        # and display the popular Web 2.0-ish "tag cloud" near the projects
 450        # list.  Note that this is something COMPLETELY different from the
 451        # normal Git tags.
 452
 453        # gitweb by itself can show existing tags, but it does not handle
 454        # tagging itself; you need to do it externally, outside gitweb.
 455        # The format is described in git_get_project_ctags() subroutine.
 456        # You may want to install the HTML::TagCloud Perl module to get
 457        # a pretty tag cloud instead of just a list of tags.
 458
 459        # To enable system wide have in $GITWEB_CONFIG
 460        # $feature{'ctags'}{'default'} = [1];
 461        # Project specific override is not supported.
 462
 463        # In the future whether ctags editing is enabled might depend
 464        # on the value, but using 1 should always mean no editing of ctags.
 465        'ctags' => {
 466                'override' => 0,
 467                'default' => [0]},
 468
 469        # The maximum number of patches in a patchset generated in patch
 470        # view. Set this to 0 or undef to disable patch view, or to a
 471        # negative number to remove any limit.
 472
 473        # To disable system wide have in $GITWEB_CONFIG
 474        # $feature{'patches'}{'default'} = [0];
 475        # To have project specific config enable override in $GITWEB_CONFIG
 476        # $feature{'patches'}{'override'} = 1;
 477        # and in project config gitweb.patches = 0|n;
 478        # where n is the maximum number of patches allowed in a patchset.
 479        'patches' => {
 480                'sub' => \&feature_patches,
 481                'override' => 0,
 482                'default' => [16]},
 483
 484        # Avatar support. When this feature is enabled, views such as
 485        # shortlog or commit will display an avatar associated with
 486        # the email of the committer(s) and/or author(s).
 487
 488        # Currently available providers are gravatar and picon.
 489        # If an unknown provider is specified, the feature is disabled.
 490
 491        # Gravatar depends on Digest::MD5.
 492        # Picon currently relies on the indiana.edu database.
 493
 494        # To enable system wide have in $GITWEB_CONFIG
 495        # $feature{'avatar'}{'default'} = ['<provider>'];
 496        # where <provider> is either gravatar or picon.
 497        # To have project specific config enable override in $GITWEB_CONFIG
 498        # $feature{'avatar'}{'override'} = 1;
 499        # and in project config gitweb.avatar = <provider>;
 500        'avatar' => {
 501                'sub' => \&feature_avatar,
 502                'override' => 0,
 503                'default' => ['']},
 504
 505        # Enable displaying how much time and how many git commands
 506        # it took to generate and display page.  Disabled by default.
 507        # Project specific override is not supported.
 508        'timed' => {
 509                'override' => 0,
 510                'default' => [0]},
 511
 512        # Enable turning some links into links to actions which require
 513        # JavaScript to run (like 'blame_incremental').  Not enabled by
 514        # default.  Project specific override is currently not supported.
 515        'javascript-actions' => {
 516                'override' => 0,
 517                'default' => [0]},
 518
 519        # Enable and configure ability to change common timezone for dates
 520        # in gitweb output via JavaScript.  Enabled by default.
 521        # Project specific override is not supported.
 522        'javascript-timezone' => {
 523                'override' => 0,
 524                'default' => [
 525                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 526                                     # or undef to turn off this feature
 527                        'gitweb_tz', # name of cookie where to store selected timezone
 528                        'datetime',  # CSS class used to mark up dates for manipulation
 529                ]},
 530
 531        # Syntax highlighting support. This is based on Daniel Svensson's
 532        # and Sham Chukoury's work in gitweb-xmms2.git.
 533        # It requires the 'highlight' program present in $PATH,
 534        # and therefore is disabled by default.
 535
 536        # To enable system wide have in $GITWEB_CONFIG
 537        # $feature{'highlight'}{'default'} = [1];
 538
 539        'highlight' => {
 540                'sub' => sub { feature_bool('highlight', @_) },
 541                'override' => 0,
 542                'default' => [0]},
 543
 544        # Enable displaying of remote heads in the heads list
 545
 546        # To enable system wide have in $GITWEB_CONFIG
 547        # $feature{'remote_heads'}{'default'} = [1];
 548        # To have project specific config enable override in $GITWEB_CONFIG
 549        # $feature{'remote_heads'}{'override'} = 1;
 550        # and in project config gitweb.remoteheads = 0|1;
 551        'remote_heads' => {
 552                'sub' => sub { feature_bool('remote_heads', @_) },
 553                'override' => 0,
 554                'default' => [0]},
 555
 556        # Enable showing branches under other refs in addition to heads
 557
 558        # To set system wide extra branch refs have in $GITWEB_CONFIG
 559        # $feature{'extra-branch-refs'}{'default'} = ['dirs', 'of', 'choice'];
 560        # To have project specific config enable override in $GITWEB_CONFIG
 561        # $feature{'extra-branch-refs'}{'override'} = 1;
 562        # and in project config gitweb.extrabranchrefs = dirs of choice
 563        # Every directory is separated with whitespace.
 564
 565        'extra-branch-refs' => {
 566                'sub' => \&feature_extra_branch_refs,
 567                'override' => 0,
 568                'default' => []},
 569);
 570
 571sub gitweb_get_feature {
 572        my ($name) = @_;
 573        return unless exists $feature{$name};
 574        my ($sub, $override, @defaults) = (
 575                $feature{$name}{'sub'},
 576                $feature{$name}{'override'},
 577                @{$feature{$name}{'default'}});
 578        # project specific override is possible only if we have project
 579        our $git_dir; # global variable, declared later
 580        if (!$override || !defined $git_dir) {
 581                return @defaults;
 582        }
 583        if (!defined $sub) {
 584                warn "feature $name is not overridable";
 585                return @defaults;
 586        }
 587        return $sub->(@defaults);
 588}
 589
 590# A wrapper to check if a given feature is enabled.
 591# With this, you can say
 592#
 593#   my $bool_feat = gitweb_check_feature('bool_feat');
 594#   gitweb_check_feature('bool_feat') or somecode;
 595#
 596# instead of
 597#
 598#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 599#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 600#
 601sub gitweb_check_feature {
 602        return (gitweb_get_feature(@_))[0];
 603}
 604
 605
 606sub feature_bool {
 607        my $key = shift;
 608        my ($val) = git_get_project_config($key, '--bool');
 609
 610        if (!defined $val) {
 611                return ($_[0]);
 612        } elsif ($val eq 'true') {
 613                return (1);
 614        } elsif ($val eq 'false') {
 615                return (0);
 616        }
 617}
 618
 619sub feature_snapshot {
 620        my (@fmts) = @_;
 621
 622        my ($val) = git_get_project_config('snapshot');
 623
 624        if ($val) {
 625                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 626        }
 627
 628        return @fmts;
 629}
 630
 631sub feature_patches {
 632        my @val = (git_get_project_config('patches', '--int'));
 633
 634        if (@val) {
 635                return @val;
 636        }
 637
 638        return ($_[0]);
 639}
 640
 641sub feature_avatar {
 642        my @val = (git_get_project_config('avatar'));
 643
 644        return @val ? @val : @_;
 645}
 646
 647sub feature_extra_branch_refs {
 648        my (@branch_refs) = @_;
 649        my $values = git_get_project_config('extrabranchrefs');
 650
 651        if ($values) {
 652                $values = config_to_multi ($values);
 653                @branch_refs = ();
 654                foreach my $value (@{$values}) {
 655                        push @branch_refs, split /\s+/, $value;
 656                }
 657        }
 658
 659        return @branch_refs;
 660}
 661
 662# checking HEAD file with -e is fragile if the repository was
 663# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 664# and then pruned.
 665sub check_head_link {
 666        my ($dir) = @_;
 667        my $headfile = "$dir/HEAD";
 668        return ((-e $headfile) ||
 669                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 670}
 671
 672sub check_export_ok {
 673        my ($dir) = @_;
 674        return (check_head_link($dir) &&
 675                (!$export_ok || -e "$dir/$export_ok") &&
 676                (!$export_auth_hook || $export_auth_hook->($dir)));
 677}
 678
 679# process alternate names for backward compatibility
 680# filter out unsupported (unknown) snapshot formats
 681sub filter_snapshot_fmts {
 682        my @fmts = @_;
 683
 684        @fmts = map {
 685                exists $known_snapshot_format_aliases{$_} ?
 686                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 687        @fmts = grep {
 688                exists $known_snapshot_formats{$_} &&
 689                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 690}
 691
 692sub filter_and_validate_refs {
 693        my @refs = @_;
 694        my %unique_refs = ();
 695
 696        foreach my $ref (@refs) {
 697                die_error(500, "Invalid ref '$ref' in 'extra-branch-refs' feature") unless (is_valid_ref_format($ref));
 698                # 'heads' are added implicitly in get_branch_refs().
 699                $unique_refs{$ref} = 1 if ($ref ne 'heads');
 700        }
 701        return sort keys %unique_refs;
 702}
 703
# If it is set to a code reference, that code is run once per request,
# allowing updating configurations that change with each request,
# while running other code in config file only once.
#
# Otherwise, if it is false then gitweb would process config file only once;
# if it is true then gitweb config would be run for each request.
 710our $per_request_config = 1;
 711
 712# read and parse gitweb config file given by its parameter.
 713# returns true on success, false on recoverable error, allowing
 714# to chain this subroutine, using first file that exists.
 715# dies on errors during parsing config file, as it is unrecoverable.
 716sub read_config_file {
 717        my $filename = shift;
 718        return unless defined $filename;
 719        # die if there are errors parsing config file
 720        if (-e $filename) {
 721                do $filename;
 722                die $@ if $@;
 723                return 1;
 724        }
 725        return;
 726}
 727
 728our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
 729sub evaluate_gitweb_config {
 730        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 731        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 732        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
 733
 734        # Protect against duplications of file names, to not read config twice.
 735        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
 736        # there possibility of duplication of filename there doesn't matter.
 737        $GITWEB_CONFIG = ""        if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
 738        $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
 739
 740        # Common system-wide settings for convenience.
 741        # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
 742        read_config_file($GITWEB_CONFIG_COMMON);
 743
 744        # Use first config file that exists.  This means use the per-instance
 745        # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
 746        read_config_file($GITWEB_CONFIG) and return;
 747        read_config_file($GITWEB_CONFIG_SYSTEM);
 748}
 749
 750# Get loadavg of system, to compare against $maxload.
 751# Currently it requires '/proc/loadavg' present to get loadavg;
 752# if it is not present it returns 0, which means no load checking.
 753sub get_loadavg {
 754        if( -e '/proc/loadavg' ){
 755                open my $fd, '<', '/proc/loadavg'
 756                        or return 0;
 757                my @load = split(/\s+/, scalar <$fd>);
 758                close $fd;
 759
 760                # The first three columns measure CPU and IO utilization of the last one,
 761                # five, and 10 minute periods.  The fourth column shows the number of
 762                # currently running processes and the total number of processes in the m/n
 763                # format.  The last column displays the last process ID used.
 764                return $load[0] || 0;
 765        }
 766        # additional checks for load average should go here for things that don't export
 767        # /proc/loadavg
 768
 769        return 0;
 770}
 771
 772# version of the core git binary
 773our $git_version;
 774sub evaluate_git_version {
 775        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 776        $number_of_git_cmds++;
 777}
 778
 779sub check_loadavg {
 780        if (defined $maxload && get_loadavg() > $maxload) {
 781                die_error(503, "The load average on the server is too high");
 782        }
 783}
 784
 785# ======================================================================
 786# input validation and dispatch
 787
 788# input parameters can be collected from a variety of sources (presently, CGI
 789# and PATH_INFO), so we define an %input_params hash that collects them all
 790# together during validation: this allows subsequent uses (e.g. href()) to be
 791# agnostic of the parameter origin
 792
 793our %input_params = ();
 794
 795# input parameters are stored with the long parameter name as key. This will
 796# also be used in the href subroutine to convert parameters to their CGI
 797# equivalent, and since the href() usage is the most frequent one, we store
 798# the name -> CGI key mapping here, instead of the reverse.
 799#
 800# XXX: Warning: If you touch this, check the search form for updating,
 801# too.
 802
 803our @cgi_param_mapping = (
 804        project => "p",
 805        action => "a",
 806        file_name => "f",
 807        file_parent => "fp",
 808        hash => "h",
 809        hash_parent => "hp",
 810        hash_base => "hb",
 811        hash_parent_base => "hpb",
 812        page => "pg",
 813        order => "o",
 814        searchtext => "s",
 815        searchtype => "st",
 816        snapshot_format => "sf",
 817        extra_options => "opt",
 818        search_use_regexp => "sr",
 819        ctag => "by_tag",
 820        diff_style => "ds",
 821        project_filter => "pf",
 822        # this must be last entry (for manipulation from JavaScript)
 823        javascript => "js"
 824);
 825our %cgi_param_mapping = @cgi_param_mapping;
 826
 827# we will also need to know the possible actions, for validation
 828our %actions = (
 829        "blame" => \&git_blame,
 830        "blame_incremental" => \&git_blame_incremental,
 831        "blame_data" => \&git_blame_data,
 832        "blobdiff" => \&git_blobdiff,
 833        "blobdiff_plain" => \&git_blobdiff_plain,
 834        "blob" => \&git_blob,
 835        "blob_plain" => \&git_blob_plain,
 836        "commitdiff" => \&git_commitdiff,
 837        "commitdiff_plain" => \&git_commitdiff_plain,
 838        "commit" => \&git_commit,
 839        "forks" => \&git_forks,
 840        "heads" => \&git_heads,
 841        "history" => \&git_history,
 842        "log" => \&git_log,
 843        "patch" => \&git_patch,
 844        "patches" => \&git_patches,
 845        "remotes" => \&git_remotes,
 846        "rss" => \&git_rss,
 847        "atom" => \&git_atom,
 848        "search" => \&git_search,
 849        "search_help" => \&git_search_help,
 850        "shortlog" => \&git_shortlog,
 851        "summary" => \&git_summary,
 852        "tag" => \&git_tag,
 853        "tags" => \&git_tags,
 854        "tree" => \&git_tree,
 855        "snapshot" => \&git_snapshot,
 856        "object" => \&git_object,
 857        # those below don't need $project
 858        "opml" => \&git_opml,
 859        "project_list" => \&git_project_list,
 860        "project_index" => \&git_project_index,
 861);
 862
 863# finally, we have the hash of allowed extra_options for the commands that
 864# allow them
 865our %allowed_options = (
 866        "--no-merges" => [ qw(rss atom log shortlog history) ],
 867);
 868
 869# fill %input_params with the CGI parameters. All values except for 'opt'
 870# should be single values, but opt can be an array. We should probably
 871# build an array of parameters that can be multi-valued, but since for the time
 872# being it's only this one, we just single it out
 873sub evaluate_query_params {
 874        our $cgi;
 875
 876        while (my ($name, $symbol) = each %cgi_param_mapping) {
 877                if ($symbol eq 'opt') {
 878                        $input_params{$name} = [ map { decode_utf8($_) } $cgi->multi_param($symbol) ];
 879                } else {
 880                        $input_params{$name} = decode_utf8($cgi->param($symbol));
 881                }
 882        }
 883}
 884
 885# now read PATH_INFO and update the parameter list for missing parameters
 886sub evaluate_path_info {
 887        return if defined $input_params{'project'};
 888        return if !$path_info;
 889        $path_info =~ s,^/+,,;
 890        return if !$path_info;
 891
 892        # find which part of PATH_INFO is project
 893        my $project = $path_info;
 894        $project =~ s,/+$,,;
 895        while ($project && !check_head_link("$projectroot/$project")) {
 896                $project =~ s,/*[^/]*$,,;
 897        }
 898        return unless $project;
 899        $input_params{'project'} = $project;
 900
 901        # do not change any parameters if an action is given using the query string
 902        return if $input_params{'action'};
 903        $path_info =~ s,^\Q$project\E/*,,;
 904
 905        # next, check if we have an action
 906        my $action = $path_info;
 907        $action =~ s,/.*$,,;
 908        if (exists $actions{$action}) {
 909                $path_info =~ s,^$action/*,,;
 910                $input_params{'action'} = $action;
 911        }
 912
 913        # list of actions that want hash_base instead of hash, but can have no
 914        # pathname (f) parameter
 915        my @wants_base = (
 916                'tree',
 917                'history',
 918        );
 919
 920        # we want to catch, among others
 921        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 922        my ($parentrefname, $parentpathname, $refname, $pathname) =
 923                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 924
 925        # first, analyze the 'current' part
 926        if (defined $pathname) {
 927                # we got "branch:filename" or "branch:dir/"
 928                # we could use git_get_type(branch:pathname), but:
 929                # - it needs $git_dir
 930                # - it does a git() call
 931                # - the convention of terminating directories with a slash
 932                #   makes it superfluous
 933                # - embedding the action in the PATH_INFO would make it even
 934                #   more superfluous
 935                $pathname =~ s,^/+,,;
 936                if (!$pathname || substr($pathname, -1) eq "/") {
 937                        $input_params{'action'} ||= "tree";
 938                        $pathname =~ s,/$,,;
 939                } else {
 940                        # the default action depends on whether we had parent info
 941                        # or not
 942                        if ($parentrefname) {
 943                                $input_params{'action'} ||= "blobdiff_plain";
 944                        } else {
 945                                $input_params{'action'} ||= "blob_plain";
 946                        }
 947                }
 948                $input_params{'hash_base'} ||= $refname;
 949                $input_params{'file_name'} ||= $pathname;
 950        } elsif (defined $refname) {
 951                # we got "branch". In this case we have to choose if we have to
 952                # set hash or hash_base.
 953                #
 954                # Most of the actions without a pathname only want hash to be
 955                # set, except for the ones specified in @wants_base that want
 956                # hash_base instead. It should also be noted that hand-crafted
 957                # links having 'history' as an action and no pathname or hash
 958                # set will fail, but that happens regardless of PATH_INFO.
 959                if (defined $parentrefname) {
 960                        # if there is parent let the default be 'shortlog' action
 961                        # (for http://git.example.com/repo.git/A..B links); if there
 962                        # is no parent, dispatch will detect type of object and set
 963                        # action appropriately if required (if action is not set)
 964                        $input_params{'action'} ||= "shortlog";
 965                }
 966                if ($input_params{'action'} &&
 967                    grep { $_ eq $input_params{'action'} } @wants_base) {
 968                        $input_params{'hash_base'} ||= $refname;
 969                } else {
 970                        $input_params{'hash'} ||= $refname;
 971                }
 972        }
 973
 974        # next, handle the 'parent' part, if present
 975        if (defined $parentrefname) {
 976                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 977                # someproject/blobdiff/oldrev..newrev:/filename
 978                if ($parentpathname) {
 979                        $parentpathname =~ s,^/+,,;
 980                        $parentpathname =~ s,/$,,;
 981                        $input_params{'file_parent'} ||= $parentpathname;
 982                } else {
 983                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 984                }
 985                # we assume that hash_parent_base is wanted if a path was specified,
 986                # or if the action wants hash_base instead of hash
 987                if (defined $input_params{'file_parent'} ||
 988                        grep { $_ eq $input_params{'action'} } @wants_base) {
 989                        $input_params{'hash_parent_base'} ||= $parentrefname;
 990                } else {
 991                        $input_params{'hash_parent'} ||= $parentrefname;
 992                }
 993        }
 994
 995        # for the snapshot action, we allow URLs in the form
 996        # $project/snapshot/$hash.ext
 997        # where .ext determines the snapshot and gets removed from the
 998        # passed $refname to provide the $hash.
 999        #
1000        # To be able to tell that $refname includes the format extension, we
1001        # require the following two conditions to be satisfied:
1002        # - the hash input parameter MUST have been set from the $refname part
1003        #   of the URL (i.e. they must be equal)
1004        # - the snapshot format MUST NOT have been defined already (e.g. from
1005        #   CGI parameter sf)
1006        # It's also useless to try any matching unless $refname has a dot,
1007        # so we check for that too
1008        if (defined $input_params{'action'} &&
1009                $input_params{'action'} eq 'snapshot' &&
1010                defined $refname && index($refname, '.') != -1 &&
1011                $refname eq $input_params{'hash'} &&
1012                !defined $input_params{'snapshot_format'}) {
1013                # We loop over the known snapshot formats, checking for
1014                # extensions. Allowed extensions are both the defined suffix
1015                # (which includes the initial dot already) and the snapshot
1016                # format key itself, with a prepended dot
1017                while (my ($fmt, $opt) = each %known_snapshot_formats) {
1018                        my $hash = $refname;
1019                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
1020                                next;
1021                        }
1022                        my $sfx = $1;
1023                        # a valid suffix was found, so set the snapshot format
1024                        # and reset the hash parameter
1025                        $input_params{'snapshot_format'} = $fmt;
1026                        $input_params{'hash'} = $hash;
1027                        # we also set the format suffix to the one requested
1028                        # in the URL: this way a request for e.g. .tgz returns
1029                        # a .tgz instead of a .tar.gz
1030                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
1031                        last;
1032                }
1033        }
1034}
1035
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp, $project_filter);
# Copy the collected %input_params into the global parameter variables,
# validating each one; an invalid value ends the request via die_error().
# Also derives $search_regexp from $searchtext: the text itself when regexp
# search was requested (after checking that it compiles), otherwise the
# text with all metacharacters quoted.
sub evaluate_and_validate_params {
        our $action = $input_params{'action'};
        if (defined $action) {
                if (!is_valid_action($action)) {
                        die_error(400, "Invalid action parameter");
                }
        }

        # parameters which are pathnames
        our $project = $input_params{'project'};
        if (defined $project) {
                if (!is_valid_project($project)) {
                        # do not leave an invalid project name in the global
                        undef $project;
                        die_error(404, "No such project");
                }
        }

        our $project_filter = $input_params{'project_filter'};
        if (defined $project_filter) {
                if (!is_valid_pathname($project_filter)) {
                        die_error(404, "Invalid project_filter parameter");
                }
        }

        our $file_name = $input_params{'file_name'};
        if (defined $file_name) {
                if (!is_valid_pathname($file_name)) {
                        die_error(400, "Invalid file parameter");
                }
        }

        our $file_parent = $input_params{'file_parent'};
        if (defined $file_parent) {
                if (!is_valid_pathname($file_parent)) {
                        die_error(400, "Invalid file parent parameter");
                }
        }

        # parameters which are refnames
        our $hash = $input_params{'hash'};
        if (defined $hash) {
                if (!is_valid_refname($hash)) {
                        die_error(400, "Invalid hash parameter");
                }
        }

        our $hash_parent = $input_params{'hash_parent'};
        if (defined $hash_parent) {
                if (!is_valid_refname($hash_parent)) {
                        die_error(400, "Invalid hash parent parameter");
                }
        }

        our $hash_base = $input_params{'hash_base'};
        if (defined $hash_base) {
                if (!is_valid_refname($hash_base)) {
                        die_error(400, "Invalid hash base parameter");
                }
        }

        # extra_options can (currently) only be set from CGI, where
        # evaluate_query_params() always stores an array reference (empty if
        # the parameter is not set); fall back to an empty list anyway, so
        # that a missing value cannot turn into a dereference error
        our @extra_options = @{ $input_params{'extra_options'} || [] };
        foreach my $opt (@extra_options) {
                if (not exists $allowed_options{$opt}) {
                        die_error(400, "Invalid option parameter");
                }
                # compare as plain strings: $action may be undefined here, and
                # it must not be interpreted as a regular expression
                my $allowed_for_action = defined $action &&
                        grep { $_ eq $action } @{$allowed_options{$opt}};
                if (!$allowed_for_action) {
                        die_error(400, "Invalid option parameter for this action");
                }
        }

        our $hash_parent_base = $input_params{'hash_parent_base'};
        if (defined $hash_parent_base) {
                if (!is_valid_refname($hash_parent_base)) {
                        die_error(400, "Invalid hash parent base parameter");
                }
        }

        # other parameters
        our $page = $input_params{'page'};
        if (defined $page) {
                if ($page =~ m/[^0-9]/) {
                        die_error(400, "Invalid page parameter");
                }
        }

        our $searchtype = $input_params{'searchtype'};
        if (defined $searchtype) {
                if ($searchtype =~ m/[^a-z]/) {
                        die_error(400, "Invalid searchtype parameter");
                }
        }

        our $search_use_regexp = $input_params{'search_use_regexp'};

        our $searchtext = $input_params{'searchtext'};
        our $search_regexp = undef;
        if (defined $searchtext) {
                if (length($searchtext) < 2) {
                        die_error(403, "At least two characters are required for search parameter");
                }
                if ($search_use_regexp) {
                        $search_regexp = $searchtext;
                        # make sure that the user-supplied regexp compiles
                        if (!eval { qr/$search_regexp/; 1; }) {
                                # strip the "at FILE line N" location from the message
                                (my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
                                die_error(400, "Invalid search regexp '$search_regexp'",
                                          esc_html($error));
                        }
                } else {
                        $search_regexp = quotemeta $searchtext;
                }
        }
}
1154
# path to the current git repository
our $git_dir;
# Point $git_dir at the requested project below $projectroot; it is left
# untouched when no project was requested.
sub evaluate_git_dir {
        our $git_dir;
        $git_dir = "$projectroot/$project" if $project;
}
1160
our (@snapshot_fmts, $git_avatar, @extra_branch_refs);
# Evaluate the 'snapshot', 'avatar' and 'extra-branch-refs' features and
# store the filtered/validated results in the globals declared above.
sub configure_gitweb_features {
        our (@snapshot_fmts, $git_avatar, @extra_branch_refs);

        # list of supported snapshot formats
        @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # are satisfied; otherwise $git_avatar is reset to the empty string.
        # 'gravatar' needs Digest::MD5, 'picon' has no dependencies.
        ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'gravatar') {
                eval { require Digest::MD5; 1; }
                        or $git_avatar = '';
        } elsif ($git_avatar ne 'picon') {
                $git_avatar = '';
        }

        @extra_branch_refs = gitweb_get_feature('extra-branch-refs');
        @extra_branch_refs = filter_and_validate_refs (@extra_branch_refs);
}
1183
# List of ref namespaces treated as branches: 'heads' first, followed by
# the configured @extra_branch_refs.
sub get_branch_refs {
        return 'heads', @extra_branch_refs;
}
1187
# custom error handler: 'die <message>' is Internal Server Error
#
# Registered below with set_message(); receives the error message, which
# is already HTML escaped.
sub handle_errors_html {
        my ($escaped_msg) = @_;

        # Switch back to the default handler (with a plain message) before
        # doing anything else: should an error occur inside die_error, this
        # handler must not be entered again, or it would loop forever.
        set_message("Error occurred when inside die_error:\n$escaped_msg");

        # You cannot jump out of die_error when it is called as error handler.
        # The subroutine set via CGI::Carp::set_message is called _after_
        # HTTP headers are already written, so it cannot write them itself.
        die_error(undef, undef, $escaped_msg,
                  -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1202
# dispatch
#
# Pick a default action when none was requested, check that the action is
# known and has the project it needs, then run its handler from %actions.
sub dispatch {
        unless (defined $action) {
                # no explicit action: derive it from the other parameters
                if (defined $hash) {
                        $action = git_get_type($hash)
                                or die_error(404, "Object does not exist");
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name")
                                or die_error(404, "File or directory does not exist");
                } elsif (defined $project) {
                        $action = 'summary';
                } else {
                        $action = 'project_list';
                }
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # only these actions can run without a project
        my $works_without_project =
                $action =~ m/^(?:opml|project_list|project_index)$/;
        die_error(400, "Project needed")
                unless $works_without_project || $project;

        $actions{$action}->();
}
1227
# Restart the per-request statistics: the start time (only when timing is
# in use, i.e. $t0 is defined) and the count of git commands run.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1233
our $first_request = 1;
# Serve a single request: refresh the configuration as needed, collect and
# validate the input parameters, then dispatch to the requested action.
sub run_request {
        reset_timer();

        evaluate_uri();

        # the config file and the git version are always evaluated for the
        # first request
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }

        # later requests refresh the configuration according to
        # $per_request_config: a code reference is called on every request,
        # any other true value re-runs the config file
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }
        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1264
# by default every request is the last one
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
# name of the class used to create the request object
our $CGI = 'CGI';
our $cgi;
# Switch to FastCGI mode: load CGI::Fast, use it as the request class and
# stop serving requests after the 100th one.
sub configure_as_fcgi {
        require CGI::Fast;

        our ($CGI, $is_last_request);
        $CGI = 'CGI::Fast';

        # let each child service 100 requests
        my $requests_seen = 0;
        $is_last_request = sub {
                $requests_seen += 1;
                return $requests_seen > 100;
        };
}
# Decide how gitweb is run: FastCGI mode is enabled when the script name
# ends in '.fcgi' or when requested on the command line, and '--nproc'
# sets up hooks that use FCGI::ProcManager (if that module can be loaded).
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # handler for --nproc: install the process manager hooks
        my $use_proc_manager = sub {
                my ($arg, $val) = @_;
                return unless eval { require FCGI::ProcManager; 1; };

                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $val,
                });
                our ($pre_listen_hook, $pre_dispatch_hook, $post_dispatch_hook);
                $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1299
# Main loop: evaluate the command line, then serve requests (calling the
# optional hooks around each of them) until no new request object can be
# created or $is_last_request says that this was the last one.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                if ($is_last_request->()) {
                        last REQUEST;
                }
        }

 DONE_GITWEB:
        1;
}
1324
run();

# A pure CGI script serves a single request and exits here.  When the
# script is wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI), control goes back
# to the wrapper instead.
exit unless defined caller;
return;
1335
1336## ======================================================================
1337## action links
1338
# Build a gitweb URL from named parameters.
#
# Parameters are the long parameter names from @cgi_param_mapping (project,
# action, hash, ...), plus these extra options:
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# 'project' defaults to the current $project.  Returns the URL as a string.
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over every input parameter that was not given explicitly
                foreach my $name (keys %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot;
                # the action may be missing (e.g. for links to the summary)
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces.
                # The separating slash is needed when any of the hash parameters
                # is present; test for a non-empty value rather than for truth,
                # so that a ref named "0" gets its separator as well.
                my $has_hash_param = 0;
                foreach my $name (qw(hash_base hash_parent_base hash_parent hash)) {
                        my $value = $params{$name};
                        $has_hash_param = 1 if defined $value && length $value;
                }
                $href .= "/" if $has_hash_param;
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing '..' cannot go into PATH_INFO,
                                                # where '..' separates parent from current part
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly, in the order given by
        # @cgi_param_mapping
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                # multi-valued parameter: one key=value pair per value
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1468
1469
1470## ======================================================================
1471## validation, quoting/unquoting and escaping
1472
# Check whether $input names an action listed in %actions.
# Returns 1 for a known action, undef otherwise.
sub is_valid_action {
	my ($input) = @_;
	return exists($actions{$input}) ? 1 : undef;
}
1478
# Decide whether $input names a project that may be served.
# The checks run in order and stop at the first failure:
#   - the name is a clean pathname (see is_valid_pathname),
#   - "$projectroot/$input" is a directory,
#   - check_export_ok() accepts that directory,
#   - with $strict_export set, the project is in the projects list.
# Returns 1 when all checks pass, undef when one fails, and an empty
# return when $input itself is undefined.
sub is_valid_project {
	my ($input) = @_;

	return unless defined $input;

	my $dir = "$projectroot/$input";

	return undef unless is_valid_pathname($input);
	return undef unless -d $dir;
	return undef unless check_export_ok($dir);
	return undef if $strict_export && !project_in_list($input);

	return 1;
}
1492
# Validate a pathname coming from the outside.
# Rejected (undef): undefined input, any path element that is empty,
# '.' or '..' (at the start, at the end, or between slashes -- which
# also rules out doubled slashes), and any embedded NUL character.
# Returns 1 for everything else.
sub is_valid_pathname {
	my ($input) = @_;

	return undef unless defined $input;

	# empty, '.' or '..' path element anywhere in the path
	return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

	# no null characters
	return undef if $input =~ m!\0!;

	return 1;
}
1509
# Apply the ref name restrictions described by git-check-ref-format:
# no path element starting with '.', no '..', no control characters,
# space, '~', '^', ':', '?', '*' or '[', and no trailing slash.
# Returns 1 if $input passes, undef if it does not or is undefined.
sub is_valid_ref_format {
	my ($input) = @_;

	return undef unless defined $input;

	my $violates = ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!);
	return $violates ? undef : 1;
}
1520
# Validate something used as a ref name or object id.
# A string of exactly 40 hex digits is accepted outright; anything
# else must pass both is_valid_pathname() and is_valid_ref_format().
# Returns 1 on success, undef otherwise (including undefined input).
sub is_valid_refname {
	my ($input) = @_;

	return undef unless defined $input;

	# textual hashes are O.K.
	return 1 if $input =~ m/^[0-9a-fA-F]{40}$/;

	# must be a correct pathname and obey the ref format restrictions
	return undef unless is_valid_pathname($input);
	return undef unless is_valid_ref_format($input);

	return 1;
}
1535
# Turn a string of octets into Perl's internal character form.
# Strings already flagged as utf8, and octets that form valid UTF-8,
# are returned decoded as UTF-8; anything else is decoded using
# $fallback_encoding.  gitweb writes its output as UTF-8 thanks to the
# "binmode STDOUT, ':utf8'" at the beginning of the script.
# Returns undef for undefined input.
sub to_utf8 {
	my ($str) = @_;

	return undef unless defined $str;

	# already characters: nothing to do
	return $str if utf8::is_utf8($str);

	# utf8::decode() converts in place and reports whether it succeeded
	return $str if utf8::decode($str);

	# not valid UTF-8, so interpret the octets in the fallback encoding
	return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1549
# Escape a value for use as a query parameter (or fragment).
# Characters outside the safe set are percent-encoded via CGI::escape
# and spaces become '+'.  The slash is deliberately left alone, even
# though that is not strictly correct, because quoted slashes look
# too horrible in bookmarks.  Returns undef for undefined input.
sub esc_param {
	my ($str) = @_;

	return undef unless defined $str;

	$str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$str =~ tr/ /+/;

	return $str;
}
1559
# Escape a string for use inside the path_info part of a URL.
# The rules differ slightly from esc_param(): path_info does not treat
# '+' as a space, so both '+' and ' ' are kept literally, while '?'
# (among other unsafe characters) is percent-encoded via CGI::escape.
# Returns undef for undefined input.
sub esc_path_info {
	my ($path) = @_;

	return undef unless defined $path;

	$path =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

	return $path;
}
1570
# Escape unsafe characters in a complete URL.  Because the whole URL
# is processed, its structural characters (such as '/', '?', ';', ':',
# '@', '&' and '=') cannot be quoted and are left untouched; other
# unsafe characters are percent-encoded via CGI::escape and spaces
# become '+'.  Returns undef for undefined input.
sub esc_url {
	my ($url) = @_;

	return undef unless defined $url;

	$url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$url =~ tr/ /+/;

	return $url;
}
1579
# Quote unsafe characters for use in an HTML attribute value.
# For XHTML conformance escaping '"' to '&quot;' is not enough, so
# this simply delegates to esc_html() with the same arguments.
sub esc_attr {
	my ($str, @opts) = @_;

	return esc_html($str, @opts);
}
1586
# Escape a string for inclusion in HTML.
# The string is converted with to_utf8(), HTML-escaped through the CGI
# object, and every control character except TAB is replaced by its
# quot_cec() representation.
# Options (passed as a hash after the string):
#   -nbsp => true   turn each space into '&nbsp;'
# Returns undef for undefined input.
sub esc_html {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	my $chars = to_utf8($str);
	my $html  = $cgi->escapeHTML($chars);

	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};

	# tabs are kept as they are; other control characters are made visible
	$html =~ s|([[:cntrl:]])|(($1 eq "\t") ? $1 : quot_cec($1))|eg;

	return $html;
}
1602
# Escape a filename for inclusion in HTML.
# Works like esc_html(), except that every control character --
# TAB included -- is replaced by its quot_cec() representation.
# Options (passed as a hash after the string):
#   -nbsp => true   turn each space into '&nbsp;'
# Returns undef for undefined input.
sub esc_path {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	my $chars = to_utf8($str);
	my $html  = $cgi->escapeHTML($chars);

	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$html =~ s|([[:cntrl:]])|quot_cec($1)|eg;

	return $html;
}
1618
# Sanitize text for use in XHTML + application/xml+xhtml (valid XML 1.0).
# The string is converted with to_utf8(); TAB, LF and CR are kept,
# every other control character is replaced by its quot_cec() form.
# No HTML escaping is performed here.  Returns undef for undefined input.
sub sanitize {
	my ($str) = @_;

	return undef unless defined $str;

	my $text = to_utf8($str);
	$text =~ s{([[:cntrl:]])}{
		my $c = $1;
		($c eq "\t" || $c eq "\n" || $c eq "\r") ? $c : quot_cec($c);
	}eg;

	return $text;
}
1629
# Make a control character "printable", using character escape codes (CEC).
# Characters with a conventional C-style escape (\t, \n, \r, \f, \b, \a,
# \e, \v, \0) use it; any other character is shown as a backslash
# followed by its two-digit, zero-padded hexadecimal code.
# Options (passed as a hash after the character):
#   -nohtml => true   return the bare escape instead of wrapping it in
#                     <span class="cntrl">...</span>
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# %02x (zero padded), not %2x: codes below 0x10 would otherwise be
	# rendered with an embedded space, e.g. '\ 1' instead of '\01'
	my $chr = ( (exists $es{$cntrl})
	            ? $es{$cntrl}
	            : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1654
# Alternative to quot_cec(): represent a control character by its
# Unicode "control picture", the printable representation (PR), emitted
# as a decimal numeric character reference.
# Options (passed as a hash after the character):
#   -nohtml => true   return the bare reference instead of wrapping it
#                     in <span class="cntrl">...</span>
sub quot_upr {
	my $cntrl = shift;
	my %opts = @_;

	my $code = ord($cntrl);
	# The pictures for U+0000..U+001F sit at U+2400 + code, but the one
	# for DELETE (0x7f) is U+2421 (SYMBOL FOR DELETE), not U+247F.
	# Any other input keeps the plain offset arithmetic.
	my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

	my $chr = sprintf('&#%04d;', $picture);
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1668
# Helper for unquote(): decode the text that followed one backslash.
# One to three octal digits give the character with that code, a known
# C escape letter gives its control character, and any other character
# stands for itself (a quoted ordinary character).
sub unq {
	my ($seq) = @_;

	# octal char sequence
	return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

	my %es = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# C escape sequence if known, otherwise the character itself
	return exists $es{$seq} ? $es{$seq} : $seq;
}

# git may return quoted and escaped filenames.  A string enclosed in
# double quotes has the quotes removed and its backslash escapes
# decoded; any other string is returned unchanged.
sub unquote {
	my ($str) = @_;

	if ($str =~ m/^"(.*)"$/) {
		# needs unquoting
		my $inner = $1;
		$inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
		return $inner;
	}

	return $str;
}
1704
# Expand tabs to spaces, using tab stops every 8 columns.
# Tabs are processed left to right, so each expansion already sees the
# columns produced by the expansions before it.
sub untabify {
	my ($line) = @_;

	for (my $tab = index($line, "\t");
	     $tab != -1;
	     $tab = index($line, "\t")) {
		# distance to the next tab stop is always between 1 and 8
		substr($line, $tab, 1, ' ' x (8 - ($tab % 8)));
	}

	return $line;
}
1718
# Count the entries returned by git_get_projects_list() whose 'path'
# equals $project.  The result is 0 (false) when the list is empty or
# has no such entry, and a positive count otherwise.
sub project_in_list {
	my ($project) = @_;

	my @projects = git_get_projects_list();
	my $hits = grep { $_->{'path'} eq $project } @projects;

	return $hits;
}
1724
1725## ----------------------------------------------------------------------
1726## HTML aware string manipulation
1727
# Shorten a string, preferably on a word boundary.
#
# chop_str($str, $len, $add_len, $where)
#   $len      number of characters to keep
#   $add_len  extra word characters allowed so that a word is not cut
#             (defaults to 10)
#   $where    which part is replaced by the filler: 'left', 'center'
#             or 'right' (the default)
#
# The string is chopped on a word boundary between $len and
# $len+$add_len if there is one, otherwise at $len+$add_len.  The
# removed part is replaced by a filler (" ...", " ... " or "... "), but
# only if it is longer than the filler; the string is returned
# unchanged when chopping would not make it shorter.
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right'; # 'left' | 'center' | 'right'

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# return early if chopping wouldn't make the string shorter;
	# the filler is 5 characters long in the middle, 4 at either end
	my $centered   = ($where eq 'center');
	my $filler_len = $centered ? 5 : 4;
	return $str if ($len + $filler_len >= length($str));

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if $centered;

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	if ($where eq 'left') {
		$str =~ m/^(.*?)($begre)$/;
		my ($lead, $body) = ($1, $2);
		$lead = " ..." if length($lead) > 4;
		return "$lead$body";
	}

	if ($centered) {
		$str =~ m/^($endre)(.*)$/;
		my ($left, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($mid, $right) = ($1, $2);
		$mid = " ... " if length($mid) > 5;
		return "$left$mid$right";
	}

	# default: chop on the right
	$str =~ m/^($endre)(.*)$/;
	my ($body, $tail) = ($1, $2);
	$tail = "... " if length($tail) > 4;
	return "$body$tail";
}
1787
# Takes the same arguments as chop_str() and returns the HTML-escaped
# result.  If the string really was chopped, the result is wrapped in
# a <span> whose title attribute carries the full string (with control
# characters replaced by '?').
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);
	my $full    = to_utf8($str);

	# nothing was cut off: no tooltip needed
	return esc_html($chopped) if $chopped eq $full;

	$full =~ s/[[:cntrl:]]/?/g;
	return $cgi->span({-title=>$full}, esc_html($chopped));
}
1803
# Escape a string for HTML while wrapping selected fragments in
# <span class="$css_class">.  Fragments are given as array references
# [ $begin, $end ] and are assumed not to overlap; any other trailing
# arguments are collected as options and handed on to esc_html().
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
	my ($str, $css_class, @args) = @_;

	# separate the region pairs from the esc_html() options
	my (@regions, @opt_list);
	foreach my $arg (@args) {
		if (ref($arg) eq 'ARRAY') {
			push @regions, $arg;
		} else {
			push @opt_list, $arg;
		}
	}
	my %opts = @opt_list;

	return esc_html($str, %opts) unless @regions;

	my $out = '';
	my $pos = 0;

	foreach my $region (@regions) {
		my ($begin, $end) = @$region;

		# Don't create empty <span> elements.
		next if $end <= $begin;

		# plain text between the previous region and this one
		if ($begin > $pos) {
			$out .= esc_html(substr($str, $pos, $begin - $pos), %opts);
		}

		my $marked = esc_html(substr($str, $begin, $end - $begin), %opts);
		$out .= $cgi->span({-class => $css_class}, $marked);

		$pos = $end;
	}

	# whatever follows the last region
	if ($pos < length($str)) {
		$out .= esc_html(substr($str, $pos), %opts);
	}

	return $out;
}
1839
# Find every match of $regexp in $str and return a list of
# [ $begin, $end ] pairs (offsets of the start of each match and of
# the position just after it).  Returns an empty list if either
# argument is undefined or nothing matches.
sub matchpos_list {
	my ($str, $regexp) = @_;

	return if !defined $str || !defined $regexp;

	my @spans;
	push @spans, [ $-[0], $+[0] ] while $str =~ /$regexp/g;

	return @spans;
}
1851
# Escape $str for HTML and wrap every match of $regexp in
# <span class="match">.  Without a regexp, or without any match, this
# is plain esc_html().
sub esc_html_match_hl {
	my ($str, $regexp) = @_;

	return esc_html($str) unless defined $regexp;

	my @found = matchpos_list($str, $regexp);

	return @found
		? esc_html_hl_regions($str, 'match', @found)
		: esc_html($str);
}
1862
1863
# Like esc_html_match_hl(), but for a string that is displayed in its
# shortened form $chopped (as produced by chop_str with the "... "
# tail).  Matches are located in the full string $str and then mapped
# onto the shortened one: matches inside the kept part are marked as
# they are, a match that reaches into the removed part is extended
# over the tail, and a match lying entirely in the removed part marks
# the tail itself.  Without $chopped this is esc_html_match_hl().
sub esc_html_match_hl_chopped {
	my ($str, $chopped, $regexp) = @_;

	return esc_html_match_hl($str, $regexp) unless defined $chopped;

	my @matches = matchpos_list($str, $regexp);
	return esc_html($chopped) unless @matches;

	# split the shortened string into kept text and the tail marker
	my $ellipsis = "... "; # see chop_str
	my $tail     = ($chopped =~ s/\Q$ellipsis\E$//) ? $ellipsis : '';
	my $chop_len = length($chopped);
	my $tail_len = length($tail);
	my $mark_end = $chop_len + $tail_len;

	# filter matches so that we mark chopped string
	my @filtered;
	MATCH:
	foreach my $m (@matches) {
		my ($begin, $end) = @$m;

		if ($begin > $chop_len) {
			# match is entirely in the removed part
			push @filtered, [ $chop_len, $mark_end ] if ($tail_len > 0);
			last MATCH;
		}
		if ($end > $chop_len) {
			# match starts in the kept part and runs into the removed one
			push @filtered, [ $begin, $mark_end ];
			last MATCH;
		}

		push @filtered, $m;
	}

	return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
}
1894
1895## ----------------------------------------------------------------------
1896## functions returning short strings
1897
# Map an age (in seconds) to a CSS class name:
#   undefined          -> "noage"
#   less than 2 hours  -> "age0"
#   less than 2 days   -> "age1"
#   anything older     -> "age2"
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if $age < 60*60*2;
	return "age1"  if $age < 60*60*24*2;
	return "age2";
}
1912
# Convert an age in seconds to an "nn units ago" string.
# The largest unit of which the age spans more than two is used
# (years, months, weeks, days, hours, min, sec); an age of two seconds
# or less gives " right now" (with a leading space).
sub age_string {
	my ($age) = @_;

	return int($age/60/60/24/365) . " years ago"
		if $age > 60*60*24*365*2;
	return int($age/60/60/24/(365/12)) . " months ago"
		if $age > 60*60*24*(365/12)*2;
	return int($age/60/60/24/7) . " weeks ago"
		if $age > 60*60*24*7*2;
	return int($age/60/60/24) . " days ago"
		if $age > 60*60*24*2;
	return int($age/60/60) . " hours ago"
		if $age > 60*60*2;
	return int($age/60) . " min ago"
		if $age > 60*2;
	return int($age) . " sec ago"
		if $age > 2;

	return " right now";
}
1944
# File type bits used in addition to the ones Fcntl exports.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# True if $mode has the file type of a gitlink, i.e. a
# submodule/subproject entry (a commit object reference).
sub S_ISGITLINK {
	my ($mode) = @_;

	my $type_bits = $mode & S_IFMT();

	return ($type_bits == S_IFGITLINK);
}
1956
# Convert a file mode, given as an octal string, to a symbolic mode
# string in the style of "ls -l".  Only the file type and, for regular
# files, the owner's executable bit are taken into account; unknown
# types give '----------'.
sub mode_str {
	my $mode = oct shift;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# git cares only about the executable bit
	return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1978
# Convert a file mode, given as an octal string, to a file type name:
# "submodule", "directory", "symlink", "file" or "unknown".
# An argument that is not a string of octal digits is returned as is.
sub file_type {
	my ($mode) = @_;

	return $mode if $mode !~ m/^[0-7]+$/;

	my $bits = oct $mode;

	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT);
	return "symlink"   if S_ISLNK($bits);
	return "file"      if S_ISREG($bits);
	return "unknown";
}
2001
# Convert a file mode, given as an octal string, to a file type
# description.  Like file_type(), except that a regular file with the
# owner's executable bit set is described as "executable".
# An argument that is not a string of octal digits is returned as is.
sub file_type_long {
	my ($mode) = @_;

	return $mode if $mode !~ m/^[0-7]+$/;

	my $bits = oct $mode;

	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT);
	return "symlink"   if S_ISLNK($bits);
	return "unknown"   unless S_ISREG($bits);

	return ($bits & S_IXUSR) ? "executable" : "file";
}
2028
2029
2030## ----------------------------------------------------------------------
2031## functions returning short HTML fragments, or transforming HTML fragments
2032## which don't belong to other sections
2033
# Format one line of a commit message for HTML output.
# The line is escaped with esc_html() (spaces become &nbsp;), and
# everything that looks like "git describe" output or an abbreviated
# or full SHA-1 is turned into a link to the "object" action.
sub format_log_line_html {
	my ($line) = @_;

	# wrap one matched identifier in a link to the object it names
	my $link_to_object = sub {
		my ($id) = @_;
		return $cgi->a({-href => href(action=>"object", hash=>$id),
		                -class => "text"}, $id);
	};

	my $html = esc_html($line, -nbsp=>1);
	$html =~ s{
        \b
        (
            # The output of "git describe", e.g. v2.10.0-297-gf6727b0
            # or hadoop-20160921-113441-20-g094fb7d
            (?<!-) # see strbuf_check_tag_ref(). Tags can't start with -
            [A-Za-z0-9.-]+
            (?!\.) # refs can't end with ".", see check_refname_format()
            -g[0-9a-fA-F]{7,40}
            |
            # Just a normal looking Git SHA1
            [0-9a-fA-F]{7,40}
        )
        \b
    }{
		$link_to_object->($1);
	}egx;

	return $html;
}
2060
# Format the markers of the refs pointing to a given object.
#
# $refs maps object ids to lists of ref names (e.g. "tags/v2.6.11",
# "heads/next"; a trailing "^{}" marks an indirect ref) and $id
# selects the object.  Each ref becomes a linked <span>; all of them
# are wrapped in <span class="refs">.  Returns "" if there is nothing
# to show.
#
# The destination action is chosen based on object type and context:
# - for annotated tags, we choose the tag view unless it's the current
#   view already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history,
#   shortlog or log view, and select shortlog otherwise
#
# Note: the "^{}" suffix is stripped from the entries of $refs->{$id}
# in place.
sub format_ref_marker {
	my ($refs, $id) = @_;

	return "" unless defined $refs->{$id};

	my @spans;
	foreach my $ref (@{$refs->{$id}}) {
		# this code exploits the fact that non-lightweight tags are the
		# only indirect objects, and that they are the only objects for which
		# we want to use tag instead of shortlog as action
		my $indirect = ($ref =~ s/\^\{\}$//);

		# e.g. tags/v2.6.11 or heads/next
		my ($type, $name) = ($ref =~ m!^(.*?)s?/(.*)$!)
			? ($1, $2)
			: ("ref", $ref);

		my $class = $indirect ? "$type indirect" : $type;

		my $dest_action = "shortlog";
		if ($indirect) {
			$dest_action = "tag" unless $action eq "tag";
		} elsif ($action =~ /^(history|(short)?log)$/) {
			$dest_action = $action;
		}

		# link target is always a full ref name
		my $dest = ($ref =~ m!^refs/!) ? $ref : "refs/" . $ref;

		my $link = $cgi->a({
			-href => href(
				action=>$dest_action,
				hash=>$dest
			)}, esc_html($name));

		push @spans,
			" <span class=\"" . esc_attr($class) . "\" title=\"" . esc_attr($ref) . "\">" .
			$link . "</span>";
	}

	my $markers = join('', @spans);

	return $markers ? ' <span class="refs">'. $markers . '</span>' : "";
}
2120
# Format a title line as a link.
#   $long   full subject
#   $short  possibly shortened subject
#   $href   link target
#   $extra  optional HTML appended after the link (e.g. ref markers)
# When $short is shorter than $long, the short form is displayed and
# the full subject (with control characters replaced by '?') goes
# into the link's title attribute.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr = (-href => $href, -class => "list subject");
	my $shown = $long;

	if (length($short) < length($long)) {
		(my $title = $long) =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($title);
		$shown = $short;
	}

	return $cgi->a(\%attr, esc_html($shown)) . $extra;
}
2136
# Avatar URLs are cached per email address instead of being recomputed
# on every use.  This gives a visible benefit in views where the avatar
# for the same email appears repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines, which are free to use it
# as they prefer.  Since only one avatar engine is used for any given
# page, there's no risk of cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search
# service over at http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first; the result is cached in %avatar_cache.
sub picon_url {
	my $email = lc shift;

	return $avatar_cache{$email} if $avatar_cache{$email};

	my ($user, $domain) = split('@', $email);
	my $url = join('/',
		"//www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi",
		$domain,
		$user,
		"users+domains+unknown/up/single");

	return $avatar_cache{$email} = $url;
}
2158
# Compute the gravatar url for a given email and size.
# Only the part of the URL before the size is stored in %avatar_cache,
# since that's the computationally more expensive one (an MD5 digest
# of the lowercased email).  This also allows the cache entry to be
# reused for different sizes (for this particular engine).
sub gravatar_url {
	my ($email, $size) = @_;
	$email = lc $email;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"//www.gravatar.com/avatar/" .
			Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
2171
# Return an <img> element with the avatar for $email, or "" when no
# avatar provider is active.
# Options:
#   -size       => key into %avatar_size (falls back to 'default')
#   -pad_before => true to put '&nbsp;' in front of the image
#   -pad_after  => true to put '&nbsp;' after the image
sub git_get_avatar {
	my ($email, %opts) = @_;

	my $size_name = $opts{-size} || 'default';
	my $size = $avatar_size{$size_name} || $avatar_size{'default'};

	# Other providers can be added by extending this chain, defining the
	# url as needed. If no variant produces a url, we assume avatars
	# are completely disabled/unavailable.
	my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
	        : $git_avatar eq 'picon'    ? picon_url($email)
	        :                             "";

	return "" unless $url;

	my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
	my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

	return $pre_white .
	       sprintf('<img width="%s" class="avatar" src="%s" alt="" />',
	               $size, esc_url($url)) .
	       $post_white;
}
2200
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype ('author' or 'committer') selects the kind of search and
# the wording of the link's title.  When the 'search' feature is
# disabled, $displaytext is returned unchanged.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	my $have_search = gitweb_check_feature('search');
	return $displaytext unless $have_search;

	my $performed = $searchtype eq 'author'    ? "authored"
	              : $searchtype eq 'committer' ? "committed"
	              :                              "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype), class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
2223
# Format the author of commit $co inside an element named $tag (with
# class "author").  The name is preceded by the author's avatar and
# made an author-search link; it is chopped and escaped according to
# the remaining optional arguments (see chop_str).
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar    = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $linked    = format_search_author($co->{'author_name'}, "author",
	                                     $avatar . $name_html);

	return "<$tag class=\"author\">" . $linked . "</$tag>";
}
2237
# Format the git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names at the end of $line are replaced by escaped names
# taken from $from->{'file'} / $to->{'file'}, linked when the
# corresponding 'href' is set.  A combined diff ($diffinfo->{'nparents'}
# is true) shows only the resulting file; an ordinary diff shows
# "a/<from> b/<to>".  The result is wrapped in <div class="diff header">.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# escaped path with optional a/ or b/ prefix, linked if an href exists
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = $prefix . esc_path($side->{'file'});
		return $text unless $side->{'href'};
		return $cgi->a({-href => $side->{'href'}, -class => "path"}, $text);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff; no href means the file was deleted
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff; no href on a side means the file was
		# added (from) or deleted (to)
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2273
# Format one extended diff header line (the lines between the
# "diff ..." line and the patch itself):
# - "copy/rename from/to <path>": the path is replaced by a link when
#   the corresponding href is set (and dropped otherwise)
# - lines ending in a six-digit mode get the file type appended
# - "index <hash>..." lines get abbreviated (7 character), linked
#   hashes; a side without href is shown as seven zeros
# The returned line ends with "<br/>\n".
sub format_extended_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
		                 esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                 esc_path($to->{'file'}));
	}

	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}

	# match <hash>
	my $no_hash = '0' x 7;
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff: one hash per parent
		my @parent_links = map {
			$from->{'href'}[$_]
				? $cgi->a({-href=>$from->{'href'}[$_],
				           -class=>"hash"},
				          substr($diffinfo->{'from_id'}[$_],0,7))
				: $no_hash
		} 0 .. $diffinfo->{'nparents'} - 1;

		my $to_link = $to->{'href'}
			? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			          substr($diffinfo->{'to_id'},0,7))
			: $no_hash;

		$line = 'index ' . join(',', @parent_links) . '..' . $to_link;

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});

		my $from_link = $from->{'href'}
			? $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			          substr($from_id,0,7))
			: $no_hash;
		my $to_link = $to->{'href'}
			? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			          substr($to_id,0,7))
			: $no_hash;

		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2339
# Build the HTML for the from-file ("---") and to-file ("+++") header
# lines of a patch.
#
# Parameters:
#   $from_line, $to_line - the raw "--- ..." and "+++ ..." lines
#   $diffinfo            - hashref; 'nparents', 'from_id', 'to_id' are read
#   $from, $to           - hashrefs; 'href' and 'file' are read
#   @parents             - used as hash_parent_base in combined diff links
#
# For a combined diff (true 'nparents') one from-file row is emitted per
# parent; otherwise a single row.  Lines naming /dev/null are passed
# through without extra formatting.  Returns the concatenated <div> rows.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my @rows;

	#assert($from_line =~ m/^---/) if DEBUG;
	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit)
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $text = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				my $parent_no = $i + 1;
				my $blobdiff_link = $cgi->a(
					{-href=>href(action=>"blobdiff",
					             hash_parent=>$diffinfo->{'from_id'}[$i],
					             hash_parent_base=>$parents[$i],
					             file_parent=>$from->{'file'}[$i],
					             hash=>$diffinfo->{'to_id'},
					             hash_base=>$hash,
					             file_name=>$to->{'file'}),
					 -class=>"path",
					 -title=>"diff" . $parent_no},
					$parent_no);
				my $file_link = $cgi->a(
					{-href=>$from->{'href'}[$i], -class=>"path"},
					esc_path($from->{'file'}[$i]));
				$text = '--- ' . $blobdiff_link . '/' . $file_link;
			}
			push @rows, qq!<div class="diff from_file">$text</div>\n!;
		}
	} else {
		# ordinary (single parent) diff
		my $text = $from_line;
		if ($text =~ m!^--- "?a/!) {
			my $name = esc_path($from->{'file'});
			$name = $cgi->a({-href=>$from->{'href'}, -class=>"path"}, $name)
				if $from->{'href'};
			$text = '--- a/' . $name;
		}
		push @rows, qq!<div class="diff from_file">$text</div>\n!;
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	my $to_text = $to_line;
	if ($to_text =~ m!^\+\+\+ "?b/!) {
		my $name = esc_path($to->{'file'});
		$name = $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $name)
			if $to->{'href'};
		$to_text = '+++ b/' . $name;
	}
	push @rows, qq!<div class="diff to_file">$to_text</div>\n!;

	return join('', @rows);
}
2405
# Produce the "Simple merge" note shown in place of a patch that the
# combined diff simplified away: a "diff --cc <file>" header row followed
# by a "nodifferences" row.  The file name links to the blob view unless
# is_deleted() reports the entry as deleted.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $file;
	if (is_deleted($diffinfo)) {
		$file = esc_path($diffinfo->{'to_file'});
	} else {
		$file = $cgi->a({-href => href(action=>"blob",
		                               hash_base=>$hash,
		                               hash=>$diffinfo->{'to_id'},
		                               file_name=>$diffinfo->{'to_file'}),
		                 -class => "path"},
		                esc_path($diffinfo->{'to_file'}));
	}

	return join('',
		"<div class=\"diff header\">",
		"diff --cc ",
		$file,
		"</div>\n", # class="diff header"
		"<div class=\"diff nodifferences\">",
		"Simple merge",
		"</div>\n"); # class="diff nodifferences"
}
2430
# Return the CSS class name for a patch line: "chunk_header",
# "incomplete", "ctx", "add" or "rem"; "" when nothing matches.
#
# The number of sign columns is 1 for an ordinary diff.  When $from and
# $to are both given and $from->{'href'} is an array reference (combined
# diff) it is the number of elements in that array.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
		? scalar @{$from->{'href'}}
		: 1;

	return "chunk_header" if ($line =~ m/^\@\@{$num_sign} /);
	return "incomplete"   if ($line =~ m/^\\/);
	# context must be tested before add/rem, or we would have to use a
	# more complicated regexp, for example
	# qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
	return "ctx"          if ($line =~ m/^ {$num_sign}/);
	return "add"          if ($line =~ m/^[+ ]{$num_sign}/);
	return "rem"          if ($line =~ m/^[- ]{$num_sign}/);

	# fallback
	return "";
}
2459
# Format a unified diff chunk header ("@@ -a,b +c,d @@ section") as HTML.
# The from/to ranges become links to the starting line ("#l<start>")
# whenever the corresponding 'href' is set; the trailing section text is
# escaped.  $from and $to must be defined and filled in by the caller,
# and $line must hold a unified diff chunk header.
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# the line counts are captured by the pattern but not needed here
	my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	$from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
	                      -class=>"list"}, $from_text)
		if ($from->{'href'});
	$to_text = $cgi->a({-href=>"$to->{'href'}#l$to_start",
	                    -class=>"list"}, $to_text)
		if ($to->{'href'});

	return "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
	       "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2483
# Format a combined diff chunk header ("@@@ -a,b -c,d +e,f @@@ section")
# as HTML.  Every range but the last belongs to a parent and is linked
# through $from->{'href'}[$i]; the last range is the result and is linked
# through $to->{'href'}.  Ranges without an href are emitted as plain
# text.  $from and $to must be defined and filled in by the caller.
sub format_cc_diff_chunk_header {
	my ($line, $from, $to) = @_;

	my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

	my @range_text = split(' ', $ranges);
	# start line of each range: drop the sign, keep what precedes the
	# comma; the trailing 0 is what gets used if split() yields nothing
	my @range_start = map {
		my ($start) = (split(',', substr($_, 1)), 0);
		$start;
	} @range_text;

	# the last range describes the result, the others the parents
	my $to_text  = pop @range_text;
	my $to_start = pop @range_start;

	my @cells;
	foreach my $i (0 .. $#range_text) {
		if ($from->{'href'}[$i]) {
			push @cells, $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
			                      -class=>"list"}, $range_text[$i]);
		} else {
			push @cells, $range_text[$i];
		}
	}
	if ($to->{'href'}) {
		push @cells, $cgi->a({-href=>"$to->{'href'}#l$to_start",
		                      -class=>"list"}, $to_text);
	} else {
		push @cells, $to_text;
	}

	return "<span class=\"chunk_info\">$prefix " .
	       join(" ", @cells) .
	       " $prefix</span>" .
	       "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2522
# Turn one patch line (not a diff header line) into a
# <div class="diff ..."> element.
#
# A scalar reference in $line is taken as ready-made HTML and is not
# escaped.  A plain string is chomped and untabified; chunk headers are
# then formatted specially when both $from and $to are given, and every
# other line goes through esc_html().  $diff_class, if true, is added to
# the element's class list.
sub format_diff_line {
	my ($line, $diff_class, $from, $to) = @_;

	my $html;
	if (ref($line)) {
		$html = $$line;
	} else {
		chomp $line;
		$line = untabify($line);

		my $have_both = ($from && $to);
		if ($have_both && $line =~ m/^\@{2} /) {
			$html = format_unidiff_chunk_header($line, $from, $to);
		} elsif ($have_both && $line =~ m/^\@{3}/) {
			$html = format_cc_diff_chunk_header($line, $from, $to);
		} else {
			$html = esc_html($line, -nbsp=>1);
		}
	}

	my $diff_classes = $diff_class ? "diff $diff_class" : "diff";

	return "<div class=\"$diff_classes\">$html</div>\n";
}
2551
# Build the snapshot link(s) for the tree/commit whose hash is given.
#
# Depending on how many entries @snapshot_fmts has, returns:
#   0   - undef
#   1   - a single "_snapshot_" link whose tooltip names the format
#   > 1 - "snapshot (_tar.gz_ _zip_)", one link per format display name
sub format_snapshot_links {
	my ($hash) = @_;
	my $num_fmts = @snapshot_fmts;

	return undef if ($num_fmts == 0);

	if ($num_fmts == 1) {
		my $fmt = $snapshot_fmts[0];
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
			}, "snapshot");
	}

	# several formats: a parenthesized list of links bearing format names
	my @links;
	foreach my $fmt (@snapshot_fmts) {
		push @links,
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				)
			}, $known_snapshot_formats{$fmt}{'display'});
	}
	return "snapshot (" . join(' ', @links) . ")";
}
2586
2587## ......................................................................
2588## functions returning values to be passed, perhaps after some
2589## transformation, to other functions; e.g. returning arguments to href()
2590
# Return a hash of parameters to pass to href() for a feed link of the
# current view; the -title key holds a description of the link.
#
# $format defaults to 'Atom'; its lowercased form becomes the action.
# Returns nothing when no project is selected, when there is no action,
# or for the tags/heads/forks/tag/search actions.
sub get_feed_info {
	my ($format) = @_;
	$format ||= 'Atom';

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branch refs carry the full 'refs/<branch ref>/' prefix, which sets
	# them apart from tag links and lets us detect a branch here;
	# $hash_base is tried before $hash for every ref
	my ($branch, $matched_ref);
 REF:
	foreach my $ref (get_branch_refs()) {
		foreach my $candidate ($hash_base, $hash) {
			next unless defined $candidate;
			if ($candidate =~ m!^refs/\Q$ref\E/(.*)$!) {
				$branch = $1;
				$matched_ref = $ref;
				last REF;
			}
		}
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} elsif (defined $branch) {
		$type = "log of $branch";
	} else {
		$type = 'log';
	}

	my %res = (
		action      => lc($format),
		-title      => $type,
		'hash'      => (defined $branch ? "refs/$matched_ref/$branch" : undef),
		'file_name' => $file_name,
	);

	return %res;
}
2632
2633## ----------------------------------------------------------------------
2634## git utility subroutines, invoking git commands
2635
# Return the leading part of a git command line as a list: the git
# executable ($GIT) and the --git-dir option for the current $git_dir.
# Every call is counted in $number_of_git_cmds.
sub git_cmd {
	$number_of_git_cmds += 1;
	return ($GIT, "--git-dir=$git_dir");
}
2641
# Quote the given arguments so they can be passed to the shell as a
# single command string:
#   quote_command("command", "arg 1", "arg with ' and ! characters")
#   => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Each argument is wrapped in single quotes; embedded ' and ! are closed
# out, backslash-escaped and reopened.
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $word (@_) {
		(my $escaped = $word) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$escaped'";
	}
	return join(' ', @quoted);
}
2650
# Resolve HEAD of the given project via git_get_full_hash().
sub git_get_head_hash {
	my ($project) = @_;
	return git_get_full_hash($project, 'HEAD');
}
2655
# Resolve a revision of a project; all arguments are handed to
# git_get_hash() as given.
sub git_get_full_hash {
	my ($project, $hash, @options) = @_;
	return git_get_hash($project, $hash, @options);
}
2659
# Like git_get_full_hash(), but appends the '--short=7' option to the
# argument list handed to git_get_hash().
sub git_get_short_hash {
	my @args = (@_, '--short=7');
	return git_get_hash(@args);
}
2663
# Run "git rev-parse --verify -q <options> <hash>" in the repository
# "$projectroot/$project" and return the first output line, chomped.
# Returns undef if the command cannot be started or prints nothing.
#
# $git_dir is pointed at the project for the duration of the call and
# put back afterwards, but only if it was defined on entry.
sub git_get_hash {
	my ($project, $hash, @options) = @_;
	my $saved_git_dir = $git_dir;
	my $result;

	$git_dir = "$projectroot/$project";
	my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
	if (open my $fd, '-|', @cmd) {
		$result = <$fd>;
		chomp $result if defined $result;
		close $fd;
	}
	$git_dir = $saved_git_dir if (defined $saved_git_dir);

	return $result;
}
2680
# Return the first line printed by "git cat-file -t <hash>", chomped.
# Returns nothing if the command cannot be started or if closing the
# pipe fails.
sub git_get_type {
	my ($hash) = @_;

	my $fd;
	unless (open $fd, "-|", git_cmd(), "cat-file", '-t', $hash) {
		return;
	}
	my $type = <$fd>;
	unless (close $fd) {
		return;
	}
	chomp $type;
	return $type;
}
2691
# repository configuration cache:
# %config holds the parsed 'gitweb' section of the repository config,
# $config_file is compared with "$git_dir/config" to decide whether
# %config has to be (re)loaded (see git_get_project_config)
our %config;
our $config_file = '';
2695
# Add $value under $key in the hash referenced by $hash.
# The first value for a key is stored directly; a second value turns the
# entry into an anonymous array [ <old>, <new> ]; further values are
# pushed onto that array.
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (!exists $hash->{$key}) {
		$hash->{$key} = $value;
	} elsif (ref $hash->{$key}) {
		push @{$hash->{$key}}, $value;
	} else {
		$hash->{$key} = [ $hash->{$key}, $value ];
	}
}
2709
# Return a hash of the git configuration of the current repository, as
# printed by "git config -z -l".
#
# $section_regexp, if defined, limits the result to keys of matching
# sections, e.g. 'gitweb' keeps only "gitweb.*" keys.  Keys occurring
# more than once are collected by hash_set_multi().
# Returns nothing if the git command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compile the section filter once per call.  The /o modifier is
	# deliberately not used: it would freeze the pattern built from the
	# first $section_regexp ever seen and silently ignore later ones.
	my $key_filter = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	# "git config -z" terminates every entry with NUL
	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# with -z the key and its value are separated by a newline;
		# a key without a value has no newline and yields undef $value
		my ($key, $value) = split(/\n/, $keyval, 2);
		next unless defined $key;
		next if (defined $key_filter && $key !~ $key_filter);

		hash_set_multi(\%config, $key, $value);
	}
	close $fh;

	return %config;
}
2732
# Interpret a config value as a boolean and return a Perl true or false
# value (the caller maps it to 'true'/'false' where needed).
# True are: no value at all (undef), a nonzero number, 'true' and 'yes'
# in any letter case.  Everything else is false, never an error.
sub config_to_bool {
	my ($val) = @_;

	# section.key (key present without a value)
	return 1 unless (defined $val);

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	# section.key = 1
	return $val if ($val =~ /^\d+$/ && $val);
	# section.key = true
	return $val =~ /^(?:true|yes)$/i;
}
2748
# Convert a config value to a plain decimal number.
# A trailing 'k', 'm' or 'g' (any letter case) multiplies the digits
# before it by 1024, 1048576 or 1073741824.  Any other value is returned
# as is, with surrounding whitespace removed.
sub config_to_int {
	my ($val) = @_;

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	return $val unless ($val =~ /^([0-9]*)([kmg])$/i);

	my ($num, $unit) = ($1, lc($2));
	my %multiplier = (
		'k' =>       1024,
		'm' =>    1048576,
		'g' => 1073741824,
	);
	return $num * $multiplier{$unit};
}
2768
# Normalize a config value to an array reference: a reference is
# returned unchanged, a defined scalar is wrapped as [ <value> ], and
# undef becomes an empty array reference.
sub config_to_multi {
	my ($val) = @_;

	return $val if (ref($val));
	return []   unless (defined($val));
	return [ $val ];
}
2775
# Look up gitweb.<key> in the configuration of the current repository.
#
# Parameters:
#   $key  - variable name, with or without the "gitweb." prefix
#   $type - optional 'bool' or 'int' (a leading "--" is accepted);
#           any other type is ignored
#
# Returns nothing if $git_dir is undefined, if the key is empty or
# contains characters other than word characters, or if the variable is
# not set.  Otherwise returns the stored value, converted to
# 'true'/'false' for 'bool' or through config_to_int() for 'int'.
#
# The parsed 'gitweb' section is cached in %config; $config_file records
# which repository it was read for.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless (defined $git_dir);

	# key sanity check
	return unless ($key);
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
		my ($section, $subsection, $name) = ($1, $2, $3);
		$name =~ s/_//g;
		$key = join(".", lc($section), $subsection, lc($name));
		return if ($name =~ /\W/ || $section =~ /\W/);
	} else {
		$key = lc($key);
		$key =~ s/_//g;
		return if ($key =~ /\W/);
	}
	$key =~ s/^gitweb\.//;

	# type sanity check
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			unless ($type eq 'bool' || $type eq 'int');
	}

	# (re)load the config unless the cache belongs to this repository
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $full_key = "gitweb.$key";
	return unless (exists $config{$full_key});

	# ensure given type
	my $value = $config{$full_key};
	return $value unless (defined $type);
	if ($type eq 'bool') {
		# backward compatibility: 'git config --bool' returns true/false
		return config_to_bool($value) ? 'true' : 'false';
	}
	if ($type eq 'int') {
		return config_to_int($value);
	}
	return $value;
}
2824
# Return the object hash of the entry $path in the tree-ish $base, using
# the first line printed by "git ls-tree <base> -- <path>".
#
# Parameters:
#   $base - tree-ish to look in
#   $path - path of the entry; trailing slashes are removed
#   $type - optional; if given, the entry's type field must equal it
#
# Returns undef if $path is false, if closing the pipe fails, if git
# prints nothing, if the line cannot be parsed, or if the type does not
# match.  Calls die_error(500, ...) when git cannot be started.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift || return undef;
	my $type = shift;

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# Take the captures from the match itself: after a failed match
	# $2 and $3 would still hold values from an earlier successful one.
	my ($entry_type, $entry_hash) =
		$line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/
		or return undef;
	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2851
# Return the path of the first entry with object id $hash found in the
# recursive listing ("git ls-tree -r -t -z") of tree-ish $base.
# Used to get 'from' filename for combined diff (merge commit) for renames.
#
# Returns nothing if $base or $hash is false, undef if git cannot be
# started or no entry has that id.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# -z output: entries are NUL-terminated and paths are not quoted
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
		# $hash is quoted so it is matched literally, and /s lets the
		# path capture span newlines, which -z output may contain
		if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
			close $fd;
			return $1;
		}
	}
	close $fd;
	return undef;
}
2875
2876## ......................................................................
2877## git utility functions, directly accessing git repository
2878
# Get the value of a per-repository setting, either from the file named
# $name in the repository directory ($GIT_DIR/$name, first line only,
# chomped) or, if that file cannot be opened, from the gitweb.$name
# variable of the repository config.
# Sets $git_dir to "$projectroot/$path".
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/$name") {
		return git_get_project_config($name);
	}
	my $conf = <$fd>;
	close $fd;

	chomp $conf if (defined $conf);
	return $conf;
}
2895
# Return the 'description' setting of the project at $path, as found by
# git_get_file_or_project_config().
sub git_get_project_description {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'description');
}
2900
# Return the 'category' setting of the project at $path, as found by
# git_get_file_or_project_config().
sub git_get_project_category {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'category');
}
2905
2906
# Return a hash reference mapping content tags ('ctags') of a project to
# their weights.  Sets $git_dir to "$projectroot/$project".
#
# supported formats (the first one that can be opened is used):
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if the first line of its contents is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		closedir $dh;

		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			# undef for an empty file
			my $val = <$ct>;
			close $ct;
			chomp $val if defined $val;

			# the tag name is the file name without its directory
			(my $ctag = $tagfile) =~ s#.*/##;
			if (defined $val && $val =~ /^\d+$/) {
				$ctags->{$ctag} = $val;
			} else {
				$ctags->{$ctag} = 1;
			}
		}

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2953
# Sum up content tag ('ctags') weights over a list of projects.
# $projects is a reference to an array of project hashes; the result is
# a hash reference whose keys are tags and whose values are the sums of
# that tag's weight in every project's 'ctags' hash.
sub git_gather_all_ctags {
	my ($projects) = @_;
	my %total;

	foreach my $proj (@$projects) {
		$total{$_} += $proj->{'ctags'}->{$_}
			for (keys %{$proj->{'ctags'}});
	}

	return \%total;
}
2968
# Turn a hash reference of tag weights into a tag cloud.
#
# Tags differing only in letter case are merged; the spelling with the
# largest weight is the one displayed.  The tag equal to the 'ctag'
# input parameter is wrapped in <span class="match">.
#
# Returns an HTML::TagCloud object if that module can be loaded,
# otherwise a hash reference { <lowercased tag> => { count, ctag } }
# where 'ctag' is the tag's link.
sub git_populate_project_tagcloud {
	my ($ctags) = @_;

	# First, merge different-cased tags; tags vote on casing
	my %merged;
	foreach my $tag (keys %$ctags) {
		my $weight = $ctags->{$tag};
		my $entry  = ($merged{lc $tag} ||= {});
		$entry->{count} += $weight;
		unless ($entry->{topcount} && $entry->{topcount} >= $weight) {
			$entry->{topcount} = $weight;
			$entry->{topname}  = $tag;
		}
	}

	my $matched = $input_params{'ctag'};
	# highlight the currently selected tag
	my $mark_match = sub {
		my ($ctag, $title) = @_;
		return $title unless (defined $matched && $matched eq $ctag);
		return qq(<span class="match">$title</span>);
	};

	my $cloud;
	if (eval { require HTML::TagCloud; 1; }) {
		$cloud = HTML::TagCloud->new;
		foreach my $ctag (sort keys %merged) {
			# Pad the title with spaces so that the cloud looks
			# less crammed.
			my $title = esc_html($merged{$ctag}->{topname});
			$title =~ s/ /&nbsp;/g;
			$title =~ s/^/&nbsp;/g;
			$title =~ s/$/&nbsp;/g;
			$title = $mark_match->($ctag, $title);
			$cloud->add($title, href(project=>undef, ctag=>$ctag),
			            $merged{$ctag}->{count});
		}
	} else {
		$cloud = {};
		foreach my $ctag (keys %merged) {
			my $title = esc_html($merged{$ctag}->{topname}, -nbsp=>1);
			$title = $mark_match->($ctag, $title);
			$cloud->{$ctag} = {
				count => $merged{$ctag}->{count},
				ctag  => $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title),
			};
		}
	}
	return $cloud;
}
3014
# Render a tag cloud built by git_populate_project_tagcloud() as HTML,
# showing at most $count tags.
#
# An HTML::TagCloud object renders itself.  The plain hash fallback is
# rendered as a comma separated list of tag links ordered by increasing
# count; when there are more than $count tags, the ones with the highest
# counts are the ones kept.
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;
	if (ref $cloud eq 'HTML::TagCloud') {
		return $cloud->html_and_css($count);
	}

	# least used tags first
	my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
	# Over the limit: drop tags from the front of the list, i.e. the
	# least used ones, so that the most used tags are the ones shown.
	splice(@tags, 0, @tags - $count) if (@tags > $count);

	return
		'<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
		join (', ', map {
			$cloud->{$_}->{'ctag'}
		} @tags) .
		'</div>';
}
3029
# Return the URLs of the project at $path: the lines of the 'cloneurl'
# file in the repository directory or, if that file cannot be opened,
# the values of the gitweb.url config variable.
# In list context the URLs are returned as a list, otherwise as an array
# reference.  Sets $git_dir to "$projectroot/$path".
sub git_get_project_url_list {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/cloneurl") {
		return wantarray ?
		@{ config_to_multi(git_get_project_config('url')) } :
		   config_to_multi(git_get_project_config('url'));
	}
	my @git_project_url_list = <$fd>;
	close $fd;
	chomp @git_project_url_list;

	return wantarray ? @git_project_url_list : \@git_project_url_list;
}
3043
# Collect the projects that gitweb may show.
#
# $projects_list is either a directory, which is scanned with File::Find, or
# a plain index file with one "<url-encoded path> <url-encoded owner>" entry
# per line.
#
# Parameters:
#   $filter   - optional path prefix; only projects under "$filter/" are kept
#   $paranoid - directory mode only: when true the whole tree is scanned and
#               $filter is applied to every path, instead of starting the
#               scan inside "$dir/$filter"
#
# Returns a list of hashrefs, each with a 'path' key and, when the index file
# names one, an 'owner' key.  Only paths accepted by check_export_ok() are
# included.  Returns nothing if the index file cannot be opened.
sub git_get_projects_list {
        my $filter = shift || '';
        my $paranoid = shift;
        my @list;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter && !$paranoid) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # need search permission
                                return unless (-x $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # paranoidly only filter here; this is a callback,
                                # not a loop body, so leave it with return
                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
                                        return;
                                }
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path
                                };
                                if ($owner) {
                                        $pr->{'owner'} = to_utf8($owner);
                                }
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
3129
# Separate forks from the projects they were forked from.
#
# A project 'repo.git' whose directory "$projectroot/repo" exists may contain
# forks; any other project whose path lies below 'repo/' is treated as a fork
# of it.  The lookup uses a prefix tree keyed by path component
# (written with help of Tree::Trie module, Perl Artistic License, GPL
# compatible).
#
# Parameter: $projects - arrayref of project hashrefs (each with 'path').
# Returns the list of projects that are not forks.  As a side effect the
# 'forks' field of every project that may contain forks is set to an arrayref
# holding its forks (possibly empty).
sub filter_forks_from_projects_list {
        my $projects = shift;

        # prefix tree of directories; the '' key of a node holds the project
        # that ends at that node
        my %trie;

        foreach my $project (@$projects) {
                my $base = $project->{'path'};
                $base =~ s/\.git$//;             # forks of 'repo.git' are in 'repo/' directory
                next if $base =~ m!/$!           # skip non-bare repositories, e.g. 'repo/.git'
                     || !$base                   # skip '.git' repository: tests, git-instaweb
                     || !(-d "$projectroot/$base"); # containing directory must exist
                $project->{'forks'} = [];        # there can be 0 or more forks of project

                # descend along the path components, creating missing nodes
                my $node = \%trie;
                foreach my $component (split('/', $base)) {
                        $node->{$component} = {}
                                unless exists $node->{$component};
                        $node = $node->{$component};
                }
                # end marker; the first project to reach this node wins
                $node->{''} = $project
                        unless exists $node->{''};
        }

        # a project is a fork if a proper prefix of its path ends at a marker
        my @not_forks;
 CANDIDATE:
        foreach my $candidate (@$projects) {
                my $node = \%trie;
                foreach my $component (split('/', $candidate->{'path'})) {
                        if (exists $node->{''}) {
                                # found [shortest] prefix: record the fork and drop it
                                push @{$node->{''}{'forks'}}, $candidate;
                                next CANDIDATE;
                        }
                        # not in trie, cannot have prefix, not a fork
                        last unless exists $node->{$component};
                        $node = $node->{$component};
                }
                # either left the trie early or ran out of path components
                push @not_forks, $candidate;
        }

        return @not_forks;
}
3189
# Select projects by content tag and/or by search pattern.
#
# Parameters:
#   $projlist - arrayref of project hashrefs
#   %opts     - 'tagfilter'     => tag that must be among the project's ctags
#                                  (compared case-insensitively)
#               'search_regexp' => pattern that must match the project's
#                                  'path' or 'descr_long'
#
# With neither option set the list is returned unchanged.  Otherwise
# fill_project_list_info() is asked to fill the fields needed for matching
# before the projects are tested.
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my ($wanted_tag, $pattern) = @opts{'tagfilter', 'search_regexp'};

        if (!$wanted_tag && !$pattern) {
                return @$projlist;
        }

        # searching projects require filling to be run before it;
        my @needed_fields;
        push @needed_fields, 'ctags'         if $wanted_tag;
        push @needed_fields, 'path', 'descr' if $pattern;
        fill_project_list_info($projlist, @needed_fields);

        my @matches;
        foreach my $candidate (@$projlist) {
                if ($wanted_tag) {
                        my $ctags = $candidate->{'ctags'};
                        next if ref($ctags) ne 'HASH';
                        next if !grep { lc($_) eq lc($wanted_tag) } keys %{$ctags};
                }

                if ($pattern) {
                        next if $candidate->{'path'} !~ /$pattern/ &&
                                $candidate->{'descr_long'} !~ /$pattern/;
                }

                push @matches, $candidate;
        }

        return @matches;
}
3225
# Cache of project owners taken from the $projects_list index file: undef
# until git_get_project_list_from_file() has run, afterwards a hashref that
# maps project path to owner.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list index file.
#
# Does nothing when the cache is already defined.  When $projects_list is not
# a plain file, or cannot be opened, the cache is left as an empty hash.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # -f does not guarantee readability; don't read a closed handle
                open(my $fd, '<', $projects_list) or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # blank line: no project path to store an owner under
                        next unless defined $pr;
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
}
3248
# Find the owner of a project.
#
# Sources are tried in order until one yields a defined value: the owner
# cache built by git_get_project_list_from_file(), the 'owner' project
# config value, and finally get_file_owner() on the repository directory.
#
# Side effect: sets the global $git_dir to "$projectroot/$project".
# Returns undef when $project is false or no source knows the owner.
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # load the owner cache on first use
        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner = exists $gitweb_project_owner->{$project}
                ? $gitweb_project_owner->{$project}
                : undef;
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
3272
# Determine when a project last saw a commit on one of its branch refs.
#
# Side effect: sets the global $git_dir to "$projectroot/$path".
#
# Returns ($age_in_seconds, age_string($age)) taken from the committer line
# of the most recently committed ref; (undef, undef) when that line is
# missing or has no timestamp; nothing when git cannot be started or exits
# unsuccessfully.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   map { "refs/$_" } get_branch_refs ());
        open(my $fd, "-|", @cmd) or return;
        my $newest = <$fd>;
        close $fd or return;

        # committer line ends in "<epoch> <timezone>"
        if (!defined $newest ||
            $newest !~ / (\d+) [-+][01]\d\d\d$/) {
                return (undef, undef);
        }
        my $age = time - $1;
        return ($age, age_string($age));
}
3293
# List the remotes of the current repository with their URLs.
#
# Parameter: $wanted - optional remote name; when given only that remote is
#                      reported.
#
# Returns (as hash or hashref, depending on context) a map from remote name
# to { 'heads' => undef, <key> => <url>, ... } where <key> is the word git
# prints in parentheses after the URL.  Returns nothing when git cannot be
# started or exits unsuccessfully.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find if that
# particular remote is defined is to walk the list provided by 'git remote -v'
# and stop if and when we find what we want.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # "open my $fd" creates the handle even on failure, so the result of
        # open itself has to be tested
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # "<name>\t<url> (<key>)": strip everything after the name;
                # skip lines of another shape instead of reusing old captures
                next unless $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
                my ($url, $key) = ($1, $2);
                next if $wanted and $remote ne $wanted;

                # 'heads' is filled in later by fill_remote_heads()
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3318
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
#
# The heads are fetched with one git_get_heads_list() call for all remotes;
# each remote's 'heads' field is then set to an arrayref of the head entries
# whose name starts with "<remote>/", with that prefix removed from 'name'.
sub fill_remote_heads {
        my $remotes = shift;
        # with no classes git_get_heads_list() would list local branches
        return unless %$remotes;

        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # remote names are literal text, not patterns
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3331
# Map object ids to the refs that point at them, using "git show-ref
# --dereference".
#
# Parameter: $type - optional ref namespace below refs/ (for example
#                    "heads" or "tags"); when empty all refs are listed.
#
# Returns a hashref { <40-hex id> => [ <ref name without "refs/">, ... ] },
# or nothing when git cannot be started or exits unsuccessfully.
sub git_get_references {
        my $type = shift || "";
        my %refs;
        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference",
                ($type ? ("--", "refs/$type") : ()) # use -- <pattern> if $type
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                # $type is a literal namespace name, so quote it in the pattern
                if ($line =~ m!^([0-9a-fA-F]{40})\srefs/(\Q$type\E.*)$!) {
                        push @{$refs{$1}}, $2;
                }
        }
        close $fd or return;
        return \%refs;
}
3354
# Name a revision relative to a tag, using "git name-rev --tags".
#
# Returns the part after "tags/" in git's answer, or undef when $hash is
# false, git printed nothing, or the answer is not tag based (this also
# covers the '$hash undefined' output).
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all leaves $name_rev undefined; $hash is matched
        # literally
        if (defined $name_rev && $name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        }
        return undef;
}
3370
3371## ----------------------------------------------------------------------
3372## parse to hash functions
3373
# Break a timestamp into the date fields gitweb displays.
#
# Parameters:
#   $epoch - seconds since the epoch
#   $tz    - timezone as "+HHMM" or "-HHMM"; defaults to "-0000"
#
# Returns a hash with the UTC fields hour, minute, mday, day, month,
# rfc2822, mday-time and iso-8601, and the fields hour_local, minute_local,
# tz_local and iso-tz computed for $tz.  A $tz that is not of the form
# [+-]HHMM is treated as a zero offset (it is still echoed in tz_local and
# iso-tz).
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # offset of the local zone from UTC in seconds; stays 0 when $tz
        # cannot be parsed, so no undefined value enters the arithmetic
        my $offset = 0;
        if (my ($tz_sign, $tz_hour, $tz_min) =
                ($tz =~ m/^([-+])(\d\d)(\d\d)$/)) {
                $offset = ($tz_sign eq '-' ? -1 : +1) *
                          ((($tz_hour*60) + $tz_min)*60);
        }
        my $local = $epoch + $offset;
        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3407
# Read a tag object with "git cat-file tag" and return it as a hash.
#
# The hash holds 'id' (the argument), 'object', 'type', 'name', the tagger
# as 'author', 'author_epoch', 'author_tz', 'author_name' and (when the
# tagger has the form "Name <email>") 'author_email', plus 'comment', an
# arrayref with the remaining lines of the object.
#
# Returns nothing when git cannot be started, exits unsuccessfully, or the
# object has no "tag" line.
sub parse_tag {
        my $tag_id = shift;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

        my %tag = ('id' => $tag_id);
        my @comment;
        while (my $line = <$fd>) {
                chomp $line;
                # an empty line ends the header
                last if $line eq "";

                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                } elsif ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                } elsif ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        my ($name, $email) = ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/);
                        if (defined $name) {
                                $tag{'author_name'}  = $name;
                                $tag{'author_email'} = $email;
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                } elsif ($line =~ m/--BEGIN/) {
                        # a header line containing --BEGIN already belongs
                        # to the comment
                        push @comment, $line;
                        last;
                }
        }
        # whatever follows the header is the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag
}
3448
# Parse one record of "git rev-list --header" output into a commit hash.
#
# Parameters:
#   $commit_text - the record: "<id> [<parent>...]" on the first line, then
#                  the commit header lines, an empty line, the message with
#                  each line indented by four spaces, and a final element
#                  (the record separator) that is discarded
#   $withparents - when defined, parents are taken from the first line only;
#                  otherwise "parent" header lines are collected as well
#
# Returns a hash with id, tree, parents, parent, the author*/committer*
# fields, title, title_short, comment (arrayref of message lines with the
# four-space indent removed) and the age fields.  Returns nothing when the
# text has no lines, does not start with 40 hex digits, or has no "tree"
# line.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # consume header lines; the empty line before the message is false
        # and ends the loop
        while (my $line = shift @commit_lines) {
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # the title is the first non-empty message line
        foreach my $line (@commit_lines) {
                # foreach aliases the array elements: work on a copy so the
                # shortening below does not alter the stored message
                (my $title = $line) =~ s/^    //;
                next if $title eq "";

                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        if (length($title) > 50) {
                                $title =~ s/(http|rsync):\/\///;
                        }
                        if (length($title) > 50) {
                                $title =~ s/(master|www|rsync)\.//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/kernel.org:?//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/\/pub\/scm//;
                        }
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        my $commit_date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        # older than two weeks: the date leads and the relative age follows;
        # otherwise the other way round
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = $commit_date;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = $commit_date;
        }
        return %co;
}
3546
# Parse a single commit, identified by $commit_id, into a commit hash.
#
# Runs "git rev-list --parents --header --max-count=1" and hands the one
# record it prints to parse_commit_text().  Returns the resulting hash, or
# nothing when git printed no record; calls die_error(500, ...) when git
# cannot be started.
sub parse_commit {
        my ($commit_id) = @_;

        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--"
                or die_error(500, "Open git-rev-list failed");
        # read in scalar context: inside an argument list <$fd> would be
        # evaluated in list context, and with no output the flag below
        # would take the place of the commit text
        my $commit_text = <$fd>;
        close $fd;

        return unless defined $commit_text;

        my %co = parse_commit_text($commit_text, 1);
        return %co;
}
3565
# Parse a range of history into a list of commit hashes.
#
# Parameters:
#   $commit_id - revision to start from
#   $maxcount  - maximum number of commits (a false value means 1)
#   $skip      - number of commits to skip first (a false value means 0)
#   $filename  - optional path used to limit the history
#   @args      - additional options for "git rev-list"
#
# Each NUL-terminated record printed by "git rev-list --header" is passed to
# parse_commit_text().  Returns the commit hashrefs as a list or an arrayref,
# depending on context; calls die_error(500, ...) when git cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount ||= 1;
        $skip ||= 0;

        # one record per commit
        local $/ = "\0";

        my @path_limit = $filename ? ($filename) : ();
        open my $fd, "-|", git_cmd(), "rev-list",
                "--header",
                @args,
                "--max-count=$maxcount",
                "--skip=$skip",
                @extra_options,
                $commit_id,
                "--",
                @path_limit
                or die_error(500, "Open git-rev-list failed");

        my @cos;
        while (my $record = <$fd>) {
                push @cos, +{ parse_commit_text($record) };
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3593
# Parse one line of git-diff-tree "raw" output.
#
# Three kinds of line are recognized:
#   - an ordinary diff line: from_mode, to_mode, from_id, to_id, status,
#     similarity, from_file, to_file (and file, unless renamed or copied)
#   - a combined diff line (merge commit): nparents, from_mode and from_id
#     as arrayrefs, to_mode, to_id, status as arrayref of letters, to_file
#   - a line holding only a commit id: commit
# Any other line gives an empty result.  Returns a hash in list context and
# a hashref otherwise.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} =
                        ($1, $2, $3, $4, $5, $6);
                my $paths = $7;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        # two tab-separated names: source, then destination
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif ($line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
                my ($colons, $modes, $ids, $letters, $file) = ($1, $2, $3, $4, $5);
                # the last mode and id describe the result, the others the parents
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $letters) ];
                $res{'to_file'}   = unquote($file);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3632
# Wrapper returning the parsed form of a git-diff-tree "raw" line.
# The argument is either a raw line, which is parsed with
# parse_difftree_raw_line(), or a hashref of already parsed (or hand-made)
# info, which is returned as it is.
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # pre-parsed (or generated by hand)
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3645
# Parse one line of git-ls-tree output.
#
# Parameters:
#   $line - the line to parse
#   %opts - '-l' => true when the line has a size column ("ls-tree -l")
#           '-z' => true when the name is used as it is; otherwise it is
#                   passed through unquote()
#
# Returns mode, type, hash, name (and size with '-l') as a hash in list
# context or a hashref otherwise.  A line that does not have the expected
# shape gives an empty result.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        my ($pattern, @fields) = $opts{'-l'}
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                ? (qr/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s,
                   'mode', 'type', 'hash', 'size', 'name')
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                : (qr/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s,
                   'mode', 'type', 'hash', 'name');

        # take the captures from the match itself: $1, $2, ... keep the
        # values of an earlier match when this one fails
        if (my @values = ($line =~ $pattern)) {
                @res{@fields} = @values;
                $res{'name'} = unquote($res{'name'})
                        unless $opts{'-z'};
        }

        return wantarray ? %res : \%res;
}
3681
# Fill _two_ hashes, passed by reference as the 2nd and 3rd argument, with
# the file name and the "blob" link of the pre-image ($from) and of the
# post-image ($to) of a diff.
#
# For a combined diff (nparents set in $diffinfo) $from->{'file'} and
# $from->{'href'} are arrays with one slot per parent, and @parents supplies
# the hash_base of each link; for an ordinary diff they are scalars and the
# global $hash_parent is used.  A 'href' is undefined (combined) or removed
# (ordinary) for an added file, and $to->{'href'} is removed when
# is_deleted() says the file does not exist in the result.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                unless (exists $diffinfo->{'from_file'}) {
                        fill_from_file_info($diffinfo, @parents);
                }
                foreach my $idx (0 .. $diffinfo->{'nparents'} - 1) {
                        # a parent without a name of its own uses the result name
                        my $name = $diffinfo->{'from_file'}[$idx];
                        $name = $diffinfo->{'to_file'}
                                unless defined $name;
                        $from->{'file'}[$idx] = $name;

                        if ($diffinfo->{'status'}[$idx] eq "A") {
                                # new (added) file: nothing to link to in this parent
                                $from->{'href'}[$idx] = undef;
                        } else {
                                $from->{'href'}[$idx] = href(action=>"blob",
                                                             hash_base=>$parents[$idx],
                                                             hash=>$diffinfo->{'from_id'}[$idx],
                                                             file_name=>$from->{'file'}[$idx]);
                        }
                }
        } else {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") {
                        # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                delete $to->{'href'};
        } else {
                # file exists in result
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3727
3728## ......................................................................
3729## parse to array of hashes functions
3730
# List branch-like refs, most recently committed first.
#
# Parameters:
#   $limit   - when true, git is asked for at most $limit + 1 refs
#   @classes - ref namespaces below refs/ to list; defaults to
#              get_branch_refs()
#
# Returns, as a list or an arrayref depending on context, one hashref per
# ref with fullname, name, id, title, epoch and age.  Returns nothing when
# git cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = get_branch_refs() unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @headslist;

        # namespaces whose prefix is stripped from the displayed name; the
        # same for every ref, so built once
        my $strip_refs = join '|', map { quotemeta } get_branch_refs();

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                # the limit keeps an empty committer field defined
                my ($refinfo, $committerinfo) = split(/\0/, $line, 2);
                my ($hash, $name, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) = defined $committerinfo
                        ? ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/)
                        : ();
                $ref_item{'fullname'}  = $name;
                # for refs neither in 'heads' nor 'remotes' we want to
                # show their ref dir; $1 is only valid when the prefix
                # was actually stripped
                my $ref_dir = '';
                if ($name =~ s!^refs/($strip_refs|remotes)/!!) {
                        $ref_dir = $1;
                }
                $ref_item{'name'} = $name;
                if ($ref_dir ne '' and $ref_dir ne 'heads' and $ref_dir ne 'remotes') {
                    $ref_item{'name'} .= ' (' . $ref_dir . ')';
                }

                $ref_item{'id'}    = $hash;
                $ref_item{'title'} = $title || '(no commit message)';
                $ref_item{'epoch'} = $epoch;
                if ($epoch) {
                        $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                } else {
                        $ref_item{'age'} = "unknown";
                }

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3776
# List the refs below refs/tags, most recently created first.
#
# Parameter: $limit - when true, git is asked for at most $limit + 1 tags.
#
# Returns, as a list or an arrayref depending on context, one hashref per
# tag with fullname, name, type, id, reftype and refid; tag objects also get
# subject, and tags and commits get epoch and age.  Returns nothing when git
# cannot be started.
sub git_get_tags_list {
        my $limit = shift;
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                # with the limit an empty creator field stays an empty
                # string; without it split would drop the field and leave
                # $creatorinfo undefined
                my ($refinfo, $creatorinfo) = split(/\0/, $line, 2);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my ($creator, $epoch, $tz) = defined $creatorinfo
                        ? ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/)
                        : ();
                $ref_item{'fullname'} = $name;
                $name =~ s!^refs/tags/!!;

                $ref_item{'type'} = $type;
                $ref_item{'id'} = $id;
                $ref_item{'name'} = $name;
                if ($type eq "tag") {
                        # tag object: report what it points at
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # ref pointing directly at the object
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        if ($epoch) {
                                $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                        } else {
                                $ref_item{'age'} = "unknown";
                        }
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3825
3826## ----------------------------------------------------------------------
3827## filesystem-related functions
3828
# Return the owner of $path as a string passed through to_utf8().
# The name is taken from the GECOS field of the passwd entry for the uid
# that owns the file; everything from the first ',' or ';' on is dropped.
# Returns undef if the path cannot be stat()ed, or if no GECOS field is
# available for the owning uid.
sub get_file_owner {
        my $path = shift;

        # stat() returns an empty list on failure; without this check the
        # undefined uid would be handed to getpwuid() and treated as uid 0
        my @st = stat($path)
                or return undef;
        my $st_uid = $st[4];

        # element 6 of the passwd entry is the GECOS field
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3841
# Print the contents of $filename to the currently selected output handle,
# passing each line through to_utf8().
# Callers are expected to have checked that the file exists; if it still
# cannot be opened, nothing is printed and the function returns quietly
# instead of reading from an unopened handle.
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        # stream line by line rather than slurping the whole file into a list
        while (my $line = <$fd>) {
                print to_utf8($line);
        }
        close $fd;
}
3850
3851## ......................................................................
3852## mimetype related functions
3853
# Look up the MIME type for $filename in a mime.types-style file.
# Parameters:
#   $filename - name whose extension (text after the last '.') is looked up
#   $mimemap  - path of the map file; each non-comment line has the form
#               "<mimetype> <ext> <ext> ..."
# Returns the MIME type string, or undef if the map file is not readable,
# the name has no extension, or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # Check the match result: after a failed match $1 would still hold
        # the capture of some earlier, unrelated match.
        my ($ext) = $filename =~ /\.([^.]*)$/
                or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/, $line);
                foreach my $known_ext (@exts) {
                        $mimemap{$known_ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$ext};
}
3873
# Guess the MIME type of $filename from its extension.
# The map named by $mimetypes_file (if set) is consulted first, then
# /etc/mime.types.  Returns undef for names without a dot or when neither
# map yields a type.
sub mimetype_guess {
        my $filename = shift;

        # nothing to look up without an extension
        return undef unless $filename =~ /\./;

        my $guessed;
        if ($mimetypes_file) {
                # a relative path is relative to the project
                my $map_path = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $guessed = mimetype_guess_file($filename, $map_path);
        }
        $guessed = mimetype_guess_file($filename, '/etc/mime.types')
                unless $guessed;
        return $guessed;
}
3890
# Determine the MIME type of a blob.
#   $fd       - filehandle for the blob contents (may be false)
#   $filename - name of the blob (may be false)
# A type found by mimetype_guess() for the name wins.  Otherwise, without a
# handle, $default_blob_plain_mimetype is returned; with a handle, content
# that passes the -T text test is 'text/plain' and everything else is
# classified by a few well-known image extensions, falling back to
# 'application/octet-stream'.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $by_extension = mimetype_guess($filename);
                return $by_extension if $by_extension;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;

        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3917
# Return the Content-Type value for a blob.
# A true $type is used as given, otherwise it is obtained from
# blob_mimetype($fd, $file_name).  For 'text/plain' the charset from
# $default_text_plain_charset is appended when that variable is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return "$type; charset=$default_text_plain_charset";
}
3928
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Parameters:
#   $highlight - true if highlighting is enabled
#   $file_name - name of the file (a trailing '.in' is ignored)
# The basename is looked up in %highlight_basename first, then its extension
# (text after the last '.') in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # Use the captured value only if the match succeeded; after a failed
        # match $1 would still hold the capture of an earlier, unrelated match.
        my ($ext) = $basename =~ /\.([^.]*)$/
                or return undef;
        # an empty or "0" extension never selected a syntax; keep it that way
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3945
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# Parameters:
#   $fd        - open handle for the blob; closed here when highlighting
#   $highlight - true if highlighting should be performed
#   $syntax    - syntax name passed as "--syntax <name>"; when undefined
#                "--force" is passed instead
# When highlighting, $fd is reopened on a shell pipeline of three commands:
#   git cat-file blob $hash | perl <re-encoding one-liner> | $highlight_bin
# Note that the blob is re-read from the global $hash, not from the handle
# that was passed in.  Calls die_error(500, ...) if the pipeline cannot be
# opened.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight);

        close $fd;
        my $syntax_arg = (defined $syntax) ? "--syntax $syntax" : "--force";
        # The middle stage runs the current perl ($^X): each line that is not
        # valid UTF-8 is decoded from $fallback_encoding, which is handed over
        # as $fe through perl's -s switch parsing ("-fe=...").
        open $fd, quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
                  quote_command($^X, '-CO', '-MEncode=decode,FB_DEFAULT', '-pse',
                    '$_ = decode($fe, $_, FB_DEFAULT) if !utf8::decode($_);',
                    '--', "-fe=$fallback_encoding")." | ".
                  quote_command($highlight_bin).
                  " --replace-tabs=8 --fragment $syntax_arg |"
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3963
3964## ======================================================================
3965## functions printing HTML: header, footer, error page
3966
# Build the page title from the globals describing the current request:
#   "<site>"                                   (no project)
#   "<site> - projects in '<filter>'"          (no project, project filter)
#   "<site> - <project>[/<action>[ - <file>]]" (project selected)
# For the "tree" action a trailing "/" is added to the file name if missing.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (!defined $project) {
                $title .= " - projects in '" . esc_path($project_filter) . "'"
                        if defined $project_filter;
                return $title;
        }
        $title .= " - " . to_utf8($project);

        if (defined $action) {
                $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                if (defined $file_name) {
                        $title .= " - " . esc_path($file_name);
                        $title .= "/"
                                if ($action eq "tree" && $file_name !~ m|/$|);
                }
        }

        return $title;
}
3989
# Choose the content type for HTML pages: 'application/xhtml+xml' only if
# the client explicitly lists it in its Accept header, else 'text/html'.
sub get_content_type_html {
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');

        return 'text/html'
                unless defined $accept;
        return 'text/html'
                unless $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/;
        return 'text/html'
                if $cgi->Accept('application/xhtml+xml') == 0;

        return 'application/xhtml+xml';
}
4003
# Print <link rel="alternate"> elements for the page head.
# With a project selected: an RSS and an Atom feed link, each in a plain and
# a "no merges" variant, built from the parameters returned by
# get_feed_info() (the title defaults to 'log').  Without a project: links
# to the plain-text project index and to the OPML list.
# URLs produced by href() are passed through esc_attr() because they are
# interpolated directly into attribute values here.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # first variant: all commits
                        $href_params{'extra_options'} = undef;
                        $href_params{'action'} = $type;
                        $link_attr{'-href'} = esc_attr(href(%href_params));
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        # second variant: same feed without merge commits
                        $href_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = esc_attr(href(%href_params));
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name),
                       esc_attr(href(project=>undef, action=>"project_index")));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name),
                       esc_attr(href(project=>undef, action=>"opml")));
        }
}
4049
# Print the <link> elements of the page head: stylesheets, feed links
# (only for status '200 OK') and the favicon (if $favicon is defined).
sub print_header_links {
        my $status = shift;

        # print out each stylesheet that exists, providing backwards
        # compatibility for those people who defined $stylesheet in a config
        # file: a defined $stylesheet replaces the whole @stylesheets list
        my @sheets = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
        }
}
4069
# Print one breadcrumb link per path component given as argument.
# Each link points to the "project_list" action filtered by the directory
# prefix accumulated so far, and is followed by " / ".
# Undefined or empty components are skipped.  Components are tested for
# definedness/length rather than truth, so a directory named "0" no longer
# ends the breadcrumb trail early.
sub print_nav_breadcrumbs_path {
        my $dirprefix = undef;
        foreach my $part (@_) {
                next unless defined $part && length $part;
                $dirprefix .= "/" if defined $dirprefix;
                $dirprefix .= $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => $dirprefix,
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
4081
# Print the breadcrumb navigation of the page header.
# Options (passed as a hash):
#   -action_extra => text appended after the action; when given, the action
#                    itself is printed as a link
# Output: the entries of @extra_breadcrumbs and the home link, then either
# the project path, project name and action (project selected) or the
# components of $project_filter.
sub print_nav_breadcrumbs {
        my %opts = @_;

        foreach my $crumb (@extra_breadcrumbs, [ $home_link_str => $home_link ]) {
                my ($text, $target) = @$crumb;
                print $cgi->a({-href => esc_url($target)}, $text) . " / ";
        }

        if (!defined $project) {
                print_nav_breadcrumbs_path(split '/', $project_filter)
                        if defined $project_filter;
                return;
        }

        my @dirname = split '/', $project;
        my $projectbasename = pop @dirname;
        print_nav_breadcrumbs_path(@dirname);
        print $cgi->a({-href => href(action=>"summary")}, esc_html($projectbasename));

        my $action_extra = $opts{-action_extra};
        if (defined $action) {
                # the action becomes a link only when something follows it
                my $action_print = defined $action_extra
                        ? $cgi->a({-href => href(action=>$action)}, $action)
                        : $action;
                print " / $action_print";
        }
        print " / $action_extra" if defined $action_extra;
        print "\n";
}
4109
# Print the search form (a GET form with hidden project/action/hash fields,
# a search-type menu, the text field and the "re" checkbox).
# Side effect: sets the global $searchtext to "" when it is undefined.
# The hash searched from is $hash_base, else $hash, else "HEAD".
sub print_search_form {
        if (!defined $searchtext) {
                $searchtext = "";
        }
        my $search_hash;
        if (defined $hash_base) {
                $search_hash = $hash_base;
        } elsif (defined $hash) {
                $search_hash = $hash;
        } else {
                $search_hash = "HEAD";
        }
        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if ($use_pathinfo) {
                # with the pathinfo feature the project goes into the form's
                # action URL instead of a hidden "p" field
                $action .= "/".esc_url($project);
        }
        print $cgi->start_form(-method => "get", -action => $action) .
              "<div class=\"search\">\n" .
              # hidden "p" field only without pathinfo; otherwise this term
              # is the false value of !$use_pathinfo, i.e. an empty string
              (!$use_pathinfo &&
              $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              # note the comma after " search:\n": print receives two list
              # items here, not one concatenated string
              " " . $cgi->a({-href => href(action=>"search_help"),
                             -title => "search help" }, "?") . " search:\n",
              $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
4145
# Print the HTTP header and the top of the HTML page, up to and including
# the page header div and (for projects, if enabled) the search form.
# Parameters:
#   $status  - HTTP status line; defaults to "200 OK" when false
#   $expires - passed to $cgi->header() as -expires
#   %opts    - '-no_http_header' suppresses the HTTP header; the whole hash
#              is also passed on to print_nav_breadcrumbs()
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                           -status=> $status, -expires => $expires)
                unless ($opts{'-no_http_header'});
        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        # XML prolog, doctype and the fixed part of <head>; the heredoc
        # interpolates $version, $git_version, $content_type,
        # $mod_perl_version and $title
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        if ($ENV{'PATH_INFO'}) {
                print "<base href=\"".esc_url($base_url)."\" />\n";
        }
        print_header_links($status);

        # site-specific markup for <head>, converted with to_utf8() only
        if (defined $site_html_head_string) {
                print to_utf8($site_html_head_string);
        }

        print "</head>\n" .
              "<body>\n";

        # optional site header file, inserted right after <body>
        if (defined $site_header && -f $site_header) {
                insert_file($site_header);
        }

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $cgi->img({-src => esc_url($logo),
                                         -width => 72, -height => 27,
                                         -alt => "git",
                                         -class => "logo"}));
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        # the search form is shown only inside a project
        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                print_search_form();
        }
}
4204
# Print the bottom of the HTML page: the page footer div (project
# description and feed links, or OPML/TXT links when no project is
# selected), optional timing information, the optional site footer file,
# the JavaScript includes and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                if (defined $descr) {
                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
                }

                my %href_params = get_feed_info();
                # no feed parameters for this view: mark the links as generic
                if (!%href_params) {
                        $feed_class .= ' generic';
                }
                $href_params{'-title'} ||= 'log';

                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        } else {
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        }
        print "</div>\n"; # class="page_footer"

        # timing info: elapsed time since $t0 and the number of git commands
        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                # NOTE(review): the href() results are placed into the script
                # text without further escaping -- confirm this is safe for
                # every URL href() can produce
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # onload handler: optional link fixing and timezone setup
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!;
                if (gitweb_check_feature('javascript-actions')) {
                        print qq!       fixLinks();\n!;
                }
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                print qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4283
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# Parameters after the detailed description are options, passed on to
# git_header_html(); with '-error_handler' set the function returns to the
# caller instead of jumping to DONE_GITWEB.
# The error message is HTML-escaped here; the detailed description is
# printed as given (it is HTML).
# A status code not listed above is sent with the 500 status line, so that
# an error page is never delivered as "200 OK".
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # git_header_html() defaults a false status to "200 OK", so an
        # unmapped code must not be passed through as undef
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4327
4328## ----------------------------------------------------------------------
4329## functions printing or outputting HTML: navigation
4330
# Print the page navigation bar (div class "page_nav").
# Parameters:
#   $current  - name of the current view; printed as plain text, not a link
#   $suppress - name of a view to leave out of the bar (if true)
#   $head     - hash used for the commit/commitdiff links and, for some
#               current views, for the shortlog/log links
#   $treehead - 'hash' parameter of the tree link
#   $treebase - 'hash_base' parameter of the tree link
#   $extra    - HTML printed on a second line (pager or formats)
# Entries from the 'actions' feature are inserted after the view named in
# their third element.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' if !defined $extra; # pager or formats

        my @navs = qw(summary shortlog log commit commitdiff tree);
        if ($suppress) {
                @navs = grep { $_ ne $suppress } @navs;
        }

        # href() arguments for each standard view, keyed by view name
        my %arg = map { $_ => {action=>$_} } @navs;
        if (defined $head) {
                for (qw(commit commitdiff)) {
                        $arg{$_}{'hash'} = $head;
                }
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        for (qw(shortlog log)) {
                                $arg{$_}{'hash'} = $head;
                        }
                }
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # the 'actions' feature yields a flat list of (label, link, position)
        # triples; %repl holds the values for the %-escapes in each link
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (@actions) {
                my ($label, $link, $pos) = splice(@actions,0,3);
                # insert
                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
                # munch munch
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        # entries with an '_href' use that link verbatim, all others are
        # built with href() from their argument hash
        print "<div class=\"page_nav\">\n" .
                (join " | ",
                 map { $_ eq $current ?
                       $_ : $cgi->a({-href => ($arg{$_}{_href} ? $arg{$_}{_href} : href(%{$arg{$_}}))}, "$_")
                 } @navs);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4380
# Build the " | "-separated submenu used by the refs views.
# The views are "tags" and "heads", plus "remotes" when the 'remote_heads'
# feature is enabled; the view equal to $current is plain text, every other
# view is a link to the action of the same name.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                push @entries, ($view eq $current)
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view);
        }
        return join " | ", @entries;
}
4393
# Build the "first . prev . next" paging navigation as an HTML string.
# Parameters:
#   $action        - accepted for interface compatibility; not used here
#   $page          - current page number; "first"/"prev" are links if > 0
#   $has_next_link - true if "next" should be a link
# Links replay the current request with a different 'page' parameter.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my $first_and_prev = "first &sdot; prev";
        if ($page > 0) {
                $first_and_prev =
                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
                        " &sdot; " .
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        my $next = "next";
        if ($has_next_link) {
                $next = "" .
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return $first_and_prev . " &sdot; " . $next;
}
4419
4420## ......................................................................
4421## functions printing or outputting HTML: div
4422
# Print a div of class "header" holding a single link of class "title".
# Parameters:
#   $action    - action the link points to; also the link text if $title
#                is false
#   $title     - link text, printed as given
#   $hash      - 'hash' parameter of the link (if true)
#   $hash_base - 'hash_base' parameter of the link (if true)
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $label = $title || $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
4436
# Return one table row (class "metadata_url") with $name in the first cell
# and $url in the second.  Both values are inserted as given.
sub format_repo_url {
        my ($name, $url) = @_;

        return join('',
                '<tr class="metadata_url">',
                "<td>$name</td>",
                "<td>$url</td>",
                "</tr>\n");
}
4441
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed either as *handle or
# *handle{IO}, or a function reference. In the latter case all following
# parameters will be taken as argument to the content function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        # peel off the optional leading hash ref and array ref; whatever
        # comes next is the content
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        # dispatch on the kind of content; anything else (e.g. undef) prints
        # nothing between the header and the closing div
        if (ref($content) eq 'CODE') {
                # remaining arguments in @_ go to the content function
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif (ref($content) eq 'GLOB' or ref($content) eq 'IO::Handle') {
                # reads the handle to the end and prints it unmodified
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4479
# Format a parsed date (hash reference) as HTML:
#   "<rfc2822 date> (HH:MM <tz>)"
# The RFC 2822 part is wrapped in a span with the class given by the third
# value of the 'javascript-timezone' feature, if that value is true.  The
# local time is wrapped in a span of class "atnight" when the local hour is
# before 6.
sub format_timestamp_html {
        my $date = shift;

        my $datetime_class = (gitweb_get_feature('javascript-timezone'))[2];

        my $strtime = $date->{'rfc2822'};
        if ($datetime_class) {
                $strtime = qq!<span class="$datetime_class">$strtime</span>!;
        }

        my $is_night = $date->{'hour_local'} < 6;
        my $localtime_format = $is_night
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';
        my $localtime = sprintf($localtime_format,
                                $date->{'hour_local'},
                                $date->{'minute_local'},
                                $date->{'tz_local'});

        return $strtime . ' ' . $localtime;
}
4500
# Print the author name and author date of a commit in long form.
# Parameters:
#   $co   - commit hash reference (author_name, author_email, author_epoch
#           and author_tz are used)
#   -tag  - name of the enclosing element; defaults to 'div'
# The name is a search link, followed by the timestamp in brackets and the
# avatar.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $author_link = format_search_author($author, "author", esc_html($author));
        my $timestamp = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_link .
              " [" . $timestamp . "]" .
              $avatar .
              "</$tag>\n";
}
4515
# Print table rows with the full author and/or committer information, in
# the layout used by the 'commit' view and similar views.
# Parameters: a commit hash reference, then the list of people to print
# ('author', 'committer'); an empty list means both, in that order.
# Each person takes two rows: name, e-mail and avatar (the avatar cell
# spans both rows), then the timestamp.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        if (!@people) {
                @people = ('author', 'committer');
        }

        for my $role (@people) {
                my $name  = $co->{"${role}_name"};
                my $email = $co->{"${role}_email"};
                my %wd = parse_date($co->{"${role}_epoch"}, $co->{"${role}_tz"});

                my $name_link  = format_search_author($name, $role, esc_html($name));
                my $email_link = format_search_author($email, $role,
                                                      esc_html("<" . $email . ">"));
                my $avatar     = git_get_avatar($email, -size => 'double');
                my $timestamp  = format_timestamp_html(\%wd);

                print "<tr><td>$role</td><td>" .
                      $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $timestamp .
                      "</td>" .
                      "</tr>\n";
        }
}
4543
# Print the "page_path" div: a link to the tree root followed by one link
# per directory component of $name and finally the basename.
# Parameters:
#   $name - path of the object within the tree (may be undef: only the
#           root link is printed)
#   $type - 'blob' (basename links to blob_plain), 'tree' (basename links
#           to the tree and is followed by " / "), anything else prints
#           the basename as plain text
#   $hb   - hash base used for all links
# All link targets are derived from $name, so the output matches the
# argument even if it differs from the global $file_name.
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth value: a leading
                        # directory named "0" must still get its separator
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4581
# Print commit message (log) as HTML, one "<br/>"-terminated line per
# message line.
#
# Parameters:
#   $log  - reference to array of commit message lines; NOTE: the array is
#           modified in place (the title, if requested, and leading empty
#           lines are shifted off)
#   %opts - options:
#             -remove_title     => drop the first line of the log
#             -remove_signoff   => do not print trailer lines, i.e.
#                                  "Signed-off-by: ...", "CC: ..." and
#                                  "<something>link: <URL>" lines
#             -final_empty_line => end the output with a single empty line
#
# Runs of empty lines are collapsed into one, and no empty line is printed
# directly after a (printed) trailer line.
sub git_print_log {
	my $log = shift;
	my %opts = @_;

	if ($opts{'-remove_title'}) {
		# remove title, i.e. first line of log
		shift @$log;
	}
	# remove leading empty lines
	while (defined $log->[0] && $log->[0] eq "") {
		shift @$log;
	}

	# print log
	my $skip_blank_line = 0;
	foreach my $line (@$log) {
		if ($line =~ m/^\s*([A-Z][-A-Za-z]*-[Bb]y|C[Cc]): /) {
			if (! $opts{'-remove_signoff'}) {
				print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
				$skip_blank_line = 1;
			}
			next;
		}

		# A link trailer must be the only thing on the line: the pattern is
		# anchored at both ends so that ordinary text which merely contains
		# "...link: http://..." is not truncated to the link (or dropped
		# altogether with -remove_signoff), but printed in full below.
		if ($line =~ m,^\s*([a-z]*link): (https?://\S+)\s*$,i) {
			if (! $opts{'-remove_signoff'}) {
				print "<span class=\"signoff\">" . esc_html($1) . ": " .
					"<a href=\"" . esc_html($2) . "\">" . esc_html($2) . "</a>" .
					"</span><br/>\n";
				$skip_blank_line = 1;
			}
			next;
		}

		# print only one empty line
		# do not print empty line after signoff
		if ($line eq "") {
			next if ($skip_blank_line);
			$skip_blank_line = 1;
		} else {
			$skip_blank_line = 0;
		}

		print format_log_line_html($line) . "<br/>\n";
	}

	if ($opts{'-final_empty_line'}) {
		# end with single empty line
		print "<br/>\n" unless $skip_blank_line;
	}
}
4633
# Read the contents of the blob with the given id, which for a symbolic
# link is the link target (what the link points to).
# Returns nothing if the git command cannot be started or exits with error.
sub git_get_link_target {
	my ($blob_id) = @_;

	open(my $pipe, "-|", git_cmd(), "cat-file", "blob", $blob_id)
		or return;

	# slurp the whole blob in one read
	my $target = do {
		local $/ = undef;
		<$pipe>;
	};

	# close() on a pipe reports failure of the command
	close($pipe)
		or return;

	return $target;
}
4651
# Given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree).
#
# Parameters:
#   $link_target - contents of the symbolic link
#   $basedir     - directory containing the link, relative to the top tree;
#                  empty or undefined for the top tree itself
#
# Returns the normalized path (with '', '.' and '..' components resolved),
# or nothing (undef in scalar context) if that is not possible: for absolute
# links, for links leading outside the top directory, and for an undefined
# link target.
sub normalize_link_target {
	my ($link_target, $basedir) = @_;

	return unless defined $link_target;

	# absolute symlinks (beginning with '/') cannot be normalized
	return if (substr($link_target, 0, 1) eq '/');

	# normalize link target to path from top (root) tree (dir);
	# test for emptiness explicitly, as directory "0" is false as a boolean
	my $path;
	if (defined $basedir && $basedir ne '') {
		$path = $basedir . '/' . $link_target;
	} else {
		# we are in top (root) tree (dir)
		$path = $link_target;
	}

	# remove //, /./, and /../
	my @path_parts;
	foreach my $part (split('/', $path)) {
		# discard '.' and ''; do not use !$part here, it would also
		# discard a legitimate path component named "0"
		next if ($part eq '' || $part eq '.');
		# handle '..'
		if ($part eq '..') {
			if (@path_parts) {
				pop @path_parts;
			} else {
				# link leads outside repository (outside top dir)
				return;
			}
		} else {
			push @path_parts, $part;
		}
	}

	return join('/', @path_parts);
}
4691
# Print tree entry (row of git_tree), but without encompassing <tr> element.
#
# Parameters:
#   $t          - hashref describing the entry; the keys 'mode', 'type',
#                 'hash' and 'name' are used, and 'size' if it exists
#   $basedir    - prefix prepended verbatim to the entry name to form the
#                 file_name of links (no separator is inserted here)
#   $hash_base  - hash base for links; 'history' links are printed only
#                 when it is defined
#   $have_blame - true if a 'blame' link should be printed for blobs
#
# The format of a table row is: mode [size] list link.  Where mode is
# the mode of the entry, list is the name of the entry, an href,
# and link is the action links of the entry.
sub git_print_tree_entry {
	my ($t, $basedir, $hash_base, $have_blame) = @_;

	my %base_key = ();
	$base_key{'hash_base'} = $hash_base if defined $hash_base;

	# path of the entry as used for file_name in every link below
	my $path = "$basedir$t->{'name'}";

	print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
	if (exists $t->{'size'}) {
		print "<td class=\"size\">$t->{'size'}</td>\n";
	}
	if ($t->{'type'} eq "blob") {
		print "<td class=\"list\">" .
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>$path, %base_key),
			        -class => "list"}, esc_path($t->{'name'}));
		if (S_ISLNK(oct $t->{'mode'})) {
			my $link_target = git_get_link_target($t->{'hash'});
			# check for emptiness explicitly: a plain boolean test would
			# hide a symlink whose target is a file named "0"
			if (defined $link_target && $link_target ne '') {
				my $norm_target = normalize_link_target($link_target, $basedir);
				if (defined $norm_target) {
					print " -> " .
					      $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
					                             file_name=>$norm_target),
					               -title => $norm_target}, esc_path($link_target));
				} else {
					# target cannot be resolved inside the tree: no link
					print " -> " . esc_path($link_target);
				}
			}
		}
		print "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
		                             file_name=>$path, %base_key)},
		              "blob");
		if ($have_blame) {
			print " | " .
			      $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
			                             file_name=>$path, %base_key)},
			              "blame");
		}
		if (defined $hash_base) {
			print " | " .
			      $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
			                             hash=>$t->{'hash'}, file_name=>$path)},
			              "history");
		}
		print " | " .
			$cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
			                       file_name=>$path)},
			        "raw");
		print "</td>\n";

	} elsif ($t->{'type'} eq "tree") {
		print "<td class=\"list\">";
		print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>$path,
		                             %base_key)},
		              esc_path($t->{'name'}));
		print "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>$path,
		                             %base_key)},
		              "tree");
		if (defined $hash_base) {
			print " | " .
			      $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
			                             file_name=>$path)},
			              "history");
		}
		print "</td>\n";
	} else {
		# unknown object: we can only present history for it
		# (this includes 'commit' object, i.e. submodule support)
		print "<td class=\"list\">" .
		      esc_path($t->{'name'}) .
		      "</td>\n";
		print "<td class=\"link\">";
		if (defined $hash_base) {
			print $cgi->a({-href => href(action=>"history",
			                             hash_base=>$hash_base,
			                             file_name=>$path)},
			              "history");
		}
		print "</td>\n";
	}
}
4784
4785## ......................................................................
4786## functions printing large fragments of HTML
4787
# Fill in pre-image filenames for a merge (combined) diff entry.
#
# $diff->{'from_file'} is replaced by a fresh array with one slot per
# parent ($diff->{'nparents'} of them).  A slot is filled, by looking up the
# path of $diff->{'from_id'}[$i] in the i-th of @parents, only when the
# status against that parent is rename ('R') or copy ('C'); all other
# slots stay undefined.  Returns $diff.
sub fill_from_file_info {
	my ($diff, @parents) = @_;

	my $last_parent = $diff->{'nparents'} - 1;

	# start from scratch, and make sure the array has a slot for each parent
	$diff->{'from_file'} = [ ];
	$diff->{'from_file'}[$last_parent] = undef;

	foreach my $i (0 .. $last_parent) {
		my $status = $diff->{'status'}[$i];
		next unless ($status eq 'R' || $status eq 'C');

		$diff->{'from_file'}[$i] =
			git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
	}

	return $diff;
}
4804
# Is current raw difftree line of file deletion, i.e. is the post-image
# object id ('to_id') the null object id.
#
# The null id is all zeros; it is 40 hex digits long with SHA-1 and 64 hex
# digits long with SHA-256 object names, so both lengths are recognized.
sub is_deleted {
	my $diffinfo = shift;

	return $diffinfo->{'to_id'} eq ('0' x 40)
	    || $diffinfo->{'to_id'} eq ('0' x 64);
}
4811
# Does patch correspond to [previous] difftree raw line, i.e. do both
# describe the same post-image file name ('to_file').
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# Result is false if either of them is undefined.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	my $have_both = defined $diffinfo && defined $patchinfo;
	return $have_both unless $have_both;

	return $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4822
4823
# Print the list of changed files ("difftree") as an HTML table.
#
# Parameters:
#   $difftree - reference to array of difftree entries; each entry is passed
#               through parsed_difftree_line() before use
#   $hash     - id of the commit the changes lead to (used as hash_base of
#               links to post-image files)
#   @parents  - ids of the parent commit(s); with more than one parent the
#               table gets the "combined" class, and the first parent is
#               used as hash_base of links to pre-image files of ordinary
#               (non-combined) entries
#
# Rows alternate between the "dark" and "light" classes.  In the
# 'commitdiff' view ($action) each row links to the "patchN" anchor, N
# being the running number of the row's patch.
sub git_difftree_body {
	my ($difftree, $hash, @parents) = @_;
	my ($parent) = $parents[0];
	my $have_blame = gitweb_check_feature('blame');
	print "<div class=\"list_head\">\n";
	if ($#{$difftree} > 10) {
		print(($#{$difftree} + 1) . " files changed:\n");
	}
	print "</div>\n";

	print "<table class=\"" .
	      (@parents > 1 ? "combined " : "") .
	      "diff_tree\">\n";

	# header only for combined diff in 'commitdiff' view
	my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
	if ($has_header) {
		# table header
		print "<thead><tr>\n" .
		       "<th></th><th></th>\n"; # filename, patchN link
		for (my $i = 0; $i < @parents; $i++) {
			my $par = $parents[$i];
			print "<th>" .
			      $cgi->a({-href => href(action=>"commitdiff",
			                             hash=>$hash, hash_parent=>$par),
			               -title => 'commitdiff to parent number ' .
			                          ($i+1) . ': ' . substr($par,0,7)},
			              $i+1) .
			      "&nbsp;</th>\n";
		}
		print "</tr></thead>\n<tbody>\n";
	}

	my $alternate = 1;
	my $patchno = 0;
	# returns link to the anchor of the next patch, advancing the counter
	my $patch_link = sub {
		$patchno++;
		return $cgi->a({-href => href(-anchor=>"patch$patchno")},
		               "patch");
	};

	foreach my $line (@{$difftree}) {
		my $diff = parsed_difftree_line($line);

		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;

		if (exists $diff->{'nparents'}) { # combined diff

			fill_from_file_info($diff, @parents)
				unless exists $diff->{'from_file'};

			if (!is_deleted($diff)) {
				# file exists in the result (child) commit
				print "<td>" .
				      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash),
				              -class => "list"}, esc_path($diff->{'to_file'})) .
				      "</td>\n";
			} else {
				print "<td>" .
				      esc_path($diff->{'to_file'}) .
				      "</td>\n";
			}

			if ($action eq 'commitdiff') {
				# link to patch
				my $link = $patch_link->();
				print "<td class=\"link\">" .
				      $link .
				      " | " .
				      "</td>\n";
			}

			# one cell per parent, then a summary cell
			my $has_history = 0;
			my $not_deleted = 0;
			for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
				my $hash_parent = $parents[$i];
				my $from_hash = $diff->{'from_id'}[$i];
				my $from_path = $diff->{'from_file'}[$i];
				my $status = $diff->{'status'}[$i];

				$has_history ||= ($status ne 'A');
				$not_deleted ||= ($status ne 'D');

				if ($status eq 'A') {
					print "<td  class=\"link\" align=\"right\"> | </td>\n";
				} elsif ($status eq 'D') {
					print "<td class=\"link\">" .
					      $cgi->a({-href => href(action=>"blob",
					                             hash_base=>$hash,
					                             hash=>$from_hash,
					                             file_name=>$from_path)},
					              "blob" . ($i+1)) .
					      " | </td>\n";
				} else {
					if ($diff->{'to_id'} eq $from_hash) {
						print "<td class=\"link nochange\">";
					} else {
						print "<td class=\"link\">";
					}
					print $cgi->a({-href => href(action=>"blobdiff",
					                             hash=>$diff->{'to_id'},
					                             hash_parent=>$from_hash,
					                             hash_base=>$hash,
					                             hash_parent_base=>$hash_parent,
					                             file_name=>$diff->{'to_file'},
					                             file_parent=>$from_path)},
					              "diff" . ($i+1)) .
					      " | </td>\n";
				}
			}

			print "<td class=\"link\">";
			if ($not_deleted) {
				print $cgi->a({-href => href(action=>"blob",
				                             hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "blob");
				print " | " if ($has_history);
			}
			if ($has_history) {
				print $cgi->a({-href => href(action=>"history",
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "history");
			}
			print "</td>\n";

			print "</tr>\n";
			next; # instead of 'else' clause, to avoid extra indent
		}
		# else ordinary diff

		# mode '000000' means "no such side" (creation or deletion);
		# the corresponding variables are then left undefined
		my ($to_mode_oct, $to_mode_str, $to_file_type);
		my ($from_mode_oct, $from_mode_str, $from_file_type);
		if ($diff->{'to_mode'} ne ('0' x 6)) {
			$to_mode_oct = oct $diff->{'to_mode'};
			if (S_ISREG($to_mode_oct)) { # only for regular file
				$to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
			}
			$to_file_type = file_type($diff->{'to_mode'});
		}
		if ($diff->{'from_mode'} ne ('0' x 6)) {
			$from_mode_oct = oct $diff->{'from_mode'};
			if (S_ISREG($from_mode_oct)) { # only for regular file
				$from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
			}
			$from_file_type = file_type($diff->{'from_mode'});
		}

		if ($diff->{'status'} eq "A") { # created
			my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
			$mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
			$mode_chng   .= "]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $patch_link->() .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			              "blob");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "D") { # deleted
			# the file exists only in the parent, hence hash_base=>$parent
			my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'}),
			               -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $patch_link->() .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
			my $mode_chnge = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				$mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
				if ($from_file_type ne $to_file_type) {
					$mode_chnge .= " from $from_file_type to $to_file_type";
				}
				if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
					if ($from_mode_str && $to_mode_str) {
						$mode_chnge .= " mode: $from_mode_str->$to_mode_str";
					} elsif ($to_mode_str) {
						$mode_chnge .= " mode: $to_mode_str";
					}
				}
				$mode_chnge .= "]</span>\n";
			}
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chnge</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $patch_link->() .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only mode changed)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "diff") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			               "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
			my %status_name = ('R' => 'moved', 'C' => 'copied');
			my $nstatus = $status_name{$diff->{'status'}};
			my $mode_chng = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				# mode also for directories, so we cannot use $to_mode_str
				$mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
			}
			print "<td>" .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
			                             hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
			              -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
			      "<td><span class=\"file_status $nstatus\">[$nstatus from " .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
			                             hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
			              -class => "list"}, esc_path($diff->{'from_file'})) .
			      " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
			      "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				print $patch_link->() .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only pure rename or copy)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
				              "diff") .
				      " | ";
			}
			# The post-image (to_id / to_file) belongs to $hash, not to
			# $parent: use the same hash_base as the link in the first
			# column, which points to the very same blob.
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'to_file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'to_file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                            file_name=>$diff->{'to_file'})},
			              "history");
			print "</td>\n";

		} # we should not encounter Unmerged (U) or Unknown (X) status
		print "</tr>\n";
	}
	print "</tbody>" if $has_header;
	print "</table>\n";
}
5131
# Print context lines and then rem/add lines in a side-by-side manner.
#
# $ctx, $rem and $add are references to arrays of already formatted lines.
# Context lines (if any) are printed on both the "old" and the "new" side;
# after that follows exactly one block: "rem" (old side only) when there are
# no added lines, "add" (new side only) when there are no removed lines,
# and "chg" (both sides) otherwise.
sub print_sidebyside_diff_lines {
	my ($ctx, $rem, $add) = @_;

	# build one chunk block; a side which is undefined is left out
	my $chunk_block = sub {
		my ($class, $old, $new) = @_;

		my $html = "<div class=\"chunk_block $class\">";
		$html .= '<div class="old">' . join('', @$old) . '</div>'
			if defined $old;
		$html .= '<div class="new">' . join('', @$new) . '</div>'
			if defined $new;
		return $html . '</div>';
	};

	# print context block before add/rem block
	print $chunk_block->('ctx', $ctx, $ctx)
		if (@$ctx);

	if (!@$add) {
		# pure removal
		print $chunk_block->('rem', $rem, undef);
	} elsif (!@$rem) {
		# pure addition
		print $chunk_block->('add', undef, $add);
	} else {
		print $chunk_block->('chg', $rem, $add);
	}
}
5177
# Print one diff chunk in inline layout: all context lines, then all
# removed lines, then all added lines.  Each argument is a reference to
# an array of already formatted lines, which are output verbatim.
sub print_inline_diff_lines {
        my ($ctx, $rem, $add) = @_;

        print map { @$_ } ($ctx, $rem, $add);
}
5184
# Format a pair of corresponding removed and added lines, marking the
# part that differs between them, and HTML-format both.
# Implementation is based on contrib/diff-highlight.
#
# $rem, $add    - raw removed and added line
# $num_parents  - number of leading +/- status characters to skip
#
# Returns the two formatted lines (removed first, then added).
sub format_rem_add_lines_pair {
        my ($rem, $add, $num_parents) = @_;

        # Tabs have to be expanded before the lines are split into
        # characters; otherwise the offsets computed below would be invalid.
        chomp $rem;
        chomp $add;
        $rem = untabify($rem);
        $add = untabify($add);

        my @rem_chars = split(//, $rem);
        my @add_chars = split(//, $add);
        my $min_len = (@rem_chars < @add_chars) ? @rem_chars : @add_chars;

        # Length of the common prefix; the leading +/- characters
        # (one per parent) are ignored.
        my $prefix_len = $num_parents;
        my $prefix_has_nonspace;
        for (; $prefix_len < $min_len; $prefix_len++) {
                my $char = $rem_chars[$prefix_len];
                last if ($char ne $add_chars[$prefix_len]);

                $prefix_has_nonspace = 1 if ($char !~ /\s/);
        }

        # Length of the common suffix, not overlapping the prefix.
        my $suffix_len = 0;
        my $suffix_has_nonspace;
        for (; $prefix_len + $suffix_len < $min_len; $suffix_len++) {
                my $char = $rem_chars[-1 - $suffix_len];
                last if ($char ne $add_chars[-1 - $suffix_len]);

                $suffix_has_nonspace = 1 if ($char !~ /\s/);
        }

        # Only mark the changed region when the lines share some common part
        # that isn't whitespace.  Completely different lines are left
        # unmarked, because marking them would make the output unreadable,
        # especially if the diff consists of multiple lines.
        my ($esc_rem, $esc_add);
        unless ($prefix_has_nonspace || $suffix_has_nonspace) {
                $esc_rem = esc_html($rem, -nbsp=>1);
                $esc_add = esc_html($add, -nbsp=>1);
        } else {
                my $rem_end = @rem_chars - $suffix_len;
                my $add_end = @add_chars - $suffix_len;
                $esc_rem = esc_html_hl_regions($rem, 'marked',
                        [$prefix_len, $rem_end], -nbsp=>1);
                $esc_add = esc_html_hl_regions($add, 'marked',
                        [$prefix_len, $add_end], -nbsp=>1);
        }

        return (format_diff_line(\$esc_rem, 'rem'),
                format_diff_line(\$esc_add, 'add'));
}
5236
# HTML-format the context, removed and added lines of one diff block.
#
# $ctx, $rem, $add - references to arrays of raw diff lines
# $num_parents     - number of parents (more than one: combined diff)
#
# Returns references to three new arrays with the formatted context,
# removed and added lines, in that order.
sub format_ctx_rem_add_lines {
        my ($ctx, $rem, $add, $num_parents) = @_;
        my (@new_ctx, @new_rem, @new_add);

        # Changed parts can be highlighted only if every removed line has
        # a corresponding added line.
        my $can_highlight = (@$add > 0 && @$add == @$rem) ? 1 : 0;

        # In a combined diff highlight only if each pair is a diff between
        # the same versions, e.g.
        #
        #    - a
        #   -  b
        #    + c
        #   +  d
        #
        # Otherwise the highlighting would be confusing.
        if ($can_highlight && $num_parents > 1) {
                foreach my $i (0 .. $#$add) {
                        my $prefix_rem = substr($rem->[$i], 0, $num_parents);
                        my $prefix_add = substr($add->[$i], 0, $num_parents);

                        # the status columns must match once '-' is read as '+'
                        $prefix_rem =~ tr/-/+/;
                        next if ($prefix_rem eq $prefix_add);

                        $can_highlight = 0;
                        last;
                }
        }

        if (!$can_highlight) {
                foreach my $line (@$rem) {
                        push @new_rem, format_diff_line($line, 'rem');
                }
                foreach my $line (@$add) {
                        push @new_add, format_diff_line($line, 'add');
                }
        } else {
                foreach my $i (0 .. $#$add) {
                        my ($line_rem, $line_add) = format_rem_add_lines_pair(
                                $rem->[$i], $add->[$i], $num_parents);
                        push @new_rem, $line_rem;
                        push @new_add, $line_add;
                }
        }

        foreach my $line (@$ctx) {
                push @new_ctx, format_diff_line($line, 'ctx');
        }

        return (\@new_ctx, \@new_rem, \@new_add);
}
5288
# Format and print accumulated context lines followed by rem/add lines.
#
# $ctx, $rem, $add - references to arrays of raw diff lines
# $diff_style      - 'sidebyside' selects the two-column layout; any
#                    other value gives the inline layout
# $num_parents     - number of parents (more than one: combined diff)
sub print_diff_lines {
        my ($ctx, $rem, $add, $diff_style, $num_parents) = @_;
        my $is_combined = $num_parents > 1;

        my @formatted = format_ctx_rem_add_lines($ctx, $rem, $add,
                $num_parents);

        # side-by-side layout is never used for combined diffs;
        # 'inline' is the default and also covers unknown styles
        my $printer = ($diff_style eq 'sidebyside' && !$is_combined)
                ? \&print_sidebyside_diff_lines
                : \&print_inline_diff_lines;

        $printer->(@formatted[0 .. 2]);
}
5304
# Print one chunk of a patch.
#
# $diff_style, $num_parents - passed through to print_diff_lines()
# $from, $to                - passed to format_diff_line() for chunk headers
# @chunk                    - list of [ $class, $line ] pairs
#
# Lines are gathered into context / removed / added accumulators and
# flushed with print_diff_lines() in blocks, so that removed and added
# lines belonging together are printed together.
sub print_diff_chunk {
        my ($diff_style, $num_parents, $from, $to, @chunk) = @_;

        return unless @chunk;

        my (@ctx, @rem, @add);
        my %accumulator_for = (ctx => \@ctx, rem => \@rem, add => \@add);

        # an incomplete last line might be among removed or added lines,
        # or both, or among context lines: it takes the class of the
        # line that precedes it
        foreach my $i (1 .. $#chunk) {
                $chunk[$i][0] = $chunk[$i-1][0]
                        if ($chunk[$i][0] eq 'incomplete');
        }

        # guardian: forces the final flush and terminates the loop
        push @chunk, ["", ""];

        # the class of the previous (non-header) line
        my $prev_class = '';

        foreach my $line_info (@chunk) {
                my ($class, $line) = @$line_info;

                # chunk headers are printed right away
                if ($class && $class eq 'chunk_header') {
                        print format_diff_line($line, $class, $from, $to);
                        next;
                }

                # Flush the accumulators at the end of the chunk, when
                # context follows some add/rem lines, or when both add and
                # rem lines are present and a new block is reached
                # (otherwise add/rem lines could be reordered).
                my $have_changes = (@rem || @add);
                my $need_flush = !$class
                        || ($have_changes && $class eq 'ctx')
                        || (@rem && @add && $class ne $prev_class);
                if ($need_flush) {
                        print_diff_lines(\@ctx, \@rem, \@add,
                                         $diff_style, $num_parents);
                        @ctx = ();
                        @rem = ();
                        @add = ();
                }

                # guardian value reached
                last unless $line;

                # add the line to its accumulator (rem, add or ctx);
                # lines of any other class are not accumulated
                my $accumulator = $accumulator_for{$class};
                push @$accumulator, $line if $accumulator;

                $prev_class = $class;
        }
}
5362
# Read a patchset from filehandle $fd and print it as HTML inside
# <div class="patchset">, with one <div class="patch"> per patch.
#
# $fd           - filehandle the patch text is read from, line by line
# $diff_style   - passed on to print_diff_chunk()
# $difftree     - reference to array of raw difftree lines; the entry
#                 matching each patch is parsed with parsed_difftree_line()
# $hash         - not used by this subroutine
# @hash_parents - parents of the commit; more than one parent means
#                 the patchset is a combined diff
#
# Raw difftree entries that have no patch of their own (which can happen
# for compact combined diff) get a simplified entry, so that every raw
# line still has a "patchN" anchor.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;
        my $patch_number = 0;
        my $patch_line;
        my $diffinfo;
        my $to_name;
        my (%from, %to);
        my @chunk; # for side-by-side diff

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # input ended within the extended header
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                # patch without from-file/to-file header and without chunks
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                # The input may end right after the "---" line (truncated
                # diff); use an empty to-file line then, instead of passing
                # an undefined value to chomp and to the formatting code.
                # The loops below read from $fd again and stop at EOF.
                $patch_line = '' unless defined $patch_line;
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        my $class = diff_line_class($patch_line, \%from, \%to);

                        # a chunk header starts a new chunk: print the
                        # lines gathered for the previous one
                        if ($class eq 'chunk_header') {
                                print_diff_chunk($diff_style, scalar @hash_parents, \%from, \%to, @chunk);
                                @chunk = ();
                        }

                        push @chunk, [ $class, $patch_line ];
                }

        } continue {
                # runs on "next PATCH" and at the normal end of an iteration
                # (but not on "last PATCH"): print the last chunk, close patch
                if (@chunk) {
                        print_diff_chunk($diff_style, scalar @hash_parents, \%from, \%to, @chunk);
                        @chunk = ();
                }
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
5525
5526# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5527
# Print the project search form: a text field pre-filled with
# $searchtext, an 're' checkbox (checked according to $search_use_regexp),
# a submit button, and a link that lists all projects.  When the global
# $project_filter is set, it is submitted with the form and named in the
# field title and in the link text.
sub git_project_search_form {
        my ($searchtext, $search_use_regexp) = @_;

        # names the directory the list is limited to, if any
        my $limit = $project_filter ? " in '$project_filter/'" : '';

        print "<div class=\"projsearch\">\n";

        my $form_start   = $cgi->start_form(-method => 'get', -action => $my_uri);
        my $action_field = $cgi->hidden(-name => 'a', -value => 'project_list');
        print $form_start . $action_field . "\n";

        if (defined $project_filter) {
                my $filter_field = $cgi->hidden(-name => 'pf', -value => $project_filter);
                print $filter_field . "\n";
        }

        my $text_field = $cgi->textfield(-name => 's', -value => $searchtext,
                                         -title => "Search project by name and description$limit",
                                         -size => 60);
        my $regexp_box = $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                        -checked => $search_use_regexp);
        my $submit     = $cgi->submit(-name => 'btnS', -value => 'Search');
        my $form_end   = $cgi->end_form();
        my $list_all   = $cgi->a({-href => href(project => undef, searchtext => undef,
                                                project_filter => $project_filter)},
                                 esc_html("List all projects$limit"));

        print $text_field . "\n" .
              "<span title=\"Extended regular expression\">" .
              $regexp_box .
              "</span>\n" .
              $submit .
              $form_end . "\n" .
              $list_all . "<br />\n";
        print "</div>\n";
}
5555
# Check whether the %$project_info entry needs filling for given @keys,
# i.e. whether at least one of the keys is not present in it (a key that
# exists with an undefined value counts as present).
#
# Returns 1 if some key is missing; otherwise returns nothing (empty list
# in list context, undef in scalar context).
sub project_info_needs_filling {
        my ($project_info, @keys) = @_;

        # equivalent of List::MoreUtils::any { !exists ... } @keys
        return 1 if grep { !exists $project_info->{$_} } @keys;
        return;
}
5569
# Fill in project list info (age, description, owner, category, ctags)
# for each project in @$projlist, or only the fields named in
# @wanted_keys, and return the list of projects that were kept.
#
# A project is dropped from the returned list only when its 'age' /
# 'age_string' had to be filled and git_get_last_activity() returned
# nothing for it; these are the only fields whose filling can drop
# a project.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   ensures that 'descr_long' and 'ctags' fields are filled
# * @project_list = fill_project_list_info(\@project_list)
#   ensures that all fields are filled (and invalid projects removed)
#
# NOTE: modifies entries of $projlist in place, but does not remove
# entries from it
sub fill_project_list_info {
        my ($projlist, @wanted_keys) = @_;
        my @projects;

        my %is_wanted = map { $_ => 1 } @wanted_keys;
        # Tells if given project lacks any of given fields; when
        # @wanted_keys is non-empty, only the wanted fields are considered.
        my $needs_filling = sub {
                my ($pr, @fields) = @_;
                @fields = grep { $is_wanted{$_} } @fields
                        if @wanted_keys;
                return project_info_needs_filling($pr, @fields);
        };

        my $show_ctags = gitweb_check_feature('ctags');
 PROJECT:
        foreach my $pr (@$projlist) {
                my $path = $pr->{'path'};

                if ($needs_filling->($pr, 'age', 'age_string')) {
                        my @activity = git_get_last_activity($path);
                        # no activity info: leave project out of the result
                        next PROJECT unless @activity;
                        @{$pr}{'age', 'age_string'} = @activity;
                }
                if ($needs_filling->($pr, 'descr', 'descr_long')) {
                        my $descr = to_utf8(git_get_project_description($path) || "");
                        $pr->{'descr_long'} = $descr;
                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }
                if ($needs_filling->($pr, 'owner')) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }
                if ($show_ctags && $needs_filling->($pr, 'ctags')) {
                        $pr->{'ctags'} = git_get_project_ctags($path);
                }
                if ($projects_list_group_categories &&
                    $needs_filling->($pr, 'category')) {
                        $pr->{'category'} = to_utf8(git_get_project_category($path) ||
                                                    $project_list_default_category);
                }

                push @projects, $pr;
        }

        return @projects;
}
5630
# Return the projects from @$projlist sorted according to $order
# ('project', 'descr', 'owner' or 'age'); for any other $order the
# list is returned as is.
sub sort_projects_list {
        my ($projlist, $order) = @_;

        my %comparator_for = (
                project => order_str('path'),
                descr   => order_str('descr_long'),
                owner   => order_str('owner'),
                age     => order_num_then_undef('age'),
        );

        my $comparator = $comparator_for{$order};
        return @$projlist unless defined $comparator;
        return sort $comparator @$projlist;
}

# Build sort comparator that compares field $key of projects as strings.
sub order_str {
        my $key = shift;
        return sub { $a->{$key} cmp $b->{$key} };
}

# Build sort comparator that compares field $key of projects as numbers,
# placing projects where the field is undefined after all the others.
sub order_num_then_undef {
        my $key = shift;
        return sub {
                my ($left, $right) = ($a->{$key}, $b->{$key});

                return (defined $right ? 1 : 0) unless defined $left;
                return -1 unless defined $right;
                return $left <=> $right;
        };
}
5658
# Group projects by category.
#
# Takes entries $from..$to of @$projlist ($from defaults to 0; $to
# defaults to, and is limited by, the last index) and returns a hash
# that maps each category to a reference to the array of projects
# belonging to it, in their original order.  In list context the hash
# itself is returned, otherwise a reference to it.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        my $last_idx = $#$projlist;
        $from = 0 unless defined $from;
        $to = $last_idx if (!defined $to || $last_idx < $to);

        my %categories;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                push @{$categories{ $pr->{'category'} }}, $pr;
        }

        return %categories if wantarray;
        return \%categories;
}
5675
# Print 'sort by' <th> element as generated by format_sort_th(), which
# makes it a 'sort by $name' replay link unless that order is already
# selected.
sub print_sort_th {
        my ($name, $order, $header) = @_;

        print format_sort_th($name, $order, $header);
}
5681
# Return 'sort by' <th> element for column $name.
#
# $name   - name of the ordering this column selects
# $order  - currently selected ordering
# $header - column header contents; defaults to ucfirst($name)
#
# The header is plain when the column is the one currently sorted by,
# and a link replaying the request with order=$name otherwise.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # already sorted by this column: nothing to link to
        return "<th>$header</th>\n" if ($order eq $name);

        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
5698
# Print rows (<tr> elements) of the projects list table for entries
# $from..$to of @$projlist ($from defaults to 0; $to defaults to, and is
# limited by, the last index).  Rows alternate between the "dark" and
# "light" classes, starting with "dark".
#
# With true $check_forks every row starts with an extra cell, which
# holds a "+" marker when the project has a 'forks' entry.  The owner
# and age cells are left out when the globals $omit_owner and
# $omit_age_column are set, respectively.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my $is_dark = 1;
        foreach my $i ($from .. $to) {
                my $pr = $projlist->[$i];

                my $row_class = $is_dark ? 'dark' : 'light';
                print "<tr class=\"$row_class\">\n";
                $is_dark = !$is_dark;

                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                my $nforks = scalar @{$pr->{'forks'}};
                                # link to the forks only if there are any
                                print(($nforks > 0)
                                        ? $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
                                                   -title => "$nforks forks"}, "+")
                                        : $cgi->span({-title => "$nforks forks"}, "+"));
                        }
                        print "</td>\n";
                }

                # project name and description, both linking to the summary
                my $path_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                         -class => "list"},
                                        esc_html_match_hl($pr->{'path'}, $search_regexp));
                my $descr_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                          -class => "list",
                                          -title => $pr->{'descr_long'}},
                                         $search_regexp
                                         ? esc_html_match_hl_chopped($pr->{'descr_long'},
                                                                     $pr->{'descr'}, $search_regexp)
                                         : esc_html($pr->{'descr'}));
                print "<td>" . $path_link . "</td>\n" .
                      "<td>" . $descr_link . "</td>\n";

                if (!$omit_owner) {
                        print "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
                }
                if (!$omit_age_column) {
                        my $age_string = defined $pr->{'age_string'}
                                ? $pr->{'age_string'} : "No commits";
                        print "<td class=\"". age_class($pr->{'age'}) . "\">" .
                              $age_string . "</td>\n";
                }

                # action links; "forks" only for projects with a 'forks' entry
                my @actions = qw(summary shortlog log tree);
                push @actions, 'forks' if $pr->{'forks'};
                my @links = map {
                        scalar $cgi->a({-href => href(project=>$pr->{'path'}, action=>$_)}, $_)
                } @actions;
                print "<td class=\"link\">" .
                      join(" | ", @links) .
                      "</td>\n" .
                      "</tr>\n";
        }
}
5758
# Print the projects list: optional tag cloud, then the
# <table class="project_list"> with an optional header row, the project
# rows (grouped by category if $projects_list_group_categories is set),
# and an optional final row.
#
# $projlist   - reference to array of projects; it is copied, then
#               filtered (forks, search, tag filter) and filled with info
# $order      - ordering of projects; defaults to $default_projects_order
# $from, $to  - window of the resulting list to show; default to the
#               whole list
# $extra      - if defined, contents of an additional last row (printed
#               as is, so it has to be HTML already)
# $no_header  - if true, the row with column headers is not printed
#
# Prints a "No such projects found" message instead of the table when
# the window is empty.
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
        # forks are not filtered out when searching or filtering by tag
        $check_forks = undef
                if ($tagfilter || $search_regexp);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        # search_projects_list pre-fills required info
        @projects = search_projects_list(\@projects,
                                         'search_regexp' => $search_regexp,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $search_regexp);
        # fill the rest
        my @all_fields = ('descr', 'descr_long', 'ctags', 'category');
        push @all_fields, ('age', 'age_string') unless($omit_age_column);
        push @all_fields, 'owner' unless($omit_owner);
        @projects = fill_project_list_info(\@projects, @all_fields);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner') unless $omit_owner;
                print_sort_th('age', $order, 'Last Change') unless $omit_age_column;
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds just the window, indexed from 0, so all
                # of it is grouped; applying the original $from/$to offsets
                # again would drop rows whenever $from is greater than 0
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects with empty category get no category row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5849
# Print commits in the 'log' format: for each commit a header, links to
# the commit, commitdiff and tree views, authorship and the full log
# message.
#
# $commitlist - reference to array of commits (hash references)
# $from, $to  - range of @$commitlist entries to print; $from defaults
#               to 0, $to defaults to (and is limited by) the last index
# $refs       - passed to format_ref_marker() to mark the commits
# $extra      - if true, printed after the commits inside
#               <div class="page_nav"> (as is, so it has to be HTML)
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from (it used to be ignored here, with the loop always
        # starting at 0), like the other *_body subroutines do
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                # skip empty commit entries
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5888
# Print the 'shortlog' table: one row per commit with its age, author,
# subject and a cell of action links.
#
# Parameters:
#   $commitlist - reference to an array of commit hashes
#   $from, $to  - inclusive index range; $from defaults to 0, $to is
#                 clamped to the last index of $commitlist
#   $refs       - handed to format_ref_marker() together with the commit id
#   $extra      - optional HTML; when defined it is printed in a final row
#                 spanning four columns
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 if !defined $from;
	my $last_idx = $#{$commitlist};
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"shortlog\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		# rows alternate between the "dark" and "light" classes
		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# age is shown as a date, with the relative age as tooltip
		my $author_cell = format_author_html('td', \%co, 10);
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
		my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $commit_link . " | " . $diff_link . " | " . $tree_link;

		# snapshot links are appended only when format_snapshot_links()
		# returns something
		my $snapshot_links = format_snapshot_links($commit);
		print " | " . $snapshot_links if defined $snapshot_links;

		print "</td>\n";
		print "</tr>\n";
	}

	if (defined $extra) {
		print "<tr>\n";
		print "<td colspan=\"4\">$extra</td>\n";
		print "</tr>\n";
	}
	print "</table>\n";
}
5932
# Print the 'history' table for a single path: one row per commit with
# age, author, subject and links to the path at that commit.
#
# Parameters:
#   $commitlist - reference to an array of commit hashes
#   $from, $to  - inclusive index range; $from defaults to 0, $to is
#                 clamped to the last index of $commitlist
#   $refs       - handed to format_ref_marker() together with the commit id
#   $extra      - optional HTML; when defined it is printed in a final row
#   $file_name  - path whose history is shown
#   $file_hash  - hash of the current version, used for "diff to current"
#   $ftype      - used both as the action name and as the label of the
#                 first link; 'blob' additionally enables the "raw" and
#                 "diff to current" links
#
# Also reads the global $hash_base for the "diff to current" link.
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	$from = 0 if !defined $from;
	if (!defined $to || $to > $#{$commitlist}) {
		$to = $#{$commitlist};
	}

	print "<table class=\"history\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# the author column is wider here (15, 3) than in the shortlog
		my $author_cell = format_author_html('td', \%co, 15, 3);
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $view_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
		my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $view_link . " | " . $diff_link;

		if ($ftype eq 'blob') {
			my $raw_link = $cgi->a({-href => href(action=>"blob_plain", hash_base=>$commit, file_name=>$file_name)}, "raw");
			print " | " . $raw_link;

			# offer a diff against the current version only when both
			# hashes are known and actually differ
			my $blob_current = $file_hash;
			my $blob_parent  = git_get_hash_by_path($commit, $file_name);
			my $differs = defined $blob_current && defined $blob_parent &&
			              $blob_current ne $blob_parent;
			if ($differs) {
				my $blobdiff_link =
					$cgi->a({-href => href(action=>"blobdiff",
					                       hash=>$blob_current, hash_parent=>$blob_parent,
					                       hash_base=>$hash_base, hash_parent_base=>$commit,
					                       file_name=>$file_name)},
					        "diff to current");
				print " | " . $blobdiff_link;
			}
		}
		print "</td>\n";
		print "</tr>\n";
	}

	if (defined $extra) {
		print "<tr>\n";
		print "<td colspan=\"4\">$extra</td>\n";
		print "</tr>\n";
	}
	print "</table>\n";
}
5995
# Print the 'tags' table: one row per tag with its age, name, subject,
# a self link (for tag objects) and links to the tagged object.
#
# Parameters:
#   $taglist    - reference to an array of tag hashes; the keys read here
#                 are 'subject', 'age', 'name', 'id', 'type', 'reftype',
#                 'refid' and 'fullname'
#   $from, $to  - inclusive index range; $from defaults to 0, $to is
#                 clamped to the last index of $taglist
#   $extra      - optional HTML; when defined it is printed in a final row
#                 spanning five columns
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;

	$from = 0 if !defined $from;
	my $last_idx = $#{$taglist};
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"tags\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %tag = %{$taglist->[$idx]};
		my $reftype = $tag{'reftype'};

		# the subject is optional; shorten it only when there is one
		my $comment = $tag{'subject'};
		my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# age column (left empty when the age is unknown)
		print defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n" : "<td></td>\n";

		# name column, linking to the tagged object
		my $name_link = $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'}),
		                         -class => "list name"}, esc_html($tag{'name'}));
		print "<td>" . $name_link . "</td>\n" . "<td>";

		# subject column
		if (defined $comment) {
			print format_subject_html($comment, $comment_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}
		print "</td>\n" . "<td class=\"selflink\">";

		# self link exists only for real tag objects
		if ($tag{'type'} eq "tag") {
			print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
		} else {
			print "&nbsp;";
		}

		# links to the tagged object, depending on its type
		my $object_link = $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'})}, $reftype);
		print "</td>\n" . "<td class=\"link\"> | " . $object_link;
		if ($reftype eq "commit") {
			my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
			my $log_link = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
			print " | " . $shortlog_link . " | " . $log_link;
		} elsif ($reftype eq "blob") {
			my $raw_link = $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
			print " | " . $raw_link;
		}
		print "</td>\n" . "</tr>";
	}

	if (defined $extra) {
		print "<tr>\n";
		print "<td colspan=\"5\">$extra</td>\n";
		print "</tr>\n";
	}
	print "</table>\n";
}
6058
# Print the 'heads' table: one row per branch head with its age, name and
# "shortlog | log | tree" links.
#
# Parameters:
#   $headlist   - reference to an array of head hashes; the keys read here
#                 are 'id', 'age', 'name' and 'fullname'
#   $head_at    - optional id; a head whose 'id' equals it gets the
#                 "current_head" cell class
#   $from, $to  - inclusive index range; $from defaults to 0, $to is
#                 clamped to the last index of $headlist
#   $extra      - optional HTML; when defined it is printed in a final row
#                 spanning three columns
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head_at, $from, $to, $extra) = @_;

	$from = 0 if !defined $from;
	my $last_idx = $#{$headlist};
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"heads\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %ref = %{$headlist->[$idx]};
		my $is_current = defined $head_at && $ref{'id'} eq $head_at;

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		my $name_cell_open = $is_current ? "<td class=\"current_head\">" : "<td>";
		my $name_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
		                         -class => "list name"},esc_html($ref{'name'}));
		my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog");
		my $log_link = $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree");

		print "<td><i>$ref{'age'}</i></td>\n" .
		      $name_cell_open . $name_link . "</td>\n" .
		      "<td class=\"link\">" .
		      $shortlog_link . " | " . $log_link . " | " . $tree_link .
		      "</td>\n" .
		      "</tr>";
	}

	if (defined $extra) {
		print "<tr>\n";
		print "<td colspan=\"3\">$extra</td>\n";
		print "</tr>\n";
	}
	print "</table>\n";
}
6096
# Display a single remote block: a small table with the remote's URLs
# followed by the table of its heads.
#
# Parameters:
#   $remote - remote name, used for the "..." link to the 'remotes' view
#   $rdata  - hash reference with the optional keys 'fetch' and 'push'
#             (URLs) and the key 'heads' (array reference passed on to
#             git_heads_body())
#   $limit  - optional; when defined and smaller than the number of heads,
#             a "..." link is handed to git_heads_body() as extra row
#   $head   - passed to git_heads_body() to mark the current head
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# $push may be undefined here; check before comparing so that a
		# fetch-only remote does not trigger an "uninitialized" warning
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	# link to the full list when not all heads are going to be shown
	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
6130
# Display a list of remote names with the respective fetch and push URLs
#
# Parameters:
#   $remotedata - hash reference keyed by remote name; each value is a
#                 hash reference with the optional keys 'fetch' and 'push'
#   $limit      - optional maximum number of remotes to list; when it is
#                 true and smaller than the number of remotes, the list is
#                 truncated and a "..." row linking to the 'remotes' view
#                 is appended
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	# keep only the first $limit names
	$#remotes = $limit - 1 if $limited;

	# Iterate with foreach rather than "while (my $remote = shift ...)":
	# the latter stops at the first remote whose name is false in boolean
	# context (e.g. "0"), silently dropping it and all remotes after it.
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# URLs that are not configured are shown as plain text labels
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
6174
# Show remote heads, one section per remote.  When a limit is given and
# there are more remotes than that, fall back to the compact list of
# remote names produced by git_remotes_list().
#
# Parameters:
#   $remotedata - hash reference keyed by remote name
#   $limit      - optional limit, see above; also passed to
#                 git_remote_block()
#   $head       - passed through to git_remote_block()
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;

	# too many remotes: names only
	return git_remotes_list($remotedata, $limit)
		if ($limit && $limit < keys %$remotedata);

	fill_remote_heads($remotedata);
	while (my ($name, $info) = each %$remotedata) {
		# the section body is rendered lazily by git_print_section()
		my $print_block = sub {
			git_remote_block($name, $info, $limit, $head);
		};
		git_print_section({-class=>"remote", -id=>$name},
			["remotes", $name, $name], $print_block);
	}
}
6191
# Render one page of a commit message / author / committer search.
#
# Takes the commit searched from as a flattened hash (%co; 'tree' and
# 'title' are read here).  Reads the globals $searchtype, $searchtext,
# $search_use_regexp, $hash and $page.  Up to 101 commits are requested
# per page: 100 to display plus one to find out whether a "next" link is
# needed.
sub git_search_message {
	my %co = @_;

	# option prefix matching the kind of search
	my %grep_option_for = (
		'commit'    => "--grep=",
		'author'    => "--author=",
		'committer' => "--committer=",
	);
	my $greptype = $grep_option_for{$searchtype};
	$greptype .= $searchtext;

	my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
	my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
	                               $greptype, '--regexp-ignore-case',
	                               $match_mode);

	# "first" and "prev" are links only when not on the first page
	my $paging_nav;
	if ($page > 0) {
		my $first_link = $cgi->a({-href => href(-replay=>1, page=>undef)},
		                         "first");
		my $prev_link = $cgi->a({-href => href(-replay=>1, page=>$page-1),
		                         -accesskey => "p", -title => "Alt-p"}, "prev");
		$paging_nav = $first_link . " &sdot; " . $prev_link;
	} else {
		$paging_nav = "first &sdot; prev";
	}

	# "next" is a link only when the extra (101st) commit came back
	my $next_link = '';
	if (@commitlist > 100) {
		$next_link = $cgi->a({-href => href(-replay=>1, page=>$page+1),
		                      -accesskey => "n", -title => "Alt-n"}, "next");
		$paging_nav .= " &sdot; $next_link";
	} else {
		$paging_nav .= " &sdot; next";
	}

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);
	if (@commitlist || $page != 0) {
		git_search_grep_body(\@commitlist, 0, 99, $next_link);
	} else {
		print "<p>No match.</p>\n";
	}

	git_footer_html();
}
6241
# Render the result of a pickaxe search (git log -S<text>).
#
# Takes the commit searched from as a flattened hash (%co; 'tree' and
# 'title' are read for the page header).  Reads the globals $searchtext,
# $search_use_regexp, @diff_opts and $hash.  The output of git-log is read
# line by line: a line that parses to a commit starts a new table row, a
# line that parses to a changed file adds a link to the current row.
sub git_search_changes {
	my %co = @_;

	local $/ = "\n";
	my @git_log = (git_cmd(), '--no-pager', 'log', @diff_opts,
		'--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
		($search_use_regexp ? '--pickaxe-regex' : ()));
	open my $fd, '-|', @git_log
		or die_error(500, "Open git-log failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"pickaxe search\">\n";
	my $dark = 1;

	# from here on %co holds the commit whose row is currently open
	undef %co;

	# closes the row of the commit in %co: ends the file list cell and
	# adds the "commit | tree" link cell
	my $finish_commit_row = sub {
		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
		                          "commit");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
		                                       hash_base=>$co{'id'})},
		                        "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $commit_link . " | " . $tree_link .
		      "</td>\n" .
		      "</tr>\n";
	};

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line;

		my %set = parse_difftree_raw_line($line);
		if (defined $set{'commit'}) {
			# a new commit begins: finish the previous one, if any
			$finish_commit_row->() if %co;

			print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
			$dark = !$dark;

			%co = parse_commit($set{'commit'});
			my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
			my $subject_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
			                            -class => "list subject"},
			                           chop_and_escape_str($co{'title'}, 50) . "<br/>");
			print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
			      "<td><i>$author</i></td>\n" .
			      "<td>" .
			      $subject_link;
		} elsif (defined $set{'to_id'}) {
			# an all-zero id has no blob to link to
			next if ($set{'to_id'} =~ m/^0{40}$/);

			my $file_link = $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
			                                       hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
			                         -class => "list"},
			                        "<span class=\"match\">" . esc_path($set{'file'}) . "</span>");
			print $file_link . "<br/>\n";
		}
	}
	close $fd;

	# finish the last commit
	$finish_commit_row->() if %co;

	print "</table>\n";

	git_footer_html();
}
6324
# Render the result of a 'grep' search over the files of a tree.
#
# Takes the commit searched in as a flattened hash (%co; 'tree', 'id' and
# 'title' are read here).  Reads the globals $searchtext,
# $search_use_regexp, $search_regexp and $hash.  Runs "git grep -n -z" on
# $co{'tree'} and prints one table row per file, containing either a
# "Binary file" note or the matching lines with the match highlighted.
# Reading stops once more than 1000 output lines have been seen, in which
# case a "listing trimmed" note is printed.
sub git_search_files {
	my %co = @_;

	local $/ = "\n";
	open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
		$search_use_regexp ? ('-E', '-i') : '-F',
		$searchtext, $co{'tree'}
			or die_error(500, "Open git-grep failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"grep_search\">\n";
	my $alternate = 1;
	my $matches = 0;
	my $lastfile = '';
	my $file_href;
	while (my $line = <$fd>) {
		chomp $line;
		my ($file, $lno, $ltext, $binary);
		last if ($matches++ > 1000);
		if ($line =~ /^Binary file (.+) matches$/) {
			$file = $1;
			$binary = 1;
		} else {
			# with -z the fields are separated by NUL
			($file, $lno, $ltext) = split(/\0/, $line, 3);
		}
		# Remove the "<tree>:" prefix from the file name.  This is done
		# for binary matches too (it used to be skipped for them, so
		# their links carried the prefix), and the tree id is quoted so
		# it is matched literally.
		$file =~ s/^\Q$co{'tree'}\E://;
		if ($file ne $lastfile) {
			$lastfile and print "</td></tr>\n";
			# Alternate row classes like the other tables do; the
			# former "$alternate++" test was always true, so every
			# row came out "dark".
			if ($alternate) {
				print "<tr class=\"dark\">\n";
			} else {
				print "<tr class=\"light\">\n";
			}
			$alternate ^= 1;
			$file_href = href(action=>"blob", hash_base=>$co{'id'},
			                  file_name=>$file);
			print "<td class=\"list\">".
				$cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
			print "</td><td>\n";
			$lastfile = $file;
		}
		if ($binary) {
			print "<div class=\"binary\">Binary file</div>\n";
		} else {
			$ltext = untabify($ltext);
			# highlight the match; the greedy leading (.*) picks the
			# last occurrence on the line
			if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
				$ltext = esc_html($1, -nbsp=>1);
				$ltext .= '<span class="match">';
				$ltext .= esc_html($2, -nbsp=>1);
				$ltext .= '</span>';
				$ltext .= esc_html($3, -nbsp=>1);
			} else {
				$ltext = esc_html($ltext, -nbsp=>1);
			}
			# the line number links to the line anchor in the blob view
			print "<div class=\"pre\">" .
				$cgi->a({-href => $file_href.'#l'.$lno,
				        -class => "linenr"}, sprintf('%4i', $lno)) .
				' ' .  $ltext . "</div>\n";
		}
	}
	if ($lastfile) {
		print "</td></tr>\n";
		if ($matches > 1000) {
			print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
		}
	} else {
		print "<div class=\"diff nodifferences\">No matches found</div>\n";
	}
	close $fd;

	print "</table>\n";

	git_footer_html();
}
6402
# Print the result table of a commit message / author / committer search:
# one row per commit with age, author, subject, the message lines that
# match the global $search_regexp, and action links.
#
# Parameters:
#   $commitlist - reference to an array of commit hashes
#   $from, $to  - inclusive index range; $from defaults to 0, $to is
#                 clamped to the last index of $commitlist
#   $extra      - optional HTML; when defined it is printed in a final row
#                 spanning three columns
sub git_search_grep_body {
	my ($commitlist, $from, $to, $extra) = @_;

	$from = 0 if !defined $from;
	my $last_idx = $#{$commitlist};
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"commit_search\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		my $author_cell = format_author_html('td', \%co, 15, 5);
		my $subject_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
		                            -class => "list subject"},
		                           chop_and_escape_str($co{'title'}, 50) . "<br/>");
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell .
		      "<td>" .
		      $subject_link;

		# show every message line containing a match, trimmed so that
		# the match and some context on both sides stay visible
		my $comment = $co{'comment'};
		foreach my $line (@$comment) {
			next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
			my ($lead, $match, $trail) = ($1, $2, $3);

			$match = chop_str($match, 70, 5, 'center');
			# context shrinks as the match grows, capped at 30
			my $contextlen = int((80 - length($match))/2);
			$contextlen = 30 if ($contextlen > 30);
			$lead  = chop_str($lead,  $contextlen, 10, 'left');
			$trail = chop_str($trail, $contextlen, 10, 'right');

			$lead  = esc_html($lead);
			$match = esc_html($match);
			$trail = esc_html($trail);

			print "$lead<span class=\"match\">$match</span>$trail<br />";
		}

		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit");
		my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff");
		my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $commit_link . " | " . $diff_link . " | " . $tree_link;
		print "</td>\n";
		print "</tr>\n";
	}

	if (defined $extra) {
		print "<tr>\n";
		print "<td colspan=\"3\">$extra</td>\n";
		print "</tr>\n";
	}
	print "</table>\n";
}
6462
6463## ======================================================================
6464## ======================================================================
6465## actions
6466
# 'project_list' action: print the page listing the projects.
#
# Reads the 'order' input parameter and the globals $project_filter,
# $strict_export, $home_text, $searchtext and $search_use_regexp.
# Fails with 400 on an unknown 'order' value and with 404 when
# git_get_projects_list() returns nothing.
sub git_project_list {
	my $order = $input_params{'order'};
	# Match the whole value: the former unanchored pattern accepted any
	# string that merely contained one of the known names.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project_filter, $strict_export);
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	# optional site-specific text above the list
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}

	git_project_search_form($searchtext, $search_use_regexp);
	git_project_list_body(\@list, $order);
	git_footer_html();
}
6489
# 'forks' action: print the page listing the forks of the current project.
#
# Reads the 'order' input parameter and the global $project.  The project
# name without a trailing ".git" is used as filter for
# git_get_projects_list().  Fails with 400 on an unknown 'order' value and
# with 404 when no forks are found.
sub git_forks {
	my $order = $input_params{'order'};
	# Match the whole value: the former unanchored pattern accepted any
	# string that merely contained one of the known names.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my $filter = $project;
	$filter =~ s/\.git$//;
	my @list = git_get_projects_list($filter);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	# the title is emitted as HTML, so the project name has to be escaped
	git_print_header_div('summary', esc_html("$project forks"));
	git_project_list_body(\@list, $order);
	git_footer_html();
}
6509
# 'project_index' action: print the project list as plain text, one
# "<path> <owner>" line per project, with both fields URL-quoted.
#
# Reads the globals $project_filter and $strict_export.  Fails with 404
# when git_get_projects_list() returns nothing.
sub git_project_index {
	my @projects = git_get_projects_list($project_filter, $strict_export);
	die_error(404, "No projects found") unless @projects;

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	foreach my $pr (@projects) {
		# look the owner up only when the list did not provide one
		$pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
			unless exists $pr->{'owner'};

		# work on copies, the project entry itself is left alone
		my @fields = ($pr->{'path'}, $pr->{'owner'});
		foreach my $field (@fields) {
			# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
			$field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
			$field =~ s/ /\+/g;
		}

		print "$fields[0] $fields[1]\n";
	}
}
6536
6537sub git_summary {
6538        my $descr = git_get_project_description($project) || "none";
6539        my %co = parse_commit("HEAD");
6540        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
6541        my $head = $co{'id'};
6542        my $remote_heads = gitweb_check_feature('remote_heads');
6543
6544        my $owner = git_get_project_owner($project);
6545
6546        my $refs = git_get_references();
6547        # These get_*_list functions return one more to allow us to see if
6548        # there are more ...
6549        my @taglist  = git_get_tags_list(16);
6550        my @headlist = git_get_heads_list(16);
6551        my %remotedata = $remote_heads ? git_get_remotes_list() : ();
6552        my @forklist;
6553        my $check_forks = gitweb_check_feature('forks');
6554
6555        if ($check_forks) {
6556                # find forks of a project
6557                my $filter = $project;
6558                $filter =~ s/\.git$//;
6559                @forklist = git_get_projects_list($filter);
6560                # filter out forks of forks
6561                @forklist = filter_forks_from_projects_list(\@forklist)
6562                        if (@forklist);
6563        }
6564
6565        git_header_html();
6566        git_print_page_nav('summary','', $head);
6567
6568        print "<div class=\"title\">&nbsp;</div>\n";
6569        print "<table class=\"projects_list\">\n" .
6570              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
6571        if ($owner and not $omit_owner) {
6572                print  "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
6573        }
6574        if (defined $cd{'rfc2822'}) {
6575                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
6576                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
6577        }
6578
6579        # use per project git URL list in $projectroot/$project/cloneurl
6580        # or make project git URL from git base URL and project name
6581        my $url_tag = "URL";
6582        my @url_list = git_get_project_url_list($project);
6583        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
6584        foreach my $git_url (@url_list) {
6585                next unless $git_url;
6586                print format_repo_url($url_tag, $git_url);
6587                $url_tag = "";
6588        }
6589
6590        # Tag cloud
6591        my $show_ctags = gitweb_check_feature('ctags');
6592        if ($show_ctags) {
6593                my $ctags = git_get_project_ctags($project);
6594                if (%$ctags) {
6595                        # without ability to add tags, don't show if there are none
6596                        my $cloud = git_populate_project_tagcloud($ctags);
6597                        print "<tr id=\"metadata_ctags\">" .
6598                              "<td>content tags</td>" .
6599                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
6600                              "</tr>\n";
6601                }
6602        }
6603
6604        print "</table>\n";
6605
6606        # If XSS prevention is on, we don't include README.html.
6607        # TODO: Allow a readme in some safe format.
6608        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
6609                print "<div class=\"title\">readme</div>\n" .
6610                      "<div class=\"readme\">\n";
6611                insert_file("$projectroot/$project/README.html");
6612                print "\n</div>\n"; # class="readme"
6613        }
6614
6615        # we need to request one more than 16 (0..15) to check if
6616        # those 16 are all
6617        my @commitlist = $head ? parse_commits($head, 17) : ();
6618        if (@commitlist) {
6619                git_print_header_div('shortlog');
6620                git_shortlog_body(\@commitlist, 0, 15, $refs,
6621                                  $#commitlist <=  15 ? undef :
6622                                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
6623        }
6624
6625        if (@taglist) {
6626                git_print_header_div('tags');
6627                git_tags_body(\@taglist, 0, 15,
6628                              $#taglist <=  15 ? undef :
6629                              $cgi->a({-href => href(action=>"tags")}, "..."));
6630        }
6631
6632        if (@headlist) {
6633                git_print_header_div('heads');
6634                git_heads_body(\@headlist, $head, 0, 15,
6635                               $#headlist <= 15 ? undef :
6636                               $cgi->a({-href => href(action=>"heads")}, "..."));
6637        }
6638
6639        if (%remotedata) {
6640                git_print_header_div('remotes');
6641                git_remotes_body(\%remotedata, 15, $head);
6642        }
6643
6644        if (@forklist) {
6645                git_print_header_div('forks');
6646                git_project_list_body(\@forklist, 'age', 0, 15,
6647                                      $#forklist <= 15 ? undef :
6648                                      $cgi->a({-href => href(action=>"forks")}, "..."),
6649                                      'no_header');
6650        }
6651
6652        git_footer_html();
6653}
6654
# Show one tag object, identified by the global $hash: a header table that
# links to the tagged object, authorship rows when the tag records an
# author, and the tag message.  Reports a 404 through die_error() when
# parse_tag() yields nothing.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('', '', $head, undef, $head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # the object id and the object type both link to the tagged object
        my $object_href = href(action => $tag{'type'}, hash => $tag{'object'});
        my $id_link     = $cgi->a({-class => "list", -href => $object_href},
                                  $tag{'object'});
        my $type_link   = $cgi->a({-href => $object_href}, $tag{'type'});

        my $header_rows =
                qq{<div class="title_text">\n} .
                qq{<table class="object_header">\n} .
                qq{<tr>\n} .
                qq{<td>object</td>\n} .
                qq{<td>} . $id_link . qq{</td>\n} .
                qq{<td class="link">} . $type_link . qq{</td>\n} .
                qq{</tr>\n};
        print $header_rows;

        git_print_authorship_rows(\%tag, 'author')
                if defined $tag{'author'};

        print qq{</table>\n\n} .
              qq{</div>\n} .
              qq{<div class="page_body">};

        # tag message, one escaped line per <br/>
        my $message_lines = $tag{'comment'};
        for my $text (@$message_lines) {
                chomp $text;
                print esc_html($text, -nbsp => 1) . "<br/>\n";
        }
        print qq{</div>\n};

        git_footer_html();
}
6689
# Common implementation behind the blame actions.
#
# The optional first argument selects the output format (default
# 'porcelain'):
#   'porcelain'   - HTML table built from "git blame -p" output
#   'incremental' - HTML table holding only the file contents (read with
#                   "git cat-file blob"), with empty commit cells; the page
#                   announces that it requires JavaScript
#   'data'        - "git blame --incremental" output sent as text/plain and
#                   terminated by an "END" line
# A 'porcelain' request becomes 'incremental' when the 'javascript' input
# parameter is set.
#
# Works on the globals $file_name, $hash_base and $hash; the latter two are
# filled in here when they were not given.  Errors are reported through
# die_error().
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $input_params{'javascript'}) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact string comparison (a pattern match would accept any
                # type that merely contains "blob"); an undefined type is
                # rejected as well
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }
        binmode $fd, ':utf8';

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # terminating line, optionally followed by the elapsed time
                # and the number of git commands run
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        # row classes alternate between groups of lines
        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit cell and line-number link are left empty here
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        # a line that is not a header cannot be attributed
                        # to any commit, so skip it instead of working with
                        # undefined values
                        next LINE unless defined $full_rev;
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        # read "<key> <value>" info lines up to the
                        # tab-prefixed line holding the file contents
                        my $data;
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # only the first line of a group carries a group size
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell spanning the whole group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent
                        # commit when one is known, else of this commit
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6922
# Blame view in the default format of git_blame_common().
sub git_blame {
        return git_blame_common();
}
6926
# Blame view in the 'incremental' format of git_blame_common().
sub git_blame_incremental {
        my $format = 'incremental';
        return git_blame_common($format);
}
6930
# Blame output in the 'data' format of git_blame_common().
sub git_blame_data {
        my $format = 'data';
        return git_blame_common($format);
}
6934
# Page listing all tags of the current project; the tags table is left out
# when git_get_tags_list() returns nothing.
sub git_tags {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                           format_ref_views('tags'));
        git_print_header_div('summary', $project);

        my @all_tags = git_get_tags_list();
        git_tags_body(\@all_tags) if @all_tags;

        git_footer_html();
}
6947
# Page listing all heads of the current project; the heads table is left
# out when git_get_heads_list() returns nothing.
sub git_heads {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                           format_ref_views('heads'));
        git_print_header_div('summary', $project);

        my @all_heads = git_get_heads_list();
        git_heads_body(\@all_heads, $head_hash) if @all_heads;

        git_footer_html();
}
6960
# Remote heads view.  Serves both the page for one remote (its name arrives
# in the 'hash' input parameter) and the list of all the remotes.
# Requires the 'remote_heads' feature; failures go through die_error().
sub git_remotes {
        unless (gitweb_check_feature('remote_heads')) {
                die_error(403, "Remote heads view is disabled");
        }

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};
        my $single_remote = defined $remote;

        my $remotedata = git_get_remotes_list($remote);
        defined $remotedata
                or die_error(500, "Unable to get remote information");

        if (!%$remotedata) {
                my $message = $single_remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $message);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        my $ref_view = $remote ? '' : 'remotes';
        git_print_page_nav('', '', $head, undef, $head,
                           format_ref_views($ref_view));

        fill_remote_heads($remotedata);
        if ($single_remote) {
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }
        else {
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        }

        git_footer_html();
}
6993
# Send a blob in raw form.
#
# The optional first argument is handed to blob_contenttype() together with
# the open pipe and $file_name; its result becomes the Content-Type.
# The blob is the global $hash; when that is not set it is looked up from
# $file_name in $hash_base (or the project's head).  Blobs addressed by a
# full 40-hex-digit id get an expiry of one day.
# Errors are reported through die_error().
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain; the same goes for textual "<x>+xml"
        # types such as image/svg+xml or application/xhtml+xml (the subtype
        # in front of "+xml" may be of any length and may contain digits,
        # dots and dashes)
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z0-9.-]+\+xml\b(.*)$! && -T $fd))) {
                # $1 holds whatever followed the type, e.g. "; charset=..."
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and pass it through without any encoding layer
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7055
# HTML view of a blob.
#
# The blob is the global $hash; when that is not set it is looked up from
# $file_name in $hash_base (or the project's head).  Content that is neither
# text/* nor a gif/png/jpeg image, and that tests as binary, is handed over
# to git_blob_plain().  Images are shown through an <img> tag pointing at
# the blob_plain view; everything else is printed line by line with line
# number anchors, run through the highlighter when that feature is enabled.
# Errors are reported through die_error().
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        # $file_name is not defined when the blob was requested by hash only
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat " .
                                  (defined $file_name ? "$file_name, " : '') .
                                  $hash);
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax);

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: empty navigation bar, blob id as title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img class="blob" type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                print qq! src="! .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        } else {
                my $nr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # each line is anchored as "l<number>" and links to itself
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
                               $highlight ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
7147
# HTML view of a tree (directory listing).
#
# Uses the globals $hash_base (default "HEAD"), $hash and $file_name; when
# $hash is not given it is looked up from $file_name in $hash_base, or is
# $hash_base itself.  The entries come from "git ls-tree -z" (with "-l"
# when the 'show-sizes' feature is on).  A ".." row pointing at the parent
# directory is added when a base commit and a non-empty path are known.
# Errors are reported through die_error().
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # ls-tree -z terminates its records with NUL
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD"),
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # base is not a parsable commit: forget it and show the bare
                # tree id as the title
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        # rows alternate between the "dark" and "light" classes
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                # strip the last path component; an empty result means the
                # parent is the top tree.  Compare against '' rather than
                # testing truth, so that a parent directory named "0" is kept.
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
7257
# Turn a string into something usable as part of a file name: every slash
# becomes a dash, then every character that is not alphanumeric, '_', '.'
# or '-' is dropped.  Returns the cleaned-up copy.
sub sanitize_for_filename {
    my ($name) = @_;

    $name =~ tr{/}{-};
    $name =~ s/[^[:alnum:]_.-]+//g;

    return $name;
}
7266
# Build the name of a snapshot, "<project>-<version>".
#
# Arguments: the project path and the hash (object id or ref name) the
# snapshot is made of.  The project part is the sanitized base name of the
# path with a trailing ".git" or "/.git" removed.  The version part is
#   - for a hexadecimal id: the id itself, replaced by its short form when
#     it is longer than 7 characters and is a prefix of the full hash
#   - for refs/tags/<name>: <name>
#   - otherwise: the ref name (with a recognised "refs/<dir>/" stripped)
#     followed by "-" and the short hash
# In list context the name is returned twice, in scalar context once.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s,([^/])/*\.git$,$1,;
        $name = sanitize_for_filename(basename($name));

        my $ver = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                my $full_hash = git_get_full_hash($project, $hash);
                # leave $ver alone when no full hash was obtained
                if (defined $full_hash &&
                    $full_hash =~ /^$hash/ && length($hash) > 7) {
                        $ver = git_get_short_hash($project, $hash);
                }
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $ver = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                my $strip_refs = join '|', map { quotemeta } get_branch_refs();
                if ($hash =~ m!^refs/($strip_refs|remotes)/(.*)$!) {
                        my $ref_dir = (defined $1) ? $1 : '';
                        $ver = $2;

                        $ref_dir = sanitize_for_filename($ref_dir);
                        # for refs neither in heads nor remotes we want to
                        # add a ref dir to archive name
                        if ($ref_dir ne '' and $ref_dir ne 'heads' and $ref_dir ne 'remotes') {
                                $ver = $ref_dir . '-' . $ver;
                        }
                }
                $ver .= '-' . git_get_short_hash($project, $hash);
        }
        # special case of sanitization for filename - we change
        # slashes to dots instead of dashes
        # in case of hierarchical branch names
        $ver =~ s!/!.!g;
        $ver =~ s/[^[:alnum:]_.-]//g;

        # name = project-version_string
        $name = "$name-$ver";

        return wantarray ? ($name, $name) : $name;
}
7313
# Conditional GET support.  When the request has an If-Modified-Since
# header that can be parsed and $latest_epoch is not later than it,
# print a "304 Not Modified" header and jump to DONE_GITWEB; otherwise
# return to the caller without printing anything.
#
# The header is parsed with HTTP::Date when that module can be loaded,
# else with Time::ParseDate; if neither loads, the header is ignored.
sub exit_if_unmodified_since {
        my ($latest_epoch) = @_;
        our $cgi;

        my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
        return unless defined $if_modified;

        my $since;
        if (eval { require HTTP::Date; 1; }) {
                $since = HTTP::Date::str2time($if_modified);
        } elsif (eval { require Time::ParseDate; 1; }) {
                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
        }
        return unless (defined $since && $latest_epoch <= $since);

        # client copy is still current
        my %latest_date = parse_date($latest_epoch);
        print $cgi->header(
                -last_modified => $latest_date{'rfc2822'},
                -status => '304 Not Modified');
        goto DONE_GITWEB;
}
7335
# Action handler for 'snapshot': send an archive of the tree-ish $hash
# produced by "git archive", optionally piped through a compressor.
#
# The archive format comes from the 'snapshot_format' input parameter,
# defaulting to the first entry of @snapshot_fmts.  Error responses:
#   403 - snapshots disabled, or format disabled / not offered
#   400 - malformed or unknown format, or $hash names a blob
#   404 - $hash does not name an existing object
#   500 - git-archive could not be started
# If $hash can be parsed as a commit, its committer date is used for
# Last-Modified and for If-Modified-Since handling.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # "^{}" peels tags, so an annotated tag is judged by what it points to
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";

        my %co = parse_commit($hash);
        exit_if_unmodified_since($co{'committer_epoch'}) if %co;

        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # escape for use inside the quoted-string of Content-Disposition
        $filename =~ s/(["\\])/\\$1/g;
        my %latest_date;
        if (%co) {
                %latest_date = parse_date($co{'committer_epoch'}, $co{'committer_tz'});
        }

        # Start git-archive before any header is sent, so that a failure
        # to start it can still be reported as a proper error response
        # instead of being appended to an already announced "200 OK".
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                %co ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # copy in fixed-size chunks; the archive may be far too large to
        # hold in memory at once
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7393
# Common implementation behind the log-like views.
#
#   $fmt_name   name of the view; passed to the paging and page
#               navigation helpers
#   $body_subr  code reference that prints the list of commits
#   $base       revision to list from; defaults to the project's HEAD
#   $parent     when defined, the listing covers "$parent..$base"
#   $file_name  when defined, limits the listing to that path (with
#               --full-history)
#   $file_hash  object id of the path; looked up in the listed commits
#               when only $file_name is given
#
# Up to 101 commits are requested per page of 100, the extra one
# signalling that a next page exists.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0     unless defined $page;
        my $refs = git_get_references();

        my $commit_hash = defined $parent ? "$parent..$base" : $base;
        my @path_limit  = defined $file_name ? ($file_name, "--full-history") : ();
        my @commitlist  =
                parse_commits($commit_hash, 101, (100 * $page), @path_limit);

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # the file may have been deleted by some of the commits and
                # so be missing from their trees, but one of them must have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        $ftype = git_get_type($file_hash) if defined $file_hash;
        die_error(500, "Unknown type of object")
                if (defined $file_name && !defined $ftype);

        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }

        my $has_more   = $#commitlist >= 100;
        my $paging_nav = format_paging_nav($fmt_name, $page, $has_more);
        my $next_link  = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        # offer "patches" only for whole-history views small enough for
        # the configured limit (a negative limit means unlimited)
        my $patch_max = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name &&
            ($patch_max < 0 || @commitlist <= $patch_max)) {
                $paging_nav .= " &sdot; " .
                        $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                "patches");
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
                git_print_page_path($file_name, $ftype, $hash_base);
        } else {
                git_print_header_div('summary', $project);
        }

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
7467
# Action handler for 'log': delegates to git_log_generic() with
# git_log_body as the renderer, $hash as the base revision and
# $hash_parent as the optional lower bound.
sub git_log {
        my @range = ($hash, $hash_parent);
        return git_log_generic('log', \&git_log_body, @range);
}
7472
# Action handler for 'commit': show one commit -- a header table
# (authorship, commit / tree / parent ids with navigation links), the
# log message and the list of changed files.
#
# Works on the global $hash, falling back to $hash_base and then
# "HEAD".  Answers 404 when the commit cannot be parsed or reading
# git-diff-tree fails, 500 when git-diff-tree cannot be started.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $first_parent = $co{'parent'};
        my $all_parents  = $co{'parents'}; # listref

        # $formats_nav has to be prepared before any parameter munging
        my $formats_nav;
        if (!defined $first_parent) {
                # parentless (root) commit
                $formats_nav .= '(initial)';
        } elsif (@$all_parents == 1) {
                # ordinary commit with a single parent
                my $parent_link =
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$first_parent)},
                                esc_html(substr($first_parent, 0, 7)));
                $formats_nav .= '(parent: ' . $parent_link . ')';
        } else {
                # merge commit: one abbreviated link per parent
                my @parent_links = map {
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$_)},
                                esc_html(substr($_, 0, 7)));
                } @$all_parents;
                $formats_nav .= '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$all_parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # diff against the only parent, against nothing ('--root') for a
        # parentless commit, or as a combined diff ('-c') for a merge
        my $diff_base = defined $first_parent ? $first_parent : "--root";
        $diff_base = '-c' if @$all_parents > 1;

        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts, $diff_base, $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        chomp(my @difftree = <$fd>);
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title_html = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title_html, $hash);
        } else {
                git_print_header_div('tree', $title_html, $co{'tree'}, $hash);
        }

        # header table: authorship, commit id, tree, parents
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

        my $tree_id_link =
                $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                         class => "list"}, $co{'tree'});
        my $tree_view_link =
                $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                        "tree");
        print "<tr>" .
              "<td>tree</td>" .
              "<td class=\"sha1\">" . $tree_id_link . "</td>" .
              "<td class=\"link\">" . $tree_view_link;
        my $snapshot_links = format_snapshot_links($hash);
        if (defined $snapshot_links) {
                print " | " . $snapshot_links;
        }
        print "</td>" .
              "</tr>\n";

        foreach my $par (@$all_parents) {
                my $par_id_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$par),
                                 class => "list"}, $par);
                my $par_commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit");
                my $par_diff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
                print "<tr>" .
                      "<td>parent</td>" .
                      "<td class=\"sha1\">" . $par_id_link . "</td>" .
                      "<td class=\"link\">" . $par_commit_link . " | " . $par_diff_link . "</td>" .
                      "</tr>\n";
        }
        print "</table>".
              "</div>\n";

        # log message
        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        # changed files
        git_difftree_body(\@difftree, $hash, @$all_parents);

        git_footer_html();
}
7586
# Action handler for 'object': work out the type of the requested
# object and redirect (302) to the view named after that type.
#
# The object is identified either by
#   - $hash or $hash_base alone, or
#   - $hash_base together with $file_name.
# Answers 404 when the object (or the path inside the base) does not
# exist and 400 when neither form of identification is available.
sub git_object {
        my $type;

        if ($hash || ($hash_base && !defined $file_name)) {
                # identified by hash or hash_base alone
                my $object_id = $hash || $hash_base;

                my $cat_file_cmd = quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null';
                open my $fd, "-|", $cat_file_cmd
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");

        } elsif ($hash_base && defined $file_name) {
                # identified by hash_base and file_name
                $file_name =~ s,/+$,,;

                my $base_status = system(git_cmd(), "cat-file", '-e', $hash_base);
                $base_status == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                ($type, $hash) = ($2, $3);

        } else {
                die_error(400, "Not enough information to find object");
        }

        my $target = href(action=>$type, -full=>1,
                          hash=>$hash, hash_base=>$hash_base,
                          file_name=>$file_name);
        print $cgi->redirect(-uri => $target,
                             -status => '302 Found');
}
7633
# Action handler for the blob diff views: show the difference between
# two versions of a single file.
#
# The optional first argument selects the output format: 'html' (the
# default) or 'plain'; any other value is answered with a 400 error.
#
# The diff is identified by the globals $hash_parent_base and $hash_base
# (the two sides compared) plus either $file_name (optionally with
# $file_parent) or $hash (the 40-hex blob id on the "to" side).  A
# request that does not supply both bases is answered with a 404 error.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status code, like every other die_error() call here
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # file names may contain '"' or '\', which have to be escaped
                # inside the quoted-string of Content-Disposition
                my $patch_name = "$file_name.patch";
                $patch_name =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # rewrite "a/<id>" and "b/<id>" into file names in the lines up
                # to and including the "+++" one, then copy the rest verbatim
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7768
# Plain-text variant of the blob diff view: git_blobdiff() with the
# 'plain' output format.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
7772
# Build the navigation fragment for switching between diff styles.
#
# The fragment is meant to be appended to navigation that already
# exists, so every entry is preceded by a separator: the result looks
# like " | foo | bar", not "foo | bar".  The style currently in effect
# ($diff_style, default 'inline') is shown as plain text, the other one
# as a link.  Returns an empty string when $is_combined is true.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # display order and label of each known style
        my @style_order = ('inline', 'sidebyside');
        my %label_of = (
                inline       => 'inline',
                'sidebyside' => 'side by side',
        );

        my $nav = '';
        foreach my $style (@style_order) {
                my $entry;
                if ($style eq $diff_style) {
                        $entry = $label_of{$style};
                } else {
                        $entry = $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                         $label_of{$style});
                }
                $nav .= " | ".$entry;
        }
        return $nav;
}
7793
# Show the changes introduced by commit $hash (falling back to
# $hash_base, then "HEAD"), optionally relative to $hash_parent.
# Called directly and via git_commitdiff_plain(), git_patch() and
# git_patches().
#
# Named parameters:
#   -format => 'html' (default), 'plain' or 'patch'; anything else is
#              answered with a 400 error
#   -single => with -format => 'patch' and no $hash_parent, limit the
#              output to one patch ('-1')
#
# 'html' and 'plain' read from git-diff-tree, 'patch' from
# git-format-patch.  The 'patch' format answers 403 unless the
# 'patches' feature yields a true value.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                # second argument is true for merges, for which
                # diff_style_nav() returns an empty string
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if $hash_parent is one of them
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        # offer a link to the other of the two combined
                        # diff flavours ('--cc' and '-c')
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                # consume only the raw part here; the patch part is left
                # on $fd and handed to git_patchset_body() further down
                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                # NOTE(review): for a merge with no explicit parent,
                # $hash_parent was set to '--cc' above, so this branch is
                # taken and builds "--cc..$hash" -- confirm this is intended
                if ($hash_parent) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                # the title is already shown in the header div, so the log
                # is printed only if there is more than one comment line
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # NOTE(review): $refs is not used anywhere in this branch
                my $refs = git_get_references("tags");
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                # mail-like preamble in front of the diff
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit parent commit (or with '-c' / '--cc')
                # the diff is shown against all parents of the commit
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # headers are already out, so a failure can only be
                # reported as a trailing line of text
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
8021
# Action handler: commitdiff as plain text.
# Delegates to git_commitdiff() with -format => 'plain', which prints
# mail-like From/Date/Subject headers, the commit message and then the
# raw diff output.
sub git_commitdiff_plain {
        return git_commitdiff(
                -format => 'plain',
        );
}
8025
8026# format-patch-style patches
# Action handler: format-patch output via git_commitdiff() in 'patch' format.
# NOTE(review): -single => 1 presumably limits the output to one commit;
# confirm against the option handling in git_commitdiff().
sub git_patch {
        return git_commitdiff(
                -format => 'patch',
                -single => 1,
        );
}
8030
# Action handler: format-patch output via git_commitdiff() in 'patch' format,
# without the -single restriction that git_patch() passes.
sub git_patches {
        return git_commitdiff(
                -format => 'patch',
        );
}
8034
# Action handler: 'history' view.
# Hands the generic log renderer the 'history' format name, the body
# callback git_history_body() and the request globals describing the
# base commit, its parent base, the file name and the object hash.
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
}
8040
# Action handler: 'search'.
#
# Works on the request globals: $searchtype (defaults to 'commit'),
# $searchtext, $hash (defaults to the project's HEAD) and $page
# (defaults to 0).  After checking that the requested kind of search is
# enabled, it dispatches to the matching git_search_* routine, passing
# the parsed commit as a flattened hash.
#
# Errors (reported through die_error):
#   403 - search, pickaxe or grep feature is disabled
#   400 - no search text given, or unknown search type
#   404 - the starting commit cannot be parsed
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');

        # pickaxe may take all resources of your box and run for several minutes
        # with every query - so decide by yourself how public you make this feature
        if ($searchtype eq 'pickaxe' && !gitweb_check_feature('pickaxe')) {
                die_error(403, "Pickaxe search is disabled");
        }

        # grep search might be potentially CPU-intensive, too
        if ($searchtype eq 'grep' && !gitweb_check_feature('grep')) {
                die_error(403, "Grep search is disabled");
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => routine that renders the results
        my %search_handler_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );

        if (my $search_handler = $search_handler_for{$searchtype}) {
                $search_handler->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
8085
# Action handler: prints the search help page.
#
# The page is a definition list describing each search type.  The
# 'commit', 'author' and 'committer' entries are always printed; the
# 'grep' and 'pickaxe' entries appear only when the respective feature
# is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # introduction + 'commit' search
        print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="https://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        # 'grep' search, only when enabled
        if (gitweb_check_feature('grep')) {
                print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        # 'author' and 'committer' searches
        print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        # 'pickaxe' search, only when enabled
        if (gitweb_check_feature('pickaxe')) {
                print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
8129
# Action handler: 'shortlog' view.
# Hands the generic log renderer the 'shortlog' format name, the body
# callback git_shortlog_body() and the request globals $hash and
# $hash_parent.
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
8134
8135## ......................................................................
8136## feeds (RSS, Atom; OPML)
8137
# Generate a web feed (RSS 2.0 or Atom) for the current project.
#
# Parameters:
#   $format - 'rss' or 'atom'; defaults to 'atom' when omitted or false.
#             Any other value is rejected with die_error(400, ...).
#
# Works on the request globals: the feed covers $hash (or HEAD when it
# is not set), optionally limited to the history of $file_name.  Up to
# 150 commits are read; the first 20 are always emitted, later ones only
# while they were authored within the last 48 hours.
#
# Prints the HTTP header followed by the XML document to STDOUT.  For a
# HEAD request only the header is printed.  Each entry carries the commit
# message and a list of changed files with links to the diff, blame (if
# the feature is enabled) and history views.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                # NOTE(review): presumably answers conditional requests
                # (If-Modified-Since) and does not return when the feed is
                # unchanged -- confirm in exit_if_unmodified_since()
                exit_if_unmodified_since($latest_epoch);
                %latest_date = parse_date($latest_epoch, $latest_commit{'committer_tz'});
        }
        print $cgi->header(
                -type => $content_type,
                -charset => 'utf-8',
                %latest_date ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        $title = esc_html($title);

        my $descr = git_get_project_description($project);
        if (!defined $descr) {
                # no description available: fall back to a generic one
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        # escape in both cases: the fallback contains the project path,
        # which may hold characters that are special in XML
        $descr = esc_html($descr);

        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        foreach my $i (0 .. $#commitlist) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files; a commit whose diff-tree cannot
                # be run or fails is left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }

                # commit message; print the escaped text without assigning
                # to $line, which aliases the commit's own comment array
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        print esc_html($line) . "\n";
                }
                print "</pre><ul>\n";

                # changed files with links to related views
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
8375
# Action handler: feed in RSS format; see git_feed().
sub git_rss {
        return git_feed('rss');
}
8379
# Action handler: feed in Atom format; see git_feed().
sub git_atom {
        return git_feed('atom');
}
8383
# Action handler: OPML export of the project list.
#
# Prints an OPML 1.0 document with one <outline> per project, pointing
# at the project's RSS feed (xmlUrl) and summary page (htmlUrl).
# Projects whose HEAD cannot be resolved or whose head commit cannot be
# parsed are left out.  Reports 404 through die_error when the project
# list is empty.
#
# Side effect: sets the global $git_dir for every project it inspects.
sub git_opml {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found")
                unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # mention the subdirectory in the title only when a filter is in effect
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $proj (@projects) {
                my $proj_path = $proj->{'path'};

                my $head = git_get_head_hash($proj_path);
                next unless defined $head;

                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next unless %co;

                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print qq{<outline type="rss" text="$path" title="$path" xmlUrl="$rss" htmlUrl="$html"/>\n};
        }

        print "</outline>\n" .
              "</body>\n" .
              "</opml>\n";
}