gitweb / gitweb.perlon commit Merge branch 'jk/pack-objects-optim-mru' (e6e24c9)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
  23if (!defined($CGI::VERSION) || $CGI::VERSION < 4.08) {
  24        eval 'sub CGI::multi_param { CGI::param(@_) }'
  25}
  26
  27our $t0 = [ gettimeofday() ];
  28our $number_of_git_cmds = 0;
  29
  30BEGIN {
  31        CGI->compile() if $ENV{'MOD_PERL'};
  32}
  33
  34our $version = "++GIT_VERSION++";
  35
  36our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  37sub evaluate_uri {
  38        our $cgi;
  39
  40        our $my_url = $cgi->url();
  41        our $my_uri = $cgi->url(-absolute => 1);
  42
  43        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  44        # needed and used only for URLs with nonempty PATH_INFO
  45        our $base_url = $my_url;
  46
  47        # When the script is used as DirectoryIndex, the URL does not contain the name
  48        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  49        # have to do it ourselves. We make $path_info global because it's also used
  50        # later on.
  51        #
  52        # Another issue with the script being the DirectoryIndex is that the resulting
  53        # $my_url data is not the full script URL: this is good, because we want
  54        # generated links to keep implying the script name if it wasn't explicitly
  55        # indicated in the URL we're handling, but it means that $my_url cannot be used
  56        # as base URL.
  57        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  58        # to build the base URL ourselves:
  59        our $path_info = decode_utf8($ENV{"PATH_INFO"});
  60        if ($path_info) {
  61                # $path_info has already been URL-decoded by the web server, but
  62                # $my_url and $my_uri have not. URL-decode them so we can properly
  63                # strip $path_info.
  64                $my_url = unescape($my_url);
  65                $my_uri = unescape($my_uri);
  66                if ($my_url =~ s,\Q$path_info\E$,, &&
  67                    $my_uri =~ s,\Q$path_info\E$,, &&
  68                    defined $ENV{'SCRIPT_NAME'}) {
  69                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  70                }
  71        }
  72
  73        # target of the home link on top of all pages
  74        our $home_link = $my_uri || "/";
  75}
  76
  77# core git executable to use
  78# this can just be "git" if your webserver has a sensible PATH
  79our $GIT = "++GIT_BINDIR++/git";
  80
  81# absolute fs-path which will be prepended to the project path
  82#our $projectroot = "/pub/scm";
  83our $projectroot = "++GITWEB_PROJECTROOT++";
  84
  85# fs traversing limit for getting project list
  86# the number is relative to the projectroot
  87our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  88
  89# string of the home link on top of all pages
  90our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  91
  92# extra breadcrumbs preceding the home link
  93our @extra_breadcrumbs = ();
  94
  95# name of your site or organization to appear in page titles
  96# replace this with something more descriptive for clearer bookmarks
  97our $site_name = "++GITWEB_SITENAME++"
  98                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  99
 100# html snippet to include in the <head> section of each page
 101our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
 102# filename of html text to include at top of each page
 103our $site_header = "++GITWEB_SITE_HEADER++";
 104# html text to include at home page
 105our $home_text = "++GITWEB_HOMETEXT++";
 106# filename of html text to include at bottom of each page
 107our $site_footer = "++GITWEB_SITE_FOOTER++";
 108
 109# URI of stylesheets
 110our @stylesheets = ("++GITWEB_CSS++");
 111# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 112our $stylesheet = undef;
 113# URI of GIT logo (72x27 size)
 114our $logo = "++GITWEB_LOGO++";
 115# URI of GIT favicon, assumed to be image/png type
 116our $favicon = "++GITWEB_FAVICON++";
 117# URI of gitweb.js (JavaScript code for gitweb)
 118our $javascript = "++GITWEB_JS++";
 119
 120# URI and label (title) of GIT logo link
 121#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 122#our $logo_label = "git documentation";
 123our $logo_url = "http://git-scm.com/";
 124our $logo_label = "git homepage";
 125
 126# source of projects list
 127our $projects_list = "++GITWEB_LIST++";
 128
 129# the width (in characters) of the projects list "Description" column
 130our $projects_list_description_width = 25;
 131
 132# group projects by category on the projects list
 133# (enabled if this variable evaluates to true)
 134our $projects_list_group_categories = 0;
 135
 136# default category if none specified
 137# (leave the empty string for no category)
 138our $project_list_default_category = "";
 139
 140# default order of projects list
 141# valid values are none, project, descr, owner, and age
 142our $default_projects_order = "project";
 143
 144# show repository only if this file exists
 145# (only effective if this variable evaluates to true)
 146our $export_ok = "++GITWEB_EXPORT_OK++";
 147
 148# don't generate age column on the projects list page
 149our $omit_age_column = 0;
 150
 151# don't generate information about owners of repositories
 152our $omit_owner=0;
 153
 154# show repository only if this subroutine returns true
 155# when given the path to the project, for example:
 156#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 157our $export_auth_hook = undef;
 158
 159# only allow viewing of repositories also shown on the overview page
 160our $strict_export = "++GITWEB_STRICT_EXPORT++";
 161
 162# list of git base URLs used for URL to where fetch project from,
 163# i.e. full URL is "$git_base_url/$project"
 164our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 165
 166# default blob_plain mimetype and default charset for text/plain blob
 167our $default_blob_plain_mimetype = 'text/plain';
 168our $default_text_plain_charset  = undef;
 169
 170# file to use for guessing MIME types before trying /etc/mime.types
 171# (relative to the current git repository)
 172our $mimetypes_file = undef;
 173
 174# assume this charset if line contains non-UTF-8 characters;
 175# it should be valid encoding (see Encoding::Supported(3pm) for list),
 176# for which encoding all byte sequences are valid, for example
 177# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 178# could be even 'utf-8' for the old behavior)
 179our $fallback_encoding = 'latin1';
 180
 181# rename detection options for git-diff and git-diff-tree
 182# - default is '-M', with the cost proportional to
 183#   (number of removed files) * (number of new files).
 184# - more costly is '-C' (which implies '-M'), with the cost proportional to
 185#   (number of changed files + number of removed files) * (number of new files)
 186# - even more costly is '-C', '--find-copies-harder' with cost
 187#   (number of files in the original tree) * (number of new files)
 188# - one might want to include '-B' option, e.g. '-B', '-M'
 189our @diff_opts = ('-M'); # taken from git_commit
 190
 191# Disables features that would allow repository owners to inject script into
 192# the gitweb domain.
 193our $prevent_xss = 0;
 194
 195# Path to the highlight executable to use (must be the one from
 196# http://www.andre-simon.de due to assumptions about parameters and output).
 197# Useful if highlight is not installed on your webserver's PATH.
 198# [Default: highlight]
 199our $highlight_bin = "++HIGHLIGHT_BIN++";
 200
 201# information about snapshot formats that gitweb is capable of serving
 202our %known_snapshot_formats = (
 203        # name => {
 204        #       'display' => display name,
 205        #       'type' => mime type,
 206        #       'suffix' => filename suffix,
 207        #       'format' => --format for git-archive,
 208        #       'compressor' => [compressor command and arguments]
 209        #                       (array reference, optional)
 210        #       'disabled' => boolean (optional)}
 211        #
 212        'tgz' => {
 213                'display' => 'tar.gz',
 214                'type' => 'application/x-gzip',
 215                'suffix' => '.tar.gz',
 216                'format' => 'tar',
 217                'compressor' => ['gzip', '-n']},
 218
 219        'tbz2' => {
 220                'display' => 'tar.bz2',
 221                'type' => 'application/x-bzip2',
 222                'suffix' => '.tar.bz2',
 223                'format' => 'tar',
 224                'compressor' => ['bzip2']},
 225
 226        'txz' => {
 227                'display' => 'tar.xz',
 228                'type' => 'application/x-xz',
 229                'suffix' => '.tar.xz',
 230                'format' => 'tar',
 231                'compressor' => ['xz'],
 232                'disabled' => 1},
 233
 234        'zip' => {
 235                'display' => 'zip',
 236                'type' => 'application/x-zip',
 237                'suffix' => '.zip',
 238                'format' => 'zip'},
 239);
 240
 241# Aliases so we understand old gitweb.snapshot values in repository
 242# configuration.
 243our %known_snapshot_format_aliases = (
 244        'gzip'  => 'tgz',
 245        'bzip2' => 'tbz2',
 246        'xz'    => 'txz',
 247
 248        # backward compatibility: legacy gitweb config support
 249        'x-gzip' => undef, 'gz' => undef,
 250        'x-bzip2' => undef, 'bz2' => undef,
 251        'x-zip' => undef, '' => undef,
 252);
 253
 254# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 255# are changed, it may be appropriate to change these values too via
 256# $GITWEB_CONFIG.
 257our %avatar_size = (
 258        'default' => 16,
 259        'double'  => 32
 260);
 261
 262# Used to set the maximum load that we will still respond to gitweb queries.
 263# If server load exceed this value then return "503 server busy" error.
 264# If gitweb cannot determined server load, it is taken to be 0.
 265# Leave it undefined (or set to 'undef') to turn off load checking.
 266our $maxload = 300;
 267
 268# configuration for 'highlight' (http://www.andre-simon.de/)
 269# match by basename
 270our %highlight_basename = (
 271        #'Program' => 'py',
 272        #'Library' => 'py',
 273        'SConstruct' => 'py', # SCons equivalent of Makefile
 274        'Makefile' => 'make',
 275);
 276# match by extension
 277our %highlight_ext = (
 278        # main extensions, defining name of syntax;
 279        # see files in /usr/share/highlight/langDefs/ directory
 280        (map { $_ => $_ } qw(py rb java css js tex bib xml awk bat ini spec tcl sql)),
 281        # alternate extensions, see /etc/highlight/filetypes.conf
 282        (map { $_ => 'c'   } qw(c h)),
 283        (map { $_ => 'sh'  } qw(sh bash zsh ksh)),
 284        (map { $_ => 'cpp' } qw(cpp cxx c++ cc)),
 285        (map { $_ => 'php' } qw(php php3 php4 php5 phps)),
 286        (map { $_ => 'pl'  } qw(pl perl pm)), # perhaps also 'cgi'
 287        (map { $_ => 'make'} qw(make mak mk)),
 288        (map { $_ => 'xml' } qw(xml xhtml html htm)),
 289);
 290
 291# You define site-wide feature defaults here; override them with
 292# $GITWEB_CONFIG as necessary.
 293our %feature = (
 294        # feature => {
 295        #       'sub' => feature-sub (subroutine),
 296        #       'override' => allow-override (boolean),
 297        #       'default' => [ default options...] (array reference)}
 298        #
 299        # if feature is overridable (it means that allow-override has true value),
 300        # then feature-sub will be called with default options as parameters;
 301        # return value of feature-sub indicates if to enable specified feature
 302        #
 303        # if there is no 'sub' key (no feature-sub), then feature cannot be
 304        # overridden
 305        #
 306        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 307        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 308        # is enabled
 309
 310        # Enable the 'blame' blob view, showing the last commit that modified
 311        # each line in the file. This can be very CPU-intensive.
 312
 313        # To enable system wide have in $GITWEB_CONFIG
 314        # $feature{'blame'}{'default'} = [1];
 315        # To have project specific config enable override in $GITWEB_CONFIG
 316        # $feature{'blame'}{'override'} = 1;
 317        # and in project config gitweb.blame = 0|1;
 318        'blame' => {
 319                'sub' => sub { feature_bool('blame', @_) },
 320                'override' => 0,
 321                'default' => [0]},
 322
 323        # Enable the 'snapshot' link, providing a compressed archive of any
 324        # tree. This can potentially generate high traffic if you have large
 325        # project.
 326
 327        # Value is a list of formats defined in %known_snapshot_formats that
 328        # you wish to offer.
 329        # To disable system wide have in $GITWEB_CONFIG
 330        # $feature{'snapshot'}{'default'} = [];
 331        # To have project specific config enable override in $GITWEB_CONFIG
 332        # $feature{'snapshot'}{'override'} = 1;
 333        # and in project config, a comma-separated list of formats or "none"
 334        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 335        'snapshot' => {
 336                'sub' => \&feature_snapshot,
 337                'override' => 0,
 338                'default' => ['tgz']},
 339
 340        # Enable text search, which will list the commits which match author,
 341        # committer or commit text to a given string.  Enabled by default.
 342        # Project specific override is not supported.
 343        #
 344        # Note that this controls all search features, which means that if
 345        # it is disabled, then 'grep' and 'pickaxe' search would also be
 346        # disabled.
 347        'search' => {
 348                'override' => 0,
 349                'default' => [1]},
 350
 351        # Enable grep search, which will list the files in currently selected
 352        # tree containing the given string. Enabled by default. This can be
 353        # potentially CPU-intensive, of course.
 354        # Note that you need to have 'search' feature enabled too.
 355
 356        # To enable system wide have in $GITWEB_CONFIG
 357        # $feature{'grep'}{'default'} = [1];
 358        # To have project specific config enable override in $GITWEB_CONFIG
 359        # $feature{'grep'}{'override'} = 1;
 360        # and in project config gitweb.grep = 0|1;
 361        'grep' => {
 362                'sub' => sub { feature_bool('grep', @_) },
 363                'override' => 0,
 364                'default' => [1]},
 365
 366        # Enable the pickaxe search, which will list the commits that modified
 367        # a given string in a file. This can be practical and quite faster
 368        # alternative to 'blame', but still potentially CPU-intensive.
 369        # Note that you need to have 'search' feature enabled too.
 370
 371        # To enable system wide have in $GITWEB_CONFIG
 372        # $feature{'pickaxe'}{'default'} = [1];
 373        # To have project specific config enable override in $GITWEB_CONFIG
 374        # $feature{'pickaxe'}{'override'} = 1;
 375        # and in project config gitweb.pickaxe = 0|1;
 376        'pickaxe' => {
 377                'sub' => sub { feature_bool('pickaxe', @_) },
 378                'override' => 0,
 379                'default' => [1]},
 380
 381        # Enable showing size of blobs in a 'tree' view, in a separate
 382        # column, similar to what 'ls -l' does.  This cost a bit of IO.
 383
 384        # To disable system wide have in $GITWEB_CONFIG
 385        # $feature{'show-sizes'}{'default'} = [0];
 386        # To have project specific config enable override in $GITWEB_CONFIG
 387        # $feature{'show-sizes'}{'override'} = 1;
 388        # and in project config gitweb.showsizes = 0|1;
 389        'show-sizes' => {
 390                'sub' => sub { feature_bool('showsizes', @_) },
 391                'override' => 0,
 392                'default' => [1]},
 393
 394        # Make gitweb use an alternative format of the URLs which can be
 395        # more readable and natural-looking: project name is embedded
 396        # directly in the path and the query string contains other
 397        # auxiliary information. All gitweb installations recognize
 398        # URL in either format; this configures in which formats gitweb
 399        # generates links.
 400
 401        # To enable system wide have in $GITWEB_CONFIG
 402        # $feature{'pathinfo'}{'default'} = [1];
 403        # Project specific override is not supported.
 404
 405        # Note that you will need to change the default location of CSS,
 406        # favicon, logo and possibly other files to an absolute URL. Also,
 407        # if gitweb.cgi serves as your indexfile, you will need to force
 408        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 409        'pathinfo' => {
 410                'override' => 0,
 411                'default' => [0]},
 412
 413        # Make gitweb consider projects in project root subdirectories
 414        # to be forks of existing projects. Given project $projname.git,
 415        # projects matching $projname/*.git will not be shown in the main
 416        # projects list, instead a '+' mark will be added to $projname
 417        # there and a 'forks' view will be enabled for the project, listing
 418        # all the forks. If project list is taken from a file, forks have
 419        # to be listed after the main project.
 420
 421        # To enable system wide have in $GITWEB_CONFIG
 422        # $feature{'forks'}{'default'} = [1];
 423        # Project specific override is not supported.
 424        'forks' => {
 425                'override' => 0,
 426                'default' => [0]},
 427
 428        # Insert custom links to the action bar of all project pages.
 429        # This enables you mainly to link to third-party scripts integrating
 430        # into gitweb; e.g. git-browser for graphical history representation
 431        # or custom web-based repository administration interface.
 432
 433        # The 'default' value consists of a list of triplets in the form
 434        # (label, link, position) where position is the label after which
 435        # to insert the link and link is a format string where %n expands
 436        # to the project name, %f to the project path within the filesystem,
 437        # %h to the current hash (h gitweb parameter) and %b to the current
 438        # hash base (hb gitweb parameter); %% expands to %.
 439
 440        # To enable system wide have in $GITWEB_CONFIG e.g.
 441        # $feature{'actions'}{'default'} = [('graphiclog',
 442        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 443        # Project specific override is not supported.
 444        'actions' => {
 445                'override' => 0,
 446                'default' => []},
 447
 448        # Allow gitweb scan project content tags of project repository,
 449        # and display the popular Web 2.0-ish "tag cloud" near the projects
 450        # list.  Note that this is something COMPLETELY different from the
 451        # normal Git tags.
 452
 453        # gitweb by itself can show existing tags, but it does not handle
 454        # tagging itself; you need to do it externally, outside gitweb.
 455        # The format is described in git_get_project_ctags() subroutine.
 456        # You may want to install the HTML::TagCloud Perl module to get
 457        # a pretty tag cloud instead of just a list of tags.
 458
 459        # To enable system wide have in $GITWEB_CONFIG
 460        # $feature{'ctags'}{'default'} = [1];
 461        # Project specific override is not supported.
 462
 463        # In the future whether ctags editing is enabled might depend
 464        # on the value, but using 1 should always mean no editing of ctags.
 465        'ctags' => {
 466                'override' => 0,
 467                'default' => [0]},
 468
 469        # The maximum number of patches in a patchset generated in patch
 470        # view. Set this to 0 or undef to disable patch view, or to a
 471        # negative number to remove any limit.
 472
 473        # To disable system wide have in $GITWEB_CONFIG
 474        # $feature{'patches'}{'default'} = [0];
 475        # To have project specific config enable override in $GITWEB_CONFIG
 476        # $feature{'patches'}{'override'} = 1;
 477        # and in project config gitweb.patches = 0|n;
 478        # where n is the maximum number of patches allowed in a patchset.
 479        'patches' => {
 480                'sub' => \&feature_patches,
 481                'override' => 0,
 482                'default' => [16]},
 483
 484        # Avatar support. When this feature is enabled, views such as
 485        # shortlog or commit will display an avatar associated with
 486        # the email of the committer(s) and/or author(s).
 487
 488        # Currently available providers are gravatar and picon.
 489        # If an unknown provider is specified, the feature is disabled.
 490
 491        # Gravatar depends on Digest::MD5.
 492        # Picon currently relies on the indiana.edu database.
 493
 494        # To enable system wide have in $GITWEB_CONFIG
 495        # $feature{'avatar'}{'default'} = ['<provider>'];
 496        # where <provider> is either gravatar or picon.
 497        # To have project specific config enable override in $GITWEB_CONFIG
 498        # $feature{'avatar'}{'override'} = 1;
 499        # and in project config gitweb.avatar = <provider>;
 500        'avatar' => {
 501                'sub' => \&feature_avatar,
 502                'override' => 0,
 503                'default' => ['']},
 504
 505        # Enable displaying how much time and how many git commands
 506        # it took to generate and display page.  Disabled by default.
 507        # Project specific override is not supported.
 508        'timed' => {
 509                'override' => 0,
 510                'default' => [0]},
 511
 512        # Enable turning some links into links to actions which require
 513        # JavaScript to run (like 'blame_incremental').  Not enabled by
 514        # default.  Project specific override is currently not supported.
 515        'javascript-actions' => {
 516                'override' => 0,
 517                'default' => [0]},
 518
 519        # Enable and configure ability to change common timezone for dates
 520        # in gitweb output via JavaScript.  Enabled by default.
 521        # Project specific override is not supported.
 522        'javascript-timezone' => {
 523                'override' => 0,
 524                'default' => [
 525                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 526                                     # or undef to turn off this feature
 527                        'gitweb_tz', # name of cookie where to store selected timezone
 528                        'datetime',  # CSS class used to mark up dates for manipulation
 529                ]},
 530
 531        # Syntax highlighting support. This is based on Daniel Svensson's
 532        # and Sham Chukoury's work in gitweb-xmms2.git.
 533        # It requires the 'highlight' program present in $PATH,
 534        # and therefore is disabled by default.
 535
 536        # To enable system wide have in $GITWEB_CONFIG
 537        # $feature{'highlight'}{'default'} = [1];
 538
 539        'highlight' => {
 540                'sub' => sub { feature_bool('highlight', @_) },
 541                'override' => 0,
 542                'default' => [0]},
 543
 544        # Enable displaying of remote heads in the heads list
 545
 546        # To enable system wide have in $GITWEB_CONFIG
 547        # $feature{'remote_heads'}{'default'} = [1];
 548        # To have project specific config enable override in $GITWEB_CONFIG
 549        # $feature{'remote_heads'}{'override'} = 1;
 550        # and in project config gitweb.remoteheads = 0|1;
 551        'remote_heads' => {
 552                'sub' => sub { feature_bool('remote_heads', @_) },
 553                'override' => 0,
 554                'default' => [0]},
 555
 556        # Enable showing branches under other refs in addition to heads
 557
 558        # To set system wide extra branch refs have in $GITWEB_CONFIG
 559        # $feature{'extra-branch-refs'}{'default'} = ['dirs', 'of', 'choice'];
 560        # To have project specific config enable override in $GITWEB_CONFIG
 561        # $feature{'extra-branch-refs'}{'override'} = 1;
 562        # and in project config gitweb.extrabranchrefs = dirs of choice
 563        # Every directory is separated with whitespace.
 564
 565        'extra-branch-refs' => {
 566                'sub' => \&feature_extra_branch_refs,
 567                'override' => 0,
 568                'default' => []},
 569);
 570
 571sub gitweb_get_feature {
 572        my ($name) = @_;
 573        return unless exists $feature{$name};
 574        my ($sub, $override, @defaults) = (
 575                $feature{$name}{'sub'},
 576                $feature{$name}{'override'},
 577                @{$feature{$name}{'default'}});
 578        # project specific override is possible only if we have project
 579        our $git_dir; # global variable, declared later
 580        if (!$override || !defined $git_dir) {
 581                return @defaults;
 582        }
 583        if (!defined $sub) {
 584                warn "feature $name is not overridable";
 585                return @defaults;
 586        }
 587        return $sub->(@defaults);
 588}
 589
 590# A wrapper to check if a given feature is enabled.
 591# With this, you can say
 592#
 593#   my $bool_feat = gitweb_check_feature('bool_feat');
 594#   gitweb_check_feature('bool_feat') or somecode;
 595#
 596# instead of
 597#
 598#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 599#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 600#
 601sub gitweb_check_feature {
 602        return (gitweb_get_feature(@_))[0];
 603}
 604
 605
 606sub feature_bool {
 607        my $key = shift;
 608        my ($val) = git_get_project_config($key, '--bool');
 609
 610        if (!defined $val) {
 611                return ($_[0]);
 612        } elsif ($val eq 'true') {
 613                return (1);
 614        } elsif ($val eq 'false') {
 615                return (0);
 616        }
 617}
 618
 619sub feature_snapshot {
 620        my (@fmts) = @_;
 621
 622        my ($val) = git_get_project_config('snapshot');
 623
 624        if ($val) {
 625                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 626        }
 627
 628        return @fmts;
 629}
 630
 631sub feature_patches {
 632        my @val = (git_get_project_config('patches', '--int'));
 633
 634        if (@val) {
 635                return @val;
 636        }
 637
 638        return ($_[0]);
 639}
 640
 641sub feature_avatar {
 642        my @val = (git_get_project_config('avatar'));
 643
 644        return @val ? @val : @_;
 645}
 646
 647sub feature_extra_branch_refs {
 648        my (@branch_refs) = @_;
 649        my $values = git_get_project_config('extrabranchrefs');
 650
 651        if ($values) {
 652                $values = config_to_multi ($values);
 653                @branch_refs = ();
 654                foreach my $value (@{$values}) {
 655                        push @branch_refs, split /\s+/, $value;
 656                }
 657        }
 658
 659        return @branch_refs;
 660}
 661
 662# checking HEAD file with -e is fragile if the repository was
 663# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 664# and then pruned.
 665sub check_head_link {
 666        my ($dir) = @_;
 667        my $headfile = "$dir/HEAD";
 668        return ((-e $headfile) ||
 669                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 670}
 671
 672sub check_export_ok {
 673        my ($dir) = @_;
 674        return (check_head_link($dir) &&
 675                (!$export_ok || -e "$dir/$export_ok") &&
 676                (!$export_auth_hook || $export_auth_hook->($dir)));
 677}
 678
 679# process alternate names for backward compatibility
 680# filter out unsupported (unknown) snapshot formats
 681sub filter_snapshot_fmts {
 682        my @fmts = @_;
 683
 684        @fmts = map {
 685                exists $known_snapshot_format_aliases{$_} ?
 686                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 687        @fmts = grep {
 688                exists $known_snapshot_formats{$_} &&
 689                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 690}
 691
 692sub filter_and_validate_refs {
 693        my @refs = @_;
 694        my %unique_refs = ();
 695
 696        foreach my $ref (@refs) {
 697                die_error(500, "Invalid ref '$ref' in 'extra-branch-refs' feature") unless (is_valid_ref_format($ref));
 698                # 'heads' are added implicitly in get_branch_refs().
 699                $unique_refs{$ref} = 1 if ($ref ne 'heads');
 700        }
 701        return sort keys %unique_refs;
 702}
 703
 704# If it is set to code reference, it is code that it is to be run once per
 705# request, allowing updating configurations that change with each request,
 706# while running other code in config file only once.
 707#
 708# Otherwise, if it is false then gitweb would process config file only once;
 709# if it is true then gitweb config would be run for each request.
 710our $per_request_config = 1;
 711
 712# read and parse gitweb config file given by its parameter.
 713# returns true on success, false on recoverable error, allowing
 714# to chain this subroutine, using first file that exists.
 715# dies on errors during parsing config file, as it is unrecoverable.
 716sub read_config_file {
 717        my $filename = shift;
 718        return unless defined $filename;
 719        # die if there are errors parsing config file
 720        if (-e $filename) {
 721                do $filename;
 722                die $@ if $@;
 723                return 1;
 724        }
 725        return;
 726}
 727
 728our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
 729sub evaluate_gitweb_config {
 730        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 731        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 732        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
 733
 734        # Protect against duplications of file names, to not read config twice.
 735        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
 736        # there possibility of duplication of filename there doesn't matter.
 737        $GITWEB_CONFIG = ""        if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
 738        $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
 739
 740        # Common system-wide settings for convenience.
 741        # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
 742        read_config_file($GITWEB_CONFIG_COMMON);
 743
 744        # Use first config file that exists.  This means use the per-instance
 745        # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
 746        read_config_file($GITWEB_CONFIG) and return;
 747        read_config_file($GITWEB_CONFIG_SYSTEM);
 748}
 749
 750# Get loadavg of system, to compare against $maxload.
 751# Currently it requires '/proc/loadavg' present to get loadavg;
 752# if it is not present it returns 0, which means no load checking.
 753sub get_loadavg {
 754        if( -e '/proc/loadavg' ){
 755                open my $fd, '<', '/proc/loadavg'
 756                        or return 0;
 757                my @load = split(/\s+/, scalar <$fd>);
 758                close $fd;
 759
 760                # The first three columns measure CPU and IO utilization of the last one,
 761                # five, and 10 minute periods.  The fourth column shows the number of
 762                # currently running processes and the total number of processes in the m/n
 763                # format.  The last column displays the last process ID used.
 764                return $load[0] || 0;
 765        }
 766        # additional checks for load average should go here for things that don't export
 767        # /proc/loadavg
 768
 769        return 0;
 770}
 771
 772# version of the core git binary
 773our $git_version;
 774sub evaluate_git_version {
 775        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 776        $number_of_git_cmds++;
 777}
 778
 779sub check_loadavg {
 780        if (defined $maxload && get_loadavg() > $maxload) {
 781                die_error(503, "The load average on the server is too high");
 782        }
 783}
 784
 785# ======================================================================
 786# input validation and dispatch
 787
 788# input parameters can be collected from a variety of sources (presently, CGI
 789# and PATH_INFO), so we define an %input_params hash that collects them all
 790# together during validation: this allows subsequent uses (e.g. href()) to be
 791# agnostic of the parameter origin
 792
 793our %input_params = ();
 794
 795# input parameters are stored with the long parameter name as key. This will
 796# also be used in the href subroutine to convert parameters to their CGI
 797# equivalent, and since the href() usage is the most frequent one, we store
 798# the name -> CGI key mapping here, instead of the reverse.
 799#
 800# XXX: Warning: If you touch this, check the search form for updating,
 801# too.
 802
 803our @cgi_param_mapping = (
 804        project => "p",
 805        action => "a",
 806        file_name => "f",
 807        file_parent => "fp",
 808        hash => "h",
 809        hash_parent => "hp",
 810        hash_base => "hb",
 811        hash_parent_base => "hpb",
 812        page => "pg",
 813        order => "o",
 814        searchtext => "s",
 815        searchtype => "st",
 816        snapshot_format => "sf",
 817        extra_options => "opt",
 818        search_use_regexp => "sr",
 819        ctag => "by_tag",
 820        diff_style => "ds",
 821        project_filter => "pf",
 822        # this must be last entry (for manipulation from JavaScript)
 823        javascript => "js"
 824);
 825our %cgi_param_mapping = @cgi_param_mapping;
 826
 827# we will also need to know the possible actions, for validation
 828our %actions = (
 829        "blame" => \&git_blame,
 830        "blame_incremental" => \&git_blame_incremental,
 831        "blame_data" => \&git_blame_data,
 832        "blobdiff" => \&git_blobdiff,
 833        "blobdiff_plain" => \&git_blobdiff_plain,
 834        "blob" => \&git_blob,
 835        "blob_plain" => \&git_blob_plain,
 836        "commitdiff" => \&git_commitdiff,
 837        "commitdiff_plain" => \&git_commitdiff_plain,
 838        "commit" => \&git_commit,
 839        "forks" => \&git_forks,
 840        "heads" => \&git_heads,
 841        "history" => \&git_history,
 842        "log" => \&git_log,
 843        "patch" => \&git_patch,
 844        "patches" => \&git_patches,
 845        "remotes" => \&git_remotes,
 846        "rss" => \&git_rss,
 847        "atom" => \&git_atom,
 848        "search" => \&git_search,
 849        "search_help" => \&git_search_help,
 850        "shortlog" => \&git_shortlog,
 851        "summary" => \&git_summary,
 852        "tag" => \&git_tag,
 853        "tags" => \&git_tags,
 854        "tree" => \&git_tree,
 855        "snapshot" => \&git_snapshot,
 856        "object" => \&git_object,
 857        # those below don't need $project
 858        "opml" => \&git_opml,
 859        "project_list" => \&git_project_list,
 860        "project_index" => \&git_project_index,
 861);
 862
 863# finally, we have the hash of allowed extra_options for the commands that
 864# allow them
 865our %allowed_options = (
 866        "--no-merges" => [ qw(rss atom log shortlog history) ],
 867);
 868
 869# fill %input_params with the CGI parameters. All values except for 'opt'
 870# should be single values, but opt can be an array. We should probably
 871# build an array of parameters that can be multi-valued, but since for the time
 872# being it's only this one, we just single it out
 873sub evaluate_query_params {
 874        our $cgi;
 875
 876        while (my ($name, $symbol) = each %cgi_param_mapping) {
 877                if ($symbol eq 'opt') {
 878                        $input_params{$name} = [ map { decode_utf8($_) } $cgi->multi_param($symbol) ];
 879                } else {
 880                        $input_params{$name} = decode_utf8($cgi->param($symbol));
 881                }
 882        }
 883}
 884
 885# now read PATH_INFO and update the parameter list for missing parameters
 886sub evaluate_path_info {
 887        return if defined $input_params{'project'};
 888        return if !$path_info;
 889        $path_info =~ s,^/+,,;
 890        return if !$path_info;
 891
 892        # find which part of PATH_INFO is project
 893        my $project = $path_info;
 894        $project =~ s,/+$,,;
 895        while ($project && !check_head_link("$projectroot/$project")) {
 896                $project =~ s,/*[^/]*$,,;
 897        }
 898        return unless $project;
 899        $input_params{'project'} = $project;
 900
 901        # do not change any parameters if an action is given using the query string
 902        return if $input_params{'action'};
 903        $path_info =~ s,^\Q$project\E/*,,;
 904
 905        # next, check if we have an action
 906        my $action = $path_info;
 907        $action =~ s,/.*$,,;
 908        if (exists $actions{$action}) {
 909                $path_info =~ s,^$action/*,,;
 910                $input_params{'action'} = $action;
 911        }
 912
 913        # list of actions that want hash_base instead of hash, but can have no
 914        # pathname (f) parameter
 915        my @wants_base = (
 916                'tree',
 917                'history',
 918        );
 919
 920        # we want to catch, among others
 921        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 922        my ($parentrefname, $parentpathname, $refname, $pathname) =
 923                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 924
 925        # first, analyze the 'current' part
 926        if (defined $pathname) {
 927                # we got "branch:filename" or "branch:dir/"
 928                # we could use git_get_type(branch:pathname), but:
 929                # - it needs $git_dir
 930                # - it does a git() call
 931                # - the convention of terminating directories with a slash
 932                #   makes it superfluous
 933                # - embedding the action in the PATH_INFO would make it even
 934                #   more superfluous
 935                $pathname =~ s,^/+,,;
 936                if (!$pathname || substr($pathname, -1) eq "/") {
 937                        $input_params{'action'} ||= "tree";
 938                        $pathname =~ s,/$,,;
 939                } else {
 940                        # the default action depends on whether we had parent info
 941                        # or not
 942                        if ($parentrefname) {
 943                                $input_params{'action'} ||= "blobdiff_plain";
 944                        } else {
 945                                $input_params{'action'} ||= "blob_plain";
 946                        }
 947                }
 948                $input_params{'hash_base'} ||= $refname;
 949                $input_params{'file_name'} ||= $pathname;
 950        } elsif (defined $refname) {
 951                # we got "branch". In this case we have to choose if we have to
 952                # set hash or hash_base.
 953                #
 954                # Most of the actions without a pathname only want hash to be
 955                # set, except for the ones specified in @wants_base that want
 956                # hash_base instead. It should also be noted that hand-crafted
 957                # links having 'history' as an action and no pathname or hash
 958                # set will fail, but that happens regardless of PATH_INFO.
 959                if (defined $parentrefname) {
 960                        # if there is parent let the default be 'shortlog' action
 961                        # (for http://git.example.com/repo.git/A..B links); if there
 962                        # is no parent, dispatch will detect type of object and set
 963                        # action appropriately if required (if action is not set)
 964                        $input_params{'action'} ||= "shortlog";
 965                }
 966                if ($input_params{'action'} &&
 967                    grep { $_ eq $input_params{'action'} } @wants_base) {
 968                        $input_params{'hash_base'} ||= $refname;
 969                } else {
 970                        $input_params{'hash'} ||= $refname;
 971                }
 972        }
 973
 974        # next, handle the 'parent' part, if present
 975        if (defined $parentrefname) {
 976                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 977                # someproject/blobdiff/oldrev..newrev:/filename
 978                if ($parentpathname) {
 979                        $parentpathname =~ s,^/+,,;
 980                        $parentpathname =~ s,/$,,;
 981                        $input_params{'file_parent'} ||= $parentpathname;
 982                } else {
 983                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 984                }
 985                # we assume that hash_parent_base is wanted if a path was specified,
 986                # or if the action wants hash_base instead of hash
 987                if (defined $input_params{'file_parent'} ||
 988                        grep { $_ eq $input_params{'action'} } @wants_base) {
 989                        $input_params{'hash_parent_base'} ||= $parentrefname;
 990                } else {
 991                        $input_params{'hash_parent'} ||= $parentrefname;
 992                }
 993        }
 994
 995        # for the snapshot action, we allow URLs in the form
 996        # $project/snapshot/$hash.ext
 997        # where .ext determines the snapshot and gets removed from the
 998        # passed $refname to provide the $hash.
 999        #
1000        # To be able to tell that $refname includes the format extension, we
1001        # require the following two conditions to be satisfied:
1002        # - the hash input parameter MUST have been set from the $refname part
1003        #   of the URL (i.e. they must be equal)
1004        # - the snapshot format MUST NOT have been defined already (e.g. from
1005        #   CGI parameter sf)
1006        # It's also useless to try any matching unless $refname has a dot,
1007        # so we check for that too
1008        if (defined $input_params{'action'} &&
1009                $input_params{'action'} eq 'snapshot' &&
1010                defined $refname && index($refname, '.') != -1 &&
1011                $refname eq $input_params{'hash'} &&
1012                !defined $input_params{'snapshot_format'}) {
1013                # We loop over the known snapshot formats, checking for
1014                # extensions. Allowed extensions are both the defined suffix
1015                # (which includes the initial dot already) and the snapshot
1016                # format key itself, with a prepended dot
1017                while (my ($fmt, $opt) = each %known_snapshot_formats) {
1018                        my $hash = $refname;
1019                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
1020                                next;
1021                        }
1022                        my $sfx = $1;
1023                        # a valid suffix was found, so set the snapshot format
1024                        # and reset the hash parameter
1025                        $input_params{'snapshot_format'} = $fmt;
1026                        $input_params{'hash'} = $hash;
1027                        # we also set the format suffix to the one requested
1028                        # in the URL: this way a request for e.g. .tgz returns
1029                        # a .tgz instead of a .tar.gz
1030                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
1031                        last;
1032                }
1033        }
1034}
1035
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp, $project_filter);

# Copy the collected %input_params into the corresponding global variables,
# validating each of them on the way.  The first invalid parameter ends the
# request through die_error() with the status code and message given below.
# $search_regexp is derived from $searchtext: it is the search text itself
# when regexp search was requested (after checking that it compiles), and
# the quoted literal text otherwise.
sub evaluate_and_validate_params {
	our $action = $input_params{'action'};
	if (defined $action) {
		if (!is_valid_action($action)) {
			die_error(400, "Invalid action parameter");
		}
	}

	# parameters which are pathnames
	our $project = $input_params{'project'};
	if (defined $project) {
		if (!is_valid_project($project)) {
			undef $project;
			die_error(404, "No such project");
		}
	}

	our $project_filter = $input_params{'project_filter'};
	if (defined $project_filter) {
		if (!is_valid_pathname($project_filter)) {
			die_error(404, "Invalid project_filter parameter");
		}
	}

	our $file_name = $input_params{'file_name'};
	if (defined $file_name) {
		if (!is_valid_pathname($file_name)) {
			die_error(400, "Invalid file parameter");
		}
	}

	our $file_parent = $input_params{'file_parent'};
	if (defined $file_parent) {
		if (!is_valid_pathname($file_parent)) {
			die_error(400, "Invalid file parent parameter");
		}
	}

	# parameters which are refnames
	our $hash = $input_params{'hash'};
	if (defined $hash) {
		if (!is_valid_refname($hash)) {
			die_error(400, "Invalid hash parameter");
		}
	}

	our $hash_parent = $input_params{'hash_parent'};
	if (defined $hash_parent) {
		if (!is_valid_refname($hash_parent)) {
			die_error(400, "Invalid hash parent parameter");
		}
	}

	our $hash_base = $input_params{'hash_base'};
	if (defined $hash_base) {
		if (!is_valid_refname($hash_base)) {
			die_error(400, "Invalid hash base parameter");
		}
	}

	# extra_options can (currently) only be set from CGI, where it is
	# stored as an array reference; fall back to an empty list so that a
	# missing entry cannot abort the request with a dereference error
	our @extra_options = @{$input_params{'extra_options'} || []};
	foreach my $opt (@extra_options) {
		if (not exists $allowed_options{$opt}) {
			die_error(400, "Invalid option parameter");
		}
		# compare as plain strings: the action may be undefined here, and
		# it must not be interpreted as a regular expression
		if (not (defined $action &&
		         grep { $_ eq $action } @{$allowed_options{$opt}})) {
			die_error(400, "Invalid option parameter for this action");
		}
	}

	our $hash_parent_base = $input_params{'hash_parent_base'};
	if (defined $hash_parent_base) {
		if (!is_valid_refname($hash_parent_base)) {
			die_error(400, "Invalid hash parent base parameter");
		}
	}

	# other parameters
	our $page = $input_params{'page'};
	if (defined $page) {
		if ($page =~ m/[^0-9]/) {
			die_error(400, "Invalid page parameter");
		}
	}

	our $searchtype = $input_params{'searchtype'};
	if (defined $searchtype) {
		if ($searchtype =~ m/[^a-z]/) {
			die_error(400, "Invalid searchtype parameter");
		}
	}

	our $search_use_regexp = $input_params{'search_use_regexp'};

	our $searchtext = $input_params{'searchtext'};
	our $search_regexp = undef;
	if (defined $searchtext) {
		if (length($searchtext) < 2) {
			die_error(403, "At least two characters are required for search parameter");
		}
		if ($search_use_regexp) {
			$search_regexp = $searchtext;
			# make sure the user-supplied pattern compiles before using it
			if (!eval { qr/$search_regexp/; 1; }) {
				# strip the "at FILE line N" location from the message
				(my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
				die_error(400, "Invalid search regexp '$search_regexp'",
				          esc_html($error));
			}
		} else {
			$search_regexp = quotemeta $searchtext;
		}
	}
}
1154
# path to the current git repository
our $git_dir;

# Set $git_dir to the repository of the current project.
# NOTE(review): when $project is false, $git_dir is left untouched, so it
# keeps whatever value it had before this call.
sub evaluate_git_dir {
	our $git_dir;

	if ($project) {
		$git_dir = "$projectroot/$project";
	}
}
1160
our (@snapshot_fmts, $git_avatar, @extra_branch_refs);

# Evaluate the 'snapshot', 'avatar' and 'extra-branch-refs' features and
# store the filtered / validated results in the globals declared above.
sub configure_gitweb_features {
	our (@snapshot_fmts, $git_avatar, @extra_branch_refs);

	# list of supported snapshot formats
	@snapshot_fmts = gitweb_get_feature('snapshot');
	@snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

	# The avatar feature must name a known provider whose dependencies
	# are satisfied; otherwise $git_avatar is reset to the empty string.
	($git_avatar) = gitweb_get_feature('avatar');
	if ($git_avatar eq 'gravatar') {
		# gravatar needs Digest::MD5
		my $have_md5 = eval { require Digest::MD5; 1; };
		$git_avatar = '' unless $have_md5;
	} elsif ($git_avatar ne 'picon') {
		# picon has no dependencies; anything else is unknown
		$git_avatar = '';
	}

	@extra_branch_refs = gitweb_get_feature('extra-branch-refs');
	@extra_branch_refs = filter_and_validate_refs (@extra_branch_refs);
}
1183
# Return the ref namespaces that are treated as branches: 'heads', which is
# always included, followed by the configured extra branch refs.
sub get_branch_refs {
	my @extra = @extra_branch_refs;
	return ('heads', @extra);
}
1187
# custom error handler: 'die <message>' is Internal Server Error
sub handle_errors_html {
	my ($msg) = @_; # it is already HTML escaped

	# Switch back to a plain-text handler before doing anything else, so
	# that an error raised inside die_error itself cannot call this
	# handler again and loop forever.
	my $fallback = "Error occurred when inside die_error:\n$msg";
	set_message($fallback);

	# you cannot jump out of die_error when called as error handler;
	# the subroutine set via CGI::Carp::set_message is called _after_
	# HTTP headers are already written, so it cannot write them itself
	die_error(undef, undef, $msg, '-error_handler' => 1, '-no_http_header' => 1);
}
set_message(\&handle_errors_html);
1202
# Pick the action to run (guessing it from the other parameters when none
# was given), check that it is known and that a project is present when the
# action needs one, and call the subroutine implementing it.
sub dispatch {
	unless (defined $action) {
		if (defined $hash) {
			# the object type decides the action
			$action = git_get_type($hash)
				or die_error(404, "Object does not exist");
		} elsif (defined $hash_base && defined $file_name) {
			$action = git_get_type("$hash_base:$file_name")
				or die_error(404, "File or directory does not exist");
		} elsif (defined $project) {
			$action = 'summary';
		} else {
			$action = 'project_list';
		}
	}

	my $handler = $actions{$action};
	die_error(400, "Unknown action") unless defined($handler);

	# only these three actions can work without a project
	my $needs_project = ($action !~ m/^(?:opml|project_list|project_index)$/);
	if ($needs_project && !$project) {
		die_error(400, "Project needed");
	}

	$handler->();
}
1227
# Restart the per-request statistics: take a new start time (only if a
# start time is being kept at all) and reset the git command counter.
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	if (defined $t0) {
		$t0 = [ gettimeofday() ];
	}
	$number_of_git_cmds = 0;
}
1233
our $first_request = 1;

# Serve a single request: (re)load configuration as required, collect and
# validate the input parameters, set up the features and dispatch.
sub run_request {
	reset_timer();

	evaluate_uri();

	# config file and git version are always evaluated for the first
	# request
	if ($first_request) {
		evaluate_gitweb_config();
		evaluate_git_version();
	}

	# later requests: run the per-request code if there is any, otherwise
	# re-read the config file when $per_request_config is true
	if (ref($per_request_config) eq 'CODE') {
		$per_request_config->();
	} elsif ($per_request_config && !$first_request) {
		evaluate_gitweb_config();
	}

	check_loadavg();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list ||= $projectroot;

	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1264
# By default every request is the last one (plain CGI).
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: requests are created through CGI::Fast, and
# the process stops after it has served a fixed number of requests.
sub configure_as_fcgi {
	require CGI::Fast;
	our $CGI = 'CGI::Fast';

	my $request_number = 0;
	# let each child service 100 requests: this is called after each
	# request has been served, so it must turn true on the 100th call
	our $is_last_request = sub { ++$request_number >= 100 };
}
# Configure the run mode from the script name and the command line:
# a script name ending in '.fcgi' or the --fastcgi option selects FastCGI,
# and --nproc=N sets up the FCGI::ProcManager hooks, if that module is
# available.
sub evaluate_argv {
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return unless (@ARGV);

	# handler for --nproc: install the process manager hooks
	my $setup_proc_manager = sub {
		my ($arg, $val) = @_;
		# silently ignore the option if the module is not installed
		return unless eval { require FCGI::ProcManager; 1; };
		my $proc_manager = FCGI::ProcManager->new({
			n_processes => $val,
		});
		our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
		our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
		our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i'      => $setup_proc_manager,
	);
}
1299
# Main loop: configure the run mode, then create and serve requests until
# no more can be created or $is_last_request says to stop.  The optional
# hooks are called before listening and around each request.
sub run {
	evaluate_argv();

	$first_request = 1;
	if ($pre_listen_hook) {
		$pre_listen_hook->();
	}

 REQUEST:
	while ($cgi = $CGI->new()) {
		if ($pre_dispatch_hook) {
			$pre_dispatch_hook->();
		}

		run_request();

		if ($post_dispatch_hook) {
			$post_dispatch_hook->();
		}
		$first_request = 0;

		if ($is_last_request->()) {
			last REQUEST;
		}
	}

 DONE_GITWEB:
	1;
}
1324
run();

unless (defined caller) {
	# pure CGI script, serving single request
	exit;
}
# wrapped in a subroutine processing requests,
# e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
return;
1335
1336## ======================================================================
1337## action links
1338
# Build the URL of a gitweb view from named parameters.
#
# Parameters are given as name => value pairs, using the long parameter
# names of @cgi_param_mapping; an array reference as value produces one
# query parameter per element.  'project' defaults to the current $project.
# Returns the URL as a string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	# implicit -replay, must be first of implicit params
	$params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		# take every parameter that was not given explicitly from the
		# current request
		while (my ($name, $symbol) = each %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_path_info($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot;
		# links without any action are common, so do not compare
		# an undefined value
		my $is_snapshot = defined $params{'action'} &&
		                  $params{'action'} eq 'snapshot';

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_path_info($params{'action'})
				unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
			|| $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_path_info($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# a name containing '..' would be ambiguous in
						# PATH_INFO, so it stays a query parameter
						$href .= ":/".esc_path_info($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_path_info($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_path_info($params{'hash_base'});
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_path_info($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_path_info($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly; walking the list form of the
	# mapping keeps the parameters in a fixed order
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	# final transformation: trailing spaces must be escaped (URI-encoded)
	$href =~ s/(\s+)$/CGI::escape($1)/e;

	if ($params{-anchor}) {
		$href .= "#".esc_param($params{-anchor});
	}

	return $href;
}
1468
1469
1470## ======================================================================
1471## validation, quoting/unquoting and escaping
1472
# Tell whether $input names an action registered in %actions.
# Returns 1 if it does, undef otherwise.
sub is_valid_action {
        my ($input) = @_;
        my $known = exists $actions{$input};
        return $known ? 1 : undef;
}
1478
# Decide whether $input may be served as a project.  All of these must hold:
#  - it is a valid pathname (is_valid_pathname),
#  - "$projectroot/$input" is a directory,
#  - that directory passes check_export_ok(),
#  - when $strict_export is set, it is found by project_in_list().
# Returns 1 when acceptable, undef when not; an undefined $input gives
# a bare return.
sub is_valid_project {
        my ($input) = @_;

        return unless defined $input;

        my $dir = "$projectroot/$input";
        return undef unless is_valid_pathname($input);
        return undef unless -d $dir;
        return undef unless check_export_ok($dir);
        return undef if $strict_export && !project_in_list($input);

        return 1;
}
1492
# Validate a pathname.  Returns 1 if acceptable, undef otherwise
# (including for undefined input).
sub is_valid_pathname {
        my ($input) = @_;

        return undef unless defined $input;

        # reject empty, '.' and '..' path elements: at the beginning,
        # at the end, or between slashes (this also rejects '//')
        return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

        # reject embedded null characters
        return undef if $input =~ m!\0!;

        return 1;
}
1509
# Check $input against the ref name restrictions of git-check-ref-format.
# Returns 1 if none of the forbidden patterns occur, undef otherwise
# (including for undefined input).
sub is_valid_ref_format {
        my ($input) = @_;

        return undef unless defined $input;

        # forbidden: "/.", "..", control chars and space, DEL,
        # any of ~ ^ : ? * [, and a trailing slash
        return undef if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

        return 1;
}
1520
# Validate a ref name.  A 40-digit hexadecimal string is accepted as is;
# anything else has to pass both is_valid_pathname() and
# is_valid_ref_format().  Returns 1 if valid, undef otherwise.
sub is_valid_refname {
        my ($input) = @_;

        return undef unless defined $input;

        # textual hashes are O.K.
        return 1 if $input =~ m/^[0-9a-fA-F]{40}$/;

        return undef unless is_valid_pathname($input);
        return undef unless is_valid_ref_format($input);
        return 1;
}
1535
# Turn a string of utf-8 octets into Perl's internal character form.
# A string that already carries the utf8 flag is returned unchanged;
# otherwise it is decoded as utf-8, and if that fails it is decoded
# using $fallback_encoding instead.  Output ends up as utf-8 because
# of the "binmode STDOUT, ':utf8'" at the beginning of the script.
# Returns undef for undefined input.
sub to_utf8 {
        my ($str) = @_;
        return undef unless defined $str;

        return $str if utf8::is_utf8($str);
        # utf8::decode() converts $str in place and reports success
        return $str if utf8::decode($str);

        return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1549
# URI-escape a query parameter value.  The slash is deliberately left
# unquoted (not strictly correct, but quoted slashes look too horrible
# in bookmarks); spaces are written as '+'.
# Returns undef for undefined input.
sub esc_param {
        my ($value) = @_;
        return undef unless defined $value;

        $value =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $value =~ tr/ /+/;
        return $value;
}
1559
# URI-escape a string for use inside the path_info part of a URL.
# The rules differ slightly from esc_param(): '+' is not special in
# path_info (it does not mean space) and is kept, as is the space itself,
# while '?' must be escaped.
# Returns undef for undefined input.
sub esc_path_info {
        my ($fragment) = @_;
        return undef unless defined $fragment;

        $fragment =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
        return $fragment;
}
1570
# URI-escape unsafe characters in a complete URL.  Characters that have
# structural meaning in a URL (such as '/', '?', ':', '&', '=', ';')
# cannot be quoted here; spaces are written as '+'.
# Returns undef for undefined input.
sub esc_url {
        my ($url) = @_;
        return undef unless defined $url;

        $url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $url =~ tr/ /+/;
        return $url;
}
1579
# Quote unsafe characters for use in an HTML attribute value.
# For XHTML conformance escaping '"' to '&quot;' alone is not enough,
# so the full esc_html() treatment is applied to the arguments.
sub esc_attr {
        my @args = @_;
        return esc_html(@args);
}
1586
# Escape a string for inclusion in HTML.
# The string is passed through to_utf8(), then HTML-escaped with
# $cgi->escapeHTML().  With the option -nbsp => 1 every space becomes
# '&nbsp;'.  Finally each control character other than TAB is replaced
# by its quot_cec() representation.
# Returns undef for undefined input.
sub esc_html {
        my ($str, %opts) = @_;

        return undef unless defined $str;

        $str = $cgi->escapeHTML(to_utf8($str));
        $str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        # tabs are kept as they are, other control chars are made visible
        $str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
        return $str;
}
1602
# Escape a filename for inclusion in HTML.
# Works like esc_html() (to_utf8(), $cgi->escapeHTML(), optional
# -nbsp => 1), except that every control character -- TAB included --
# is replaced by its quot_cec() representation.
# Returns undef for undefined input.
sub esc_path {
        my ($path, %opts) = @_;

        return undef unless defined $path;

        $path = $cgi->escapeHTML(to_utf8($path));
        $path =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $path =~ s|([[:cntrl:]])|quot_cec($1)|eg;
        return $path;
}
1618
# Sanitize a string for use in XHTML served as XML (valid XML 1.0):
# after to_utf8(), every control character except TAB, LF and CR is
# replaced by its quot_cec() representation.  No HTML escaping is done.
# Returns undef for undefined input.
sub sanitize {
        my ($text) = @_;

        return undef unless defined $text;

        $text = to_utf8($text);
        $text =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
        return $text;
}
1629
# Make a control character "printable", using character escape codes (CEC).
#
# Parameters:
#   $cntrl - the single character to represent
#   %opts  - with -nohtml => 1 the bare escape text is returned,
#            otherwise it is wrapped in <span class="cntrl">...</span>
#
# Characters with a well-known escape (\t, \n, \r, \f, \b, \a, \e, \v, \0)
# use that escape; any other character is shown as a backslash followed
# by its code in hexadecimal, zero-padded to at least two digits.
sub quot_cec {
        my ($cntrl, %opts) = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );

        # '%02x' rather than '%2x': the latter pads with a space, which
        # would turn e.g. chr(1) into '\ 1' instead of '\01'
        my $chr = exists $es{$cntrl}
                ? $es{$cntrl}
                : sprintf('\%02x', ord($cntrl));

        return $chr if $opts{-nohtml};
        return "<span class=\"cntrl\">$chr</span>";
}
1654
# Alternative to quot_cec(): represent a control character by a decimal
# HTML character reference to the code point 0x2400 + its character code
# (the Unicode control pictures, a "printable representation", PR).
# With -nohtml => 1 the bare reference is returned, otherwise it is
# wrapped in <span class="cntrl">...</span>.
sub quot_upr {
        my ($cntrl, %opts) = @_;

        my $picture = sprintf('&#%04d;', 0x2400+ord($cntrl));
        return $picture if $opts{-nohtml};
        return "<span class=\"cntrl\">$picture</span>";
}
1668
# git may return quoted and escaped filenames.  A string enclosed in
# double quotes has the quotes removed and its backslash sequences
# expanded; any other string is returned unchanged.
sub unquote {
        my ($str) = @_;

        # expand what follows a single backslash: 1-3 octal digits, a C
        # escape letter, or any other (merely quoted) character
        sub unq {
                my ($seq) = @_;
                my %es = ( # character escape codes, aka escape sequences
                        't' => "\t",   # tab            (HT, TAB)
                        'n' => "\n",   # newline        (NL)
                        'r' => "\r",   # return         (CR)
                        'f' => "\f",   # form feed      (FF)
                        'b' => "\b",   # backspace      (BS)
                        'a' => "\a",   # alarm (bell)   (BEL)
                        'e' => "\e",   # escape         (ESC)
                        'v' => "\013", # vertical tab   (VT)
                );

                # octal char sequence
                return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;
                # C escape sequence, or else a quoted ordinary character
                return exists $es{$seq} ? $es{$seq} : $seq;
        }

        # nothing to do unless the whole string is double-quoted
        return $str unless $str =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}
1704
# Expand tabs: each tab is replaced, left to right, by the number of
# spaces needed to reach the next multiple-of-8 column.
sub untabify {
        my ($line) = @_;

        my $pos;
        while (($pos = index($line, "\t")) != -1) {
                # always between 1 and 8 spaces
                my $width = 8 - ($pos % 8);
                substr($line, $pos, 1, ' ' x $width);
        }

        return $line;
}
1718
# Count the entries returned by git_get_projects_list() whose 'path'
# equals $project.  The result is 0 (false) when there is no such entry
# or the list is empty.
sub project_in_list {
        my ($project) = @_;
        my @list = git_get_projects_list();
        my $hits = grep { $_->{'path'} eq $project } @list;
        return $hits;
}
1724
1725## ----------------------------------------------------------------------
1726## HTML aware string manipulation
1727
# Shorten $str to about $len characters, preferring not to cut a word:
# up to $add_len (default 10) further word characters are kept at the
# cut.  $where selects which part is dropped and marked with dots:
#   'right'  (default) - keep the beginning, tail becomes "... "
#   'left'             - keep the end, lead becomes " ..."
#   'center'           - keep both ends ($len split in two), middle
#                        becomes " ... "
# The string is returned unchanged (after to_utf8) when chopping plus
# the filler would not make it shorter; likewise a chopped part no longer
# than the filler is kept verbatim.
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # return early if chopping wouldn't make string shorter;
        # when chopping in the middle, $len is shared by left and right part
        if ($where eq 'center') {
                return $str if ($len + 5 >= length($str)); # filler is length 5
                $len = int($len/2);
        } else {
                return $str if ($len + 4 >= length($str)); # filler is length 4
        }

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                $str =~ m/^(.*?)($begre)$/;
                my ($lead, $body) = ($1, $2);
                $lead = " ..." if length($lead) > 4;
                return $lead . $body;
        }

        if ($where eq 'center') {
                $str =~ m/^($endre)(.*)$/;
                my ($left, $rest) = ($1, $2);
                $rest =~ m/^(.*?)($begre)$/;
                my ($mid, $right) = ($1, $2);
                $mid = " ... " if length($mid) > 5;
                return $left . $mid . $right;
        }

        # 'right'
        $str =~ m/^($endre)(.*)$/;
        my ($body, $tail) = ($1, $2);
        $tail = "... " if length($tail) > 4;
        return $body . $tail;
}
1787
# Takes the same arguments as chop_str() and returns the HTML-escaped
# result.  If the string actually got chopped, the result is wrapped in
# a <span> whose title attribute carries the full string, with control
# characters replaced by '?'.
sub chop_and_escape_str {
        my ($str) = @_;

        my $chopped = chop_str(@_);
        $str = to_utf8($str);

        # not shortened: no need for a title
        return esc_html($chopped) if $chopped eq $str;

        $str =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$str}, esc_html($chopped));
}
1803
# Escape HTML in $str while wrapping selected fragments in
# <span class="$css_class">.  The fragments are given as array references
# [ $begin, $end ] and are assumed not to overlap; all remaining
# (non-array) arguments are taken as options handed on to esc_html().
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
        my ($str, $css_class, @args) = @_;

        # separate the region pairs from the esc_html() options
        my (@regions, @opt_list);
        for my $arg (@args) {
                if (ref($arg) eq 'ARRAY') {
                        push @regions, $arg;
                } else {
                        push @opt_list, $arg;
                }
        }
        my %opts = @opt_list;
        return esc_html($str, %opts) unless @regions;

        my $out = '';
        my $pos = 0;

        for my $region (@regions) {
                my ($begin, $end) = @$region;

                # Don't create empty <span> elements.
                next if $end <= $begin;

                my $marked = esc_html(substr($str, $begin, $end - $begin),
                                      %opts);

                # plain text between previous region and this one
                if ($begin > $pos) {
                        $out .= esc_html(substr($str, $pos, $begin - $pos), %opts);
                }
                $out .= $cgi->span({-class => $css_class}, $marked);

                $pos = $end;
        }

        # plain text after the last region
        if ($pos < length($str)) {
                $out .= esc_html(substr($str, $pos), %opts);
        }

        return $out;
}
1839
# Return a list of [ $begin, $end ] pairs, one per match of $regexp
# in $str, holding the offsets of the beginning and end of that match.
# Returns an empty list (bare return) when either argument is undefined.
sub matchpos_list {
        my ($str, $regexp) = @_;
        return unless defined $str;
        return unless defined $regexp;

        my @spans;
        push @spans, [ $-[0], $+[0] ] while $str =~ /$regexp/g;
        return @spans;
}
1851
# Escape HTML in $str, highlighting every match of $regexp with the
# CSS class 'match'.  Without a regexp, or without any match, this is
# just esc_html($str).
sub esc_html_match_hl {
        my ($str, $regexp) = @_;

        my @matches;
        @matches = matchpos_list($str, $regexp) if defined $regexp;
        return esc_html($str) unless @matches;

        return esc_html_hl_regions($str, 'match', @matches);
}
1862
1863
# Like esc_html_match_hl(), but the text shown is $chopped, a shortened
# form of $str.  Matches are located in the full $str and then mapped
# onto the shortened string: a match that reaches into, or lies beyond,
# the chopped-off part is marked on the trailing "... " filler.
# With $chopped undefined this falls back to esc_html_match_hl().
sub esc_html_match_hl_chopped {
        my ($str, $chopped, $regexp) = @_;
        return esc_html_match_hl($str, $regexp) unless defined $chopped;

        my @matches = matchpos_list($str, $regexp);
        return esc_html($chopped) unless @matches;

        # split off the filler (see chop_str), if there is one
        my $tail = "... ";
        $tail = '' unless $chopped =~ s/\Q$tail\E$//;

        my $chop_len = length($chopped);
        my $tail_len = length($tail);

        # filter matches so that we mark chopped string
        my @filtered;
        for my $m (@matches) {
                my ($from, $to) = @$m;

                if ($from > $chop_len) {
                        # match is entirely in the chopped-off part
                        push @filtered, [ $chop_len, $chop_len + $tail_len ]
                                if ($tail_len > 0);
                        last;
                }
                if ($to > $chop_len) {
                        # match straddles the chop point
                        push @filtered, [ $from, $chop_len + $tail_len ];
                        last;
                }
                push @filtered, $m;
        }

        return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
}
1894
1895## ----------------------------------------------------------------------
1896## functions returning short strings
1897
# CSS class for given age value (in seconds):
# "noage" when undefined, "age0" below two hours, "age1" below two days,
# "age2" otherwise.
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1912
# Convert age in seconds to a "nn units ago" string.  The largest unit
# of which the age exceeds two is used (years, months, weeks, days,
# hours, min, sec); an age of two seconds or less gives " right now".
sub age_string {
        my ($age) = @_;

        return int($age/60/60/24/365) . " years ago"
                if $age > 60*60*24*365*2;
        return int($age/60/60/24/(365/12)) . " months ago"
                if $age > 60*60*24*(365/12)*2;
        return int($age/60/60/24/7) . " weeks ago"
                if $age > 60*60*24*7*2;
        return int($age/60/60/24) . " days ago"
                if $age > 60*60*24*2;
        return int($age/60/60) . " hours ago"
                if $age > 60*60*2;
        return int($age/60) . " min ago"
                if $age > 60*2;
        return int($age) . " sec ago"
                if $age > 2;

        return " right now";
}
1944
# Extra file-type bit patterns, used next to the constants imported
# with Fcntl ':mode'; S_IFGITLINK is the one S_ISGITLINK() tests for.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1949
# True when the file-type bits of $mode are those of a gitlink, i.e. a
# submodule/subproject entry, which is a commit object reference.
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = $mode & S_IFMT();
        return ($type_bits == S_IFGITLINK);
}
1956
# Convert a file mode, given as an octal string, to a symbolic mode
# string in the style of "ls -l".  Only the file type and -- for regular
# files -- the owner-executable bit influence the result.
sub mode_str {
        my $mode = oct(shift);

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # git cares only about the executable bit
        my $is_exec = $mode & S_IXUSR;
        return $is_exec ? '-rwxr-xr-x' : '-rw-r--r--';
}
1978
# Convert a file mode, given as an octal string, to a file type name:
# "submodule", "directory", "symlink", "file" or "unknown".
# An argument that is not a string of octal digits is returned as is.
sub file_type {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT());
        return "symlink"   if S_ISLNK($mode);
        return "file"      if S_ISREG($mode);
        return "unknown";
}
2001
# Convert a file mode, given as an octal string, to a file type
# description: like file_type(), but a regular file with the
# owner-executable bit set is described as "executable".
# An argument that is not a string of octal digits is returned as is.
sub file_type_long {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT());
        return "symlink"   if S_ISLNK($mode);
        return "unknown"   unless S_ISREG($mode);

        my $is_exec = $mode & S_IXUSR;
        return $is_exec ? "executable" : "file";
}
2028
2029
2030## ----------------------------------------------------------------------
2031## functions returning short HTML fragments, or transforming HTML fragments
2032## which don't belong to other sections
2033
# Format one line of a commit message: escape it for HTML (spaces
# become &nbsp;) and turn every word of 8 to 40 hexadecimal digits
# into a link to the "object" action for that hash.
sub format_log_line_html {
        my ($line) = @_;

        my $html = esc_html($line, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                my $hash_text = $1;
                $cgi->a({-href => href(action=>"object", hash=>$hash_text),
                         -class => "text"}, $hash_text);
        }eg;

        return $html;
}
2046
# Format the markers for all refs pointing to the object $id, as found
# in the hash reference $refs (object id => array of ref names).
# Returns '' if there is nothing to show, otherwise one <span> per ref,
# all wrapped in <span class="refs">.
#
# The link destination depends on the kind of ref and on the current
# $action:
# - annotated tags (ref name ending in '^{}') link to the tag view,
#   unless that is the current view, in which case they link to shortlog
# - other refs keep the current view if it is history, shortlog or log,
#   and link to shortlog otherwise
#
# Note: the '^{}' suffix is stripped from the ref name in place, and as
# foreach aliases the array elements, the name stored in $refs loses the
# suffix as well.
sub format_ref_marker {
        my ($refs, $id) = @_;

        return "" unless defined $refs->{$id};

        my $markers = '';
        foreach my $ref (@{$refs->{$id}}) {
                # non-lightweight tags are the only indirect objects, and
                # the only ones for which we want tag instead of shortlog
                my $indirect = ($ref =~ s/\^\{\}$//);

                # e.g. tags/v2.6.11 or heads/next
                my ($type, $name) = ($ref =~ m!^(.*?)s?/(.*)$!)
                        ? ($1, $2)
                        : ("ref", $ref);

                my $class = $indirect ? "$type indirect" : $type;

                my $dest_action = "shortlog";
                if ($indirect) {
                        $dest_action = "tag" unless $action eq "tag";
                } elsif ($action =~ /^(history|(short)?log)$/) {
                        $dest_action = $action;
                }

                # link target is always spelled with the refs/ prefix
                my $dest = ($ref =~ m!^refs/!) ? $ref : "refs/" . $ref;

                my $link = $cgi->a({
                        -href => href(
                                action=>$dest_action,
                                hash=>$dest
                        )}, esc_html($name));

                $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                        $link . "</span>";
        }

        return "" unless $markers;
        return ' <span class="refs">'. $markers . '</span>';
}
2106
# Format a title line as a link to $href, followed by $extra (markers,
# if any).  When $short is shorter than $long, the link shows $short and
# carries $long -- control characters replaced by '?' -- as its title
# attribute; otherwise $long itself is shown.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my %attr  = (-href => $href, -class => "list subject");
        my $label = $long;

        if (length($short) < length($long)) {
                $long =~ s/[[:cntrl:]]/?/g;
                $attr{-title} = to_utf8($long);
                $label = $short;
        }

        return $cgi->a(\%attr, esc_html($label)) . $extra;
}
2122
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is keyed by the lowercased email and is shared by all avatar
# engines (gravatar_url and picon_url), which are free to use it as
# preferred. Since only one avatar engine is used for any given page,
# there's no risk for cache conflicts.
our %avatar_cache = ();
2130
# Return the picon url for a given email, built for the picon search
# service at http://www.cs.indiana.edu/picons/search.html from the
# domain and user parts of the lowercased address.  The url is kept
# in %avatar_cache.
sub picon_url {
        my $email = lc $_[0];

        return $avatar_cache{$email} if $avatar_cache{$email};

        my ($user, $domain) = split('@', $email);
        my $url = "//www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                  "$domain/$user/" .
                  "users+domains+unknown/up/single";
        $avatar_cache{$email} = $url;
        return $url;
}
2144
# Return the gravatar url for a given email and size.
# Only the part of the url before the size -- the one that needs the
# MD5 digest of the lowercased email -- is stored in %avatar_cache, so
# a cached entry can be reused for different sizes.
sub gravatar_url {
        my ($address, $size) = @_;
        my $email = lc $address;

        unless ($avatar_cache{$email}) {
                $avatar_cache{$email} =
                        "//www.gravatar.com/avatar/" .
                        Digest::MD5::md5_hex($email) . "?s=";
        }
        return $avatar_cache{$email} . $size;
}
2157
# Return the <img> element for the avatar of $email, or '' if the
# configured $git_avatar provider yields no url (avatars disabled or
# unavailable).
# Options:
#   -size       => key into %avatar_size (falls back to 'default')
#   -pad_before => true to put '&nbsp;' in front of the image
#   -pad_after  => true to put '&nbsp;' after the image
sub git_get_avatar {
        my ($email, %opts) = @_;

        my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
        my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

        # Other providers can be added by extending the if chain, defining
        # $url as needed.
        my $url = "";
        if ($git_avatar eq 'gravatar') {
                $url = gravatar_url($email, $size);
        } elsif ($git_avatar eq 'picon') {
                $url = picon_url($email);
        }

        # no url from any provider: no avatar at all
        return "" unless $url;

        return $pre_white .
               qq{<img width="$size" class="avatar" src="} .
               esc_url($url) .
               qq{" alt="" />} .
               $post_white;
}
2186
# Wrap $displaytext in a link that searches for commits by $author,
# using the given $searchtype ('author' or 'committer').  When the
# 'search' feature is not enabled, $displaytext is returned as is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        return $displaytext unless gitweb_check_feature('search');

        # verb for the link title; empty for any other search type
        my %verb_for = (
                'author'    => "authored",
                'committer' => "committed",
        );
        my $performed = exists $verb_for{$searchtype}
                ? $verb_for{$searchtype}
                : "";

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                        searchtext=>$author,
                        searchtype=>$searchtype), class=>"list",
                        title=>"Search for commits $performed by $author"},
                        $displaytext);
}
2209
# Format the author name of commit $co inside an element named $tag
# (with class "author").  The name is chopped and escaped according to
# the remaining, optional arguments (see chop_str), preceded by the
# author's avatar, and passed through format_search_author().
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name   = $co->{'author_name'};
        my $author = chop_and_escape_str($name, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);

        return "<$tag class=\"author\">" .
               format_search_author($name, "author", $avatar . $author) .
               "</$tag>";
}
2223
# Format git diff header line, i.e. "diff --(git|combined|cc) ...".
# The filename part of $line is replaced by the escaped names from
# $from and $to (hashes with 'file' and, if linkable, 'href'); a name
# with an href becomes a link of class "path".  A combined diff
# ($diffinfo->{'nparents'} set) shows only the $to name, an ordinary
# diff shows "a/<from> b/<to>".
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # escaped filename of one side, with optional a/ or b/ prefix,
        # as a link when that side has an href (it has none if the file
        # was added or deleted)
        my $path_html = sub {
                my ($side, $prefix) = @_;
                my $text = esc_path($side->{'file'});
                $text = $prefix . $text if length $prefix;
                return $text unless $side->{'href'};
                return $cgi->a({-href => $side->{'href'}, -class => "path"},
                               $text);
        };

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $path_html->($to, '');
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $path_html->($from, 'a/');
                $line .= ' ';
                $line .= $path_html->($to, 'b/');
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2259
# Format one extended diff header line, i.e. a line that comes before
# the patch itself.
#
# Parameters:
#   $line     - the header line
#   $diffinfo - hash ref; 'nparents', 'from_id' and 'to_id' are read
#   $from,$to - hash refs with 'file' and 'href' of either side
#               (in a combined diff $from->{'href'} and
#               $diffinfo->{'from_id'} are indexed per parent)
#
# Transformations:
#   - "copy|rename from|to <path>": the path becomes the escaped
#     filename, linked with class "path"
#   - a line ending in a six-digit mode gets the file type description
#     appended
#   - "index <hash>,<hash>..<hash>" (combined) and
#     "index <hash>..<hash>" (ordinary): hashes are shortened to 7
#     characters and linked with class "hash"; a side without href is
#     shown as seven zeros
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                       esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                $line = 'index ';
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff; the two dots are
                # escaped so that only a literal ".." separator matches
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                # ids are interpolated as literal text, not as patterns
                $line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2325
# format from-file/to-file diff header
#
# Wraps the "--- ..." and "+++ ..." lines of a patch in <div> rows, linking
# file names where $from / $to carry an 'href'.  For a combined diff
# ($diffinfo->{'nparents'} is set) one from-file row is emitted per parent.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my $html = '';

        my $nparents = $diffinfo->{'nparents'};
        if ($nparents) {
                # combined diff (merge commit)
                foreach my $i (0 .. $nparents - 1) {
                        my $from_row = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                # "<n>" links to the diff against parent n,
                                # the file name links to the parent's version
                                $from_row = '--- ' .
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1) .
                                        '/' .
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                        }
                        $html .= qq!<div class="diff from_file">$from_row</div>\n!;
                }

        } else {
                # ordinary (single parent) diff
                my $from_row = $from_line;
                #assert($from_row =~ m/^---/) if DEBUG;
                # no extra formatting for "^--- /dev/null"
                if ($from_row =~ m!^--- "?a/!) {
                        $from_row = '--- a/' .
                                ($from->{'href'}
                                 ? $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                           esc_path($from->{'file'}))
                                 : esc_path($from->{'file'}));
                }
                $html .= qq!<div class="diff from_file">$from_row</div>\n!;
        }

        my $to_row = $to_line;
        #assert($to_row =~ m/^\+\+\+/) if DEBUG;
        # no extra formatting for "^+++ /dev/null"
        if ($to_row =~ m!^\+\+\+ "?b/!) {
                $to_row = '+++ b/' .
                        ($to->{'href'}
                         ? $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                   esc_path($to->{'file'}))
                         : esc_path($to->{'file'}));
        }
        $html .= qq!<div class="diff to_file">$to_row</div>\n!;

        return $html;
}
2391
# create note for patch simplified by combined diff
#
# Emits a "diff --cc <file>" header row followed by a "Simple merge" row.
# The file name is linked to its blob unless the file was deleted.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $path_html;
        if (is_deleted($diffinfo)) {
                $path_html = esc_path($diffinfo->{'to_file'});
        } else {
                $path_html = $cgi->a({-href => href(action=>"blob",
                                                    hash_base=>$hash,
                                                    hash=>$diffinfo->{'to_id'},
                                                    file_name=>$diffinfo->{'to_file'}),
                                      -class => "path"},
                                     esc_path($diffinfo->{'to_file'}));
        }

        return "<div class=\"diff header\">" .
               "diff --cc " .
               $path_html .
               "</div>\n" . # class="diff header"
               "<div class=\"diff nodifferences\">" .
               "Simple merge" .
               "</div>\n"; # class="diff nodifferences"
}
2416
# Classify one patch line, returning the CSS class name for it:
# "chunk_header", "incomplete", "ctx", "add", "rem", or "" when nothing fits.
# When $from->{'href'} is an array reference (combined diff) its length is
# the number of leading sign columns; otherwise one column is assumed.
sub diff_line_class {
        my ($line, $from, $to) = @_;

        my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
                ? scalar @{$from->{'href'}}   # combined diff
                : 1;                          # ordinary diff

        return "chunk_header" if ($line =~ /^\@\@{$num_sign} /);
        return "incomplete"   if ($line =~ /^\\/);
        # context must be tested before add/rem, because the add/rem
        # patterns also accept sign columns made only of spaces
        return "ctx"          if ($line =~ /^ {$num_sign}/);
        return "add"          if ($line =~ /^[+ ]{$num_sign}/);
        return "rem"          if ($line =~ /^[- ]{$num_sign}/);

        # fallback
        return "";
}
2445
# assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for unified diff
#
# Returns the chunk header as HTML: the "-start[,count]" and "+start[,count]"
# ranges become links to the matching line anchors ("#l<start>") when the
# respective side has an 'href'; the trailing section text is escaped.
# A line that is not a well-formed chunk header is returned escaped, as is.
sub format_unidiff_chunk_header {
        my ($line, $from, $to) = @_;

        # only the range texts and their starting lines are needed
        my ($from_text, $from_start, $to_text, $to_start, $section) =
                $line =~ m/^\@{2} (-(\d+)(?:,\d+)?) (\+(\d+)(?:,\d+)?) \@{2}(.*)$/;

        # keep the text of a malformed header instead of printing empty fields
        return esc_html($line, -nbsp=>1) unless defined $from_text;

        if ($from->{'href'}) {
                $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
                                     -class=>"list"}, $from_text);
        }
        if ($to->{'href'}) {
                $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                     -class=>"list"}, $to_text);
        }
        $line = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
                "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
        return $line;
}
2469
# assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for combined diff
#
# Returns the chunk header as HTML: each "-start[,count]" range is linked
# to the line anchor of the matching parent when $from->{'href'}[$i] is set,
# the final "+start[,count]" range is linked via $to->{'href'}.
# A line that is not a well-formed chunk header is returned escaped, as is.
sub format_cc_diff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

        # one range per parent, followed by the range of the result
        my @from_text = defined $ranges ? split(' ', $ranges) : ();
        my $to_text   = pop @from_text;

        # keep the text of a malformed header instead of printing empty fields
        return esc_html($line, -nbsp=>1) unless defined $to_text;

        # starting line of a range: drop the sign and the optional count
        my $range_start = sub {
                my ($start) = split(',', substr($_[0], 1));
                return defined $start ? $start : 0;
        };

        $line = "<span class=\"chunk_info\">$prefix ";
        for my $i (0 .. $#from_text) {
                if ($from->{'href'}[$i]) {
                        my $start = $range_start->($from_text[$i]);
                        $line .= $cgi->a({-href=>"$from->{'href'}[$i]#l$start",
                                          -class=>"list"}, $from_text[$i]);
                } else {
                        $line .= $from_text[$i];
                }
                $line .= " ";
        }
        if ($to->{'href'}) {
                my $start = $range_start->($to_text);
                $line .= $cgi->a({-href=>"$to->{'href'}#l$start",
                                  -class=>"list"}, $to_text);
        } else {
                $line .= $to_text;
        }
        $line .= " $prefix</span>" .
                 "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
        return $line;
}
2508
# process patch (diff) line (not to be used for diff headers),
# returning HTML-formatted (but not wrapped) line.
# If the line is passed as a reference, it is treated as HTML and not
# esc_html()'ed.
# The result is a <div> of class "diff", plus $diff_class when one is given.
sub format_diff_line {
        my ($line, $diff_class, $from, $to) = @_;

        my $html;
        if (ref($line)) {
                # caller supplied ready-made HTML
                $html = $$line;
        } else {
                chomp $line;
                my $text = untabify($line);
                # chunk headers are linked only when both sides are known
                my $linkable = ($from && $to);

                if ($linkable && $text =~ m/^\@{2} /) {
                        $html = format_unidiff_chunk_header($text, $from, $to);
                } elsif ($linkable && $text =~ m/^\@{3}/) {
                        $html = format_cc_diff_chunk_header($text, $from, $to);
                } else {
                        $html = esc_html($text, -nbsp=>1);
                }
        }

        my $diff_classes = $diff_class ? "diff $diff_class" : "diff";
        return "<div class=\"$diff_classes\">$html</div>\n";
}
2537
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
sub format_snapshot_links {
        my ($hash) = @_;
        my $num_fmts = @snapshot_fmts;

        # no snapshot format available
        return undef if ($num_fmts == 0);

        if ($num_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                # i.e. "_snapshot_"
                my ($fmt) = @snapshot_fmts;
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links;
        foreach my $fmt (@snapshot_fmts) {
                push @links,
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                )
                        }, $known_snapshot_formats{$fmt}{'display'});
        }
        return "snapshot (" . join(' ', @links) . ")";
}
2572
2573## ......................................................................
2574## functions returning values to be passed, perhaps after some
2575## transformation, to other functions; e.g. returning arguments to href()
2576
# returns hash to be passed to href to generate gitweb URL
# in -title key it returns description of link
#
# The optional argument is the feed format name (default 'Atom'); its
# lowercased form becomes the 'action'.  Returns nothing when no project is
# selected or the current action has no feed of its own.
sub get_feed_info {
        my ($format) = @_;
        $format ||= 'Atom';

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use the 'refs/' + <branch ref dir> + '/' prefix
        # (fullname) to differentiate them from tag links; this also makes
        # it possible to detect branch links
        my $branch = undef;
        my $matched_ref = 0;
 REF:
        foreach my $ref (get_branch_refs()) {
                # $hash_base takes precedence over $hash
                foreach my $candidate ($hash_base, $hash) {
                        next unless defined $candidate;
                        if ($candidate =~ m!^refs/\Q$ref\E/(.*)$!) {
                                $branch = $1;
                                $matched_ref = $ref;
                                last REF;
                        }
                }
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type  = "history of $file_name";
                $type .= "/" if ($action eq 'tree');
                $type .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $type = "log of $branch";
        } else {
                $type = 'log';
        }

        my %res = (
                action      => lc($format),
                -title      => $type,
                'hash'      => (defined $branch ? "refs/$matched_ref/$branch" : undef),
                'file_name' => $file_name,
        );

        return %res;
}
2618
2619## ----------------------------------------------------------------------
2620## git utility subroutines, invoking git commands
2621
# returns path to the core git executable and the --git-dir parameter as list
# (every call is also counted in $number_of_git_cmds)
sub git_cmd {
        $number_of_git_cmds += 1;
        return ($GIT, "--git-dir=$git_dir");
}
2627
# quote the given arguments for passing them to the shell
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $word (@_) {
                # close the quote, emit the escaped character, reopen the quote
                (my $escaped = $word) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }
        return join(' ', @quoted);
}
2636
# get HEAD ref of given project as hash
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2641
# resolve a revision of the given project; all arguments are handed to
# git_get_hash() unchanged
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2645
# like git_get_full_hash(), but appends the '--short=7' option to the
# arguments handed to git_get_hash()
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2649
# Run "git rev-parse --verify -q @options $hash" in the repository of
# $project and return the first line of its output without the newline,
# or undef when the command could not be started or printed nothing.
# $git_dir points at the project while the command runs; its previous
# value is put back afterwards only if it was defined.
sub git_get_hash {
        my ($project, $hash, @options) = @_;

        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        my $retval = undef;
        my $opened = open(my $fd, '-|', git_cmd(), 'rev-parse',
                          '--verify', '-q', @options, $hash);
        if ($opened) {
                $retval = <$fd>;
                chomp $retval if defined $retval;
                close $fd;
        }

        $git_dir = $saved_git_dir if (defined $saved_git_dir);
        return $retval;
}
2666
# get type of given object
# (first output line of "git cat-file -t"; returns nothing when the command
# cannot be started or closing its pipe reports failure)
sub git_get_type {
        my ($hash) = @_;

        my @cmd = (git_cmd(), "cat-file", '-t', $hash);
        open(my $fd, "-|", @cmd) or return;
        my $type = <$fd>;
        return unless close($fd);

        chomp $type;
        return $type;
}
2677
# repository configuration
# $config_file: path of the config whose values are currently held in %config
# %config: configuration keys and values of that repository
our ($config_file, %config);
$config_file = '';
2681
# store multiple values for single key as anonymous array reference
# single values stored directly in the hash, not as [ <value> ]
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                my $current = $hash->{$key};
                if (ref $current) {
                        # third and later values: extend the list in place
                        push @{$current}, $value;
                } else {
                        # second value: promote the scalar to a list
                        $hash->{$key} = [ $current, $value ];
                }
        } else {
                # first value: keep it as a plain scalar
                $hash->{$key} = $value;
        }
}
2695
# return hash of git project configuration
# optionally limited to some section, e.g. 'gitweb'
#
# Reads "git config -z -l"; a key given more than once ends up as an array
# reference (see hash_set_multi), a key without a value maps to undef.
# Returns nothing when the command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  (A /o flag on the match
        # would keep the pattern of the very first call for the whole life of
        # the process, ignoring a different $section_regexp later on.)
        my $wanted_key = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # records of "git config -z" are NUL-terminated
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline
                my ($key, $value) = split(/\n/, $keyval, 2);

                next if (defined $wanted_key && $key !~ $wanted_key);
                hash_set_multi(\%config, $key, $value);
        }
        close $fh;

        return %config;
}
2718
# convert config value to boolean: 'true' or 'false'
# no value, number > 0, 'true', 'yes' and 'on' values are true
# (these are the true literals git itself accepts)
# rest of values are treated as false (never as error)
sub config_to_bool {
        my $val = shift;

        return 1 if !defined $val;             # section.key

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        return (($val =~ /^\d+$/ && $val) ||      # section.key = 1
                ($val =~ /^(?:true|yes|on)$/i));  # section.key = true
}
2734
# convert config value to simple decimal number
# an optional value suffix of 'k', 'm', or 'g' will cause the value
# to be multiplied by 1024, 1048576, or 1073741824
# a value without such a suffix is returned as is (whitespace stripped),
# an undefined value (key without value) is returned as undef
sub config_to_int {
        my $val = shift;

        # key without a value: nothing to strip or scale
        return $val unless defined $val;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier_for = (
                k =>       1024,
                m =>    1048576,
                g => 1073741824,
        );
        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
                return $num * $multiplier_for{lc($unit)};
        }
        return $val;
}
2754
# convert config value to array reference, if needed
# (a reference is returned unchanged, a defined scalar becomes a
# one-element list, an undefined value becomes an empty list)
sub config_to_multi {
        my ($val) = @_;

        return $val if ref($val);
        return []   unless defined($val);
        return [ $val ];
}
2761
# Look up the "gitweb.$key" variable of the current repository ($git_dir).
# $type may be 'bool' or 'int' (a leading "--" is accepted): 'bool' yields
# the string 'true' or 'false', 'int' goes through config_to_int(); any
# other type is ignored and the stored value is returned as is.
# Returns nothing when $git_dir is unset, the key is empty or malformed,
# or the variable is not present.
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        # only subsection, if exists, is case sensitive,
        # and not lowercased by 'git config -z -l'
        if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
                my ($hi, $mi, $lo) = ($1, $2, $3);
                $lo =~ s/_//g;
                $key = join(".", lc($hi), $mi, lc($lo));
                return if ($lo =~ /\W/ || $hi =~ /\W/);
        } else {
                $key = lc($key);
                $key =~ s/_//g;
                return if ($key =~ /\W/);
        }
        $key =~ s/^gitweb\.//;

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                my $known = ($type eq 'bool' || $type eq 'int');
                $type = undef unless $known;
        }

        # get config; parsed again whenever the repository has changed
        my $current_config = "$git_dir/config";
        if (!defined $config_file || $config_file ne $current_config) {
                %config = git_parse_project_config('gitweb');
                $config_file = $current_config;
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        return unless exists $config{$full_key};

        # ensure given type
        return $config{$full_key} unless defined $type;
        if ($type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return config_to_bool($config{$full_key}) ? 'true' : 'false';
        }
        if ($type eq 'int') {
                return config_to_int($config{$full_key});
        }
        return $config{$full_key};
}
2810
# get hash of given path at given ref
#
# $base is the tree-ish to look in, $path the file or directory name and
# $type, when given, the object type ("blob", "tree", ...) the entry must
# have.  Returns the object id, or undef when the path is missing, is not
# present at $base, has a different type, or the ls-tree output cannot be
# parsed.
sub git_get_hash_by_path {
        my ($base, $path, $type) = @_;

        # test for presence, not truth: "0" is a perfectly valid file name
        return undef unless (defined $path && $path ne '');

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # take the fields from the match itself, so that a failed match can
        # never hand back captures left over from some earlier match
        my (undef, $obj_type, $obj_hash) =
                $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/
                or return undef;

        if (defined $type && $type ne $obj_type) {
                # type doesn't match
                return undef;
        }
        return $obj_hash;
}
2837
# get path of entry with given hash at given tree-ish (ref)
# used to get 'from' filename for combined diff (merge commit) for renames
#
# Walks "git ls-tree -r -t -z $base" and returns the path of the first
# entry whose object id is $hash; undef when there is none or the command
# cannot be started, nothing when an argument is missing.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # entries of "ls-tree -z" are NUL-terminated
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # $hash is matched as plain text (\Q..\E) in the object id
                # column only; /s lets the path contain newlines, which -z
                # output leaves unquoted
                if ($line =~ m/^[0-9]+ [^ ]+ \Q$hash\E\t(.+)\z/s) {
                        close $fd;
                        return $1;
                }
        }
        close $fd;
        return undef;
}
2861
2862## ......................................................................
2863## git utility functions, directly accessing git repository
2864
# get the value of config variable either from file named as the variable
# itself in the repository ($GIT_DIR/$name file), or from gitweb.$name
# configuration variable in the repository config file.
# Only the first line of the file is used.  Note that $git_dir is set to
# the repository of $path as a side effect.
sub git_get_file_or_project_config {
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        if (!open($fd, '<', "$git_dir/$name")) {
                # no such file: fall back to the repository config
                return git_get_project_config($name);
        }
        my $conf = <$fd>;
        close $fd;

        chomp $conf if (defined $conf);
        return $conf;
}
2881
# description of the project at $path: taken from its 'description' file,
# or from gitweb.description when there is no such file
sub git_get_project_description {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'description');
}
2886
# category of the project at $path: taken from its 'category' file,
# or from gitweb.category when there is no such file
sub git_get_project_category {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'category');
}
2891
2892
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
#
# Returns a hash reference mapping tag name to weight.  Note that $git_dir
# is set to the repository of $project as a side effect.
sub git_get_project_ctags {
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        # only the first line matters; an empty file gives undef
                        my $val = <$ct>;
                        close $ct;
                        chomp $val if defined $val;

                        # tag name is the file name without its directory
                        (my $ctag = $tagfile) =~ s#.*/##;
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2939
# return hash, where keys are content tags ('ctags'),
# and values are sum of weights of given tag in every project
# ($projects is a reference to a list of project hashes, each of which
# keeps its own tag => weight hash under the 'ctags' key)
sub git_gather_all_ctags {
        my ($projects) = @_;
        my %total;

        for my $proj (@$projects) {
                $total{$_} += $proj->{'ctags'}{$_}
                        for keys %{$proj->{'ctags'}};
        }

        return \%total;
}
2954
# Build the tag cloud for the tag => weight hash $ctags.  Tags differing
# only in case are merged.  Returns an HTML::TagCloud object when that
# module can be loaded, otherwise a hash reference mapping the lowercased
# tag to { count => <weight>, ctag => <link HTML> }.  The tag selected by
# the 'ctag' input parameter is wrapped in <span class="match">.
sub git_populate_project_tagcloud {
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $name (keys %$ctags) {
                my $weight = $ctags->{$name};
                my $entry  = ($ctags_lc{lc $name} ||= {});
                $entry->{count} += $weight;
                # the spelling with the largest weight names the merged tag
                if (!$entry->{topcount} || $entry->{topcount} < $weight) {
                        $entry->{topcount} = $weight;
                        $entry->{topname}  = $name;
                }
        }

        my $matched = $input_params{'ctag'};
        # highlight the title of the currently selected tag
        my $mark_match = sub {
                my ($ctag, $title) = @_;
                return $title unless (defined $matched && $matched eq $ctag);
                return qq(<span class="match">$title</span>);
        };

        my $cloud;
        if (eval { require HTML::TagCloud; 1; }) {
                $cloud = HTML::TagCloud->new;
                foreach my $ctag (sort keys %ctags_lc) {
                        # Pad the title with spaces so that the cloud looks
                        # less crammed.
                        my $title = esc_html($ctags_lc{$ctag}->{topname});
                        $title =~ s/ /&nbsp;/g;
                        $title =~ s/^/&nbsp;/g;
                        $title =~ s/$/&nbsp;/g;
                        $title = $mark_match->($ctag, $title);
                        $cloud->add($title, href(project=>undef, ctag=>$ctag),
                                    $ctags_lc{$ctag}->{count});
                }
        } else {
                $cloud = {};
                foreach my $ctag (keys %ctags_lc) {
                        my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
                        $title = $mark_match->($ctag, $title);
                        my $link = $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                        $cloud->{$ctag} = {
                                count => $ctags_lc{$ctag}->{count},
                                ctag  => $link,
                        };
                }
        }
        return $cloud;
}
3000
# Render the tag cloud made by git_populate_project_tagcloud() as HTML,
# showing at most $count tags (all of them when $count is undefined).
# An HTML::TagCloud object renders itself; the plain-hash fallback becomes
# a comma separated list of links, ordered by increasing weight.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        }

        # lightest tag first; names break ties so the order is stable
        my @tags = sort {
                $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'}
                        or $a cmp $b
        } keys %$cloud;

        # When the list has to be cut, keep the $count heaviest tags, i.e.
        # drop entries from the light end of the list.
        if (defined $count && $count < @tags) {
                my $excess = @tags - ($count > 0 ? $count : 0);
                splice(@tags, 0, $excess);
        }

        return
                '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
                join (', ', map {
                        $cloud->{$_}->{'ctag'}
                } @tags) .
                '</div>';
}
3015
# URLs of the project at $path: the lines of its 'cloneurl' file or, when
# that file cannot be opened, the values of the multi-valued gitweb.url
# config variable.  Returns a list in list context and an array reference
# otherwise.  Note that $git_dir is set to the repository of $path as a
# side effect.
sub git_get_project_url_list {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        if (!open($fd, '<', "$git_dir/cloneurl")) {
                my $from_config = config_to_multi(git_get_project_config('url'));
                return wantarray ? @{$from_config} : $from_config;
        }

        my @git_project_url_list = <$fd>;
        chomp @git_project_url_list;
        close $fd;

        return wantarray ? @git_project_url_list : \@git_project_url_list;
}
3029
3030sub git_get_projects_list {
3031        my $filter = shift || '';
3032        my $paranoid = shift;
3033        my @list;
3034
3035        if (-d $projects_list) {
3036                # search in directory
3037                my $dir = $projects_list;
3038                # remove the trailing "/"
3039                $dir =~ s!/+$!!;
3040                my $pfxlen = length("$dir");
3041                my $pfxdepth = ($dir =~ tr!/!!);
3042                # when filtering, search only given subdirectory
3043                if ($filter && !$paranoid) {
3044                        $dir .= "/$filter";
3045                        $dir =~ s!/+$!!;
3046                }
3047
3048                File::Find::find({
3049                        follow_fast => 1, # follow symbolic links
3050                        follow_skip => 2, # ignore duplicates
3051                        dangling_symlinks => 0, # ignore dangling symlinks, silently
3052                        wanted => sub {
3053                                # global variables
3054                                our $project_maxdepth;
3055                                our $projectroot;
3056                                # skip project-list toplevel, if we get it.
3057                                return if (m!^[/.]$!);
3058                                # only directories can be git repositories
3059                                return unless (-d $_);
3060                                # don't traverse too deep (Find is super slow on os x)
3061                                # $project_maxdepth excludes depth of $projectroot
3062                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
3063                                        $File::Find::prune = 1;
3064                                        return;
3065                                }
3066
3067                                my $path = substr($File::Find::name, $pfxlen + 1);
3068                                # paranoidly only filter here
3069                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
3070                                        next;
3071                                }
3072                                # we check related file in $projectroot
3073                                if (check_export_ok("$projectroot/$path")) {
3074                                        push @list, { path => $path };
3075                                        $File::Find::prune = 1;
3076                                }
3077                        },
3078                }, "$dir");
3079
3080        } elsif (-f $projects_list) {
3081                # read from file(url-encoded):
3082                # 'git%2Fgit.git Linus+Torvalds'
3083                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
3084                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
3085                open my $fd, '<', $projects_list or return;
3086        PROJECT:
3087                while (my $line = <$fd>) {
3088                        chomp $line;
3089                        my ($path, $owner) = split ' ', $line;
3090                        $path = unescape($path);
3091                        $owner = unescape($owner);
3092                        if (!defined $path) {
3093                                next;
3094                        }
3095                        # if $filter is provided, check if $path begins with $filter
3096                        if ($filter && $path !~ m!^\Q$filter\E/!) {
3097                                next;
3098                        }
3099                        if (check_export_ok("$projectroot/$path")) {
3100                                my $pr = {
3101                                        path => $path
3102                                };
3103                                if ($owner) {
3104                                        $pr->{'owner'} = to_utf8($owner);
3105                                }
3106                                push @list, $pr;
3107                        }
3108                }
3109                close $fd;
3110        }
3111        return @list;
3112}
3113
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
# as side effects it sets 'forks' field to list of forks for forked projects
#
# Takes a reference to an array of project hashes (each with a 'path' key)
# and returns the list of those projects that are not located below
# another project's fork directory.
sub filter_forks_from_projects_list {
        my $projects = shift;

        # Prefix tree keyed by path component.  The '' key of a node, when
        # present, marks the end of a project path and holds that project.
        my %trie;

        # pass 1: register every project that might contain forks
        foreach my $pr (@$projects) {
                my $path = $pr->{'path'};
                $path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
                next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
                next unless ($path);      # skip '.git' repository: tests, git-instaweb
                next unless (-d "$projectroot/$path"); # containing directory exists
                $pr->{'forks'} = [];      # there can be 0 or more forks of project

                # descend through the trie, creating the nodes that are missing
                my $node = \%trie;
                foreach my $component (split('/', $path)) {
                        $node->{$component} = {}
                                unless exists $node->{$component};
                        $node = $node->{$component};
                }
                # the first project to reach this node keeps the end marker
                $node->{''} = $pr unless exists $node->{''};
        }

        # pass 2: a project is a fork when some shorter prefix of its path
        # ends at an end marker
        my @filtered;
 PROJECT:
        foreach my $pr (@$projects) {
                my $node = \%trie;
                foreach my $component (split('/', $pr->{'path'})) {
                        if (exists $node->{''}) {
                                # found [shortest] prefix: record as fork, drop from result
                                push @{$node->{''}{'forks'}}, $pr;
                                next PROJECT;
                        }
                        unless (exists $node->{$component}) {
                                # left the trie: no prefix can match, not a fork
                                push @filtered, $pr;
                                next PROJECT;
                        }
                        $node = $node->{$component};
                }
                # all components consumed without hitting a marker or a miss
                push @filtered, $pr;
        }

        return @filtered;
}
3173
# note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled
#
# Returns the projects from @$projlist that carry the tag given as
# 'tagfilter' (compared case-insensitively) and whose 'path' or
# 'descr_long' matches 'search_regexp'.  With neither option set the
# list is returned unchanged.
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my $wanted_tag = $opts{'tagfilter'};
        my $pattern    = $opts{'search_regexp'};

        # nothing to filter on
        if (!$wanted_tag && !$pattern) {
                return @$projlist;
        }

        # searching projects require filling to be run before it;
        fill_project_list_info($projlist,
                               $wanted_tag ? 'ctags' : (),
                               $pattern    ? ('path', 'descr') : ());

        my @matching;
        foreach my $pr (@$projlist) {
                if ($wanted_tag) {
                        next if ref($pr->{'ctags'}) ne 'HASH';
                        my $has_tag =
                                grep { lc($_) eq lc($wanted_tag) } keys %{$pr->{'ctags'}};
                        next if !$has_tag;
                }

                if ($pattern) {
                        my $hit = $pr->{'path'} =~ /$pattern/ ||
                                  $pr->{'descr_long'} =~ /$pattern/;
                        next if !$hit;
                }

                push @matching, $pr;
        }

        return @matching;
}
3209
our $gitweb_project_owner = undef;
# Fill the $gitweb_project_owner cache (hash reference: project path =>
# owner) from the $projects_list file.  Does nothing when the cache is
# already defined.  The cache is left as an empty hash when $projects_list
# is not a plain file or cannot be opened.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        return unless (-f $projects_list);

        # an unreadable file is treated like a missing one instead of
        # reading from an unopened handle
        open(my $fd, '<', $projects_list) or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($pr, $ow) = split ' ', $line;
                # blank line: there is no project name to use as a key
                next unless defined $pr;
                $pr = unescape($pr);
                $ow = unescape($ow);
                $gitweb_project_owner->{$pr} = to_utf8($ow);
        }
        close $fd;
}
3232
# Return the owner of $project, trying in order: the projects list
# cache, the 'owner' project config value, and the owner of the
# repository directory.  Returns undef for a false $project.
# Side effect: sets the global $git_dir to "$projectroot/$project".
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # make sure the projects list cache has been loaded
        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if exists $gitweb_project_owner->{$project};
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
3256
# Return (age in seconds, age string) of the most recent commit on any
# branch ref of the repository at "$projectroot/$path", (undef, undef)
# when no committer timestamp could be read, or an empty list when the
# git command could not be run or closed cleanly.
# Side effect: sets the global $git_dir.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   map { "refs/$_" } get_branch_refs ());
        open(my $fd, "-|", @cmd) or return;
        my $newest = <$fd>;
        close $fd or return;

        # the committer line ends in "<epoch> <timezone>"
        return (undef, undef)
                unless defined $newest &&
                       $newest =~ / (\d+) [-+][01]\d\d\d$/;

        my $age = time - $1;
        return ($age, age_string($age));
}
3277
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and keep
# only the entries we want.
#
# Returns a hash (list context) or hash reference (scalar context) mapping
# remote name => { 'heads' => undef, <key> => <url>, ... }, where <key> is
# the word 'git remote -v' prints in parentheses after the URL.  With
# $wanted set, only that remote is reported.  Returns nothing when the
# command cannot be run or closed cleanly.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        open my $fd, '-|' , git_cmd(), 'remote', '-v';
        return unless $fd;
        while (my $remote = <$fd>) {
                chomp $remote;
                # Strip "\t<url> (<key>)", leaving the bare remote name.  A
                # line of any other shape is skipped: the capture variables
                # would otherwise still hold values from an earlier match.
                next unless $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # explicit undef: "'heads' => ()" is an odd-length list
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3302
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
#
# Each remote's 'heads' entry becomes a reference to an array of the head
# items whose name starts with "<remote>/"; that prefix is removed from
# the item's 'name' as a side effect.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q...\E: the remote name is literal text, not a pattern, so
                # e.g. a '.' in it must not match an arbitrary character
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3315
# Return a reference to a hash mapping object id => array of ref names
# (without the leading "refs/") as reported by 'git show-ref
# --dereference'.  With $type given, only refs below "refs/$type" are
# requested and kept.  Returns nothing when the command cannot be run or
# closed cleanly.
sub git_get_references {
        my $type = shift || "";
        my %refs;

        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                # the list for a new id is created on first push
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
3338
# Return the name 'git name-rev --tags' gives to $hash, without the
# leading "tags/", or undef when $hash is false or the output does not
# name a tag.  Returns nothing when the command cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # any other output, including '$hash undefined', means "no tag"
        return $name_rev =~ m|^$hash tags/(.*)$| ? $1 : undef;
}
3354
3355## ----------------------------------------------------------------------
3356## parse to hash functions
3357
# Break an epoch timestamp into display fields.
#
# Parameters:
#   $epoch - seconds since the epoch
#   $tz    - timezone as "+HHMM" / "-HHMM"; defaults to "-0000"
#
# Returns a hash with the UTC fields 'hour', 'minute', 'mday', 'day',
# 'month', 'rfc2822', 'mday-time' and 'iso-8601', and the fields
# 'hour_local', 'minute_local', 'tz_local' and 'iso-tz' computed for $tz.
# A $tz that is not of the +HHMM / -HHMM form is treated as a zero offset
# (it is still echoed in 'tz_local' and 'iso-tz').
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # Offset of $tz from UTC in seconds.  Only computed when $tz parses,
        # so a malformed value does not lead to arithmetic on undefined
        # captures.
        my $offset = 0;
        if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
                my $tz_sign = ($1 eq '-' ? -1 : +1);
                $offset = $tz_sign*((($2*60) + $3)*60);
        }
        my $local = $epoch + $offset;
        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3391
# Parse the tag object $tag_id as printed by 'git cat-file tag'.
#
# Returns a hash with 'id', the header fields found ('object', 'type',
# 'name', 'author', 'author_epoch', 'author_tz', 'author_name',
# 'author_email') and 'comment' (reference to an array of message lines).
# Returns nothing when the command cannot be run or closed cleanly, or
# when no "tag <name>" header was seen.
sub parse_tag {
        my $tag_id = shift;
        my %tag;
        my @comment;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
        $tag{'id'} = $tag_id;

 HEADER:
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                        next HEADER;
                }
                if ($line =~ m/--BEGIN/) {
                        # this line already belongs to the message
                        push @comment, $line;
                        last HEADER;
                }
                # an empty line separates the header from the message
                last HEADER if $line eq "";
        }
        # whatever is left on the handle is the message
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag
}
3432
# Parse one record of 'git rev-list --header' output.
#
# Parameters:
#   $commit_text - the record; the first line is the commit id, followed
#                  by parent ids when rev-list was run with --parents
#   $withparents - when defined, parents are taken from the first line
#                  only and "parent" header lines are ignored
#
# Returns a hash describing the commit ('id', 'tree', 'parents', 'parent',
# author and committer fields, 'title', 'title_short', 'comment' and the
# age fields), or nothing when the text has no lines, does not start with
# an object id, or has no "tree" header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        return unless @commit_lines;

        my $header = shift @commit_lines;
        return unless $header =~ m/^[0-9a-fA-F]{40}/;
        ($co{'id'}, my @parents) = split ' ', $header;

        # split "Name <email>" stored in $co{$who} into "<who>_name" and
        # "<who>_email"; without an <email> part the whole value is the name
        my $split_ident = sub {
                my ($who) = @_;
                if ($co{$who} =~ m/^([^<]+) <([^>]*)>/) {
                        $co{"${who}_name"}  = $1;
                        $co{"${who}_email"} = $2;
                } else {
                        $co{"${who}_name"} = $co{$who};
                }
        };

        # header lines; the loop stops at the first false (empty) line
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        $split_ident->('author');
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        $split_ident->('committer');
                }
        }
        return unless defined $co{'tree'};

        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # pieces dropped one at a time from a long title, for as long as it
        # is still longer than 50 characters
        my @noise = (
                qr/(http|rsync):\/\//,
                qr/(master|www|rsync)\./,
                qr/kernel.org:?/,
                qr/\/pub\/scm/,
        );
        # $title aliases the element of @commit_lines, so the edits below
        # also change the stored message line
        foreach my $title (@commit_lines) {
                $title =~ s/^    //;
                next if $title eq "";

                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        foreach my $re (@noise) {
                                $title =~ s/$re// if length($title) > 50;
                        }
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        s/^    // foreach @commit_lines;
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($mday, $mon, $year) = (gmtime($co{'committer_epoch'}))[3, 4, 5];
        my $date_string = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        # older than two weeks: the date comes first, the age second
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = $date_string;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = $date_string;
        }
        return %co;
}
3530
# Run 'git rev-list --parents --header --max-count=1' for $commit_id and
# return the hash parse_commit_text() builds from its output.  Calls
# die_error(500, ...) when the command cannot be started.
sub parse_commit {
        my ($commit_id) = @_;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--parents",
                   "--header",
                   "--max-count=1",
                   $commit_id,
                   "--");
        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");
        my %co = parse_commit_text(<$fd>, 1);
        close $fd;

        return %co;
}
3549
# Run 'git rev-list --header' starting at $commit_id and parse each record
# with parse_commit_text().
#
# Parameters:
#   $commit_id - revision to start from
#   $maxcount  - value for --max-count (1 when false)
#   $skip      - value for --skip (0 when false)
#   $filename  - optional path limiter, passed after "--"
#   @args      - extra rev-list options, placed right after --header
#
# Returns the list of commit hash references, or a reference to that list
# in scalar context.  Calls die_error(500, ...) when the command cannot
# be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
        my @cos;

        $maxcount = 1 unless $maxcount;
        $skip     = 0 unless $skip;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--header",
                   @args,
                   "--max-count=$maxcount",
                   "--skip=$skip",
                   @extra_options,
                   $commit_id,
                   "--");
        push @cmd, $filename if $filename;

        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3577
# parse line of git-diff-tree "raw" output
#
# Three shapes of line are recognized: an ordinary diff line (one leading
# ':'), a combined diff line for a merge (two or more leading ':'), and a
# bare 40-digit commit id.  Returns a hash, or a hash reference in scalar
# context; the hash is empty for any other line.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} =
                        ($1, $2, $3, $4, $5, $6);
                my $names = $7;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') {
                        # renamed or copied: "<from>\t<to>"
                        ($res{'from_file'}, $res{'to_file'}) =
                                map { unquote($_) } split("\t", $names);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
                my ($colons, $modes, $ids, $statuses, $name) = ($1, $2, $3, $4, $5);
                $res{'nparents'}  = length($colons);
                # the last mode / id belongs to the result, the others to the parents
                my @modes = split(' ', $modes);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                my @ids = split(' ', $ids);
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $statuses) ];
                $res{'to_file'}   = unquote($name);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3616
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # pre-parsed (or generated by hand): hand it back untouched
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3629
# parse line of git-ls-tree output
#
# Parameters:
#   $line - one entry of ls-tree output
#   %opts - '-l': the line carries a size column ('ls-tree -l');
#           '-z': the name is taken verbatim instead of being unquoted
#
# Returns a hash (a hash reference in scalar context) with 'mode', 'type',
# 'hash', 'name' and, with '-l', 'size'.  For a line that does not have
# the expected shape all of these are undef.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;
        my $name;

        # Assign straight from the match in list context: a failed match
        # gives an empty list, so every field becomes undef instead of
        # picking up capture variables left over from an earlier match.
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                (@res{'mode', 'type', 'hash', 'size'}, $name) =
                        ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s);
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                (@res{'mode', 'type', 'hash'}, $name) =
                        ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);
        }

        if ($opts{'-z'} || !defined $name) {
                $res{'name'} = $name;
        } else {
                $res{'name'} = unquote($name);
        }

        return wantarray ? %res : \%res;
}
3665
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# Fills %$from and %$to with 'file' and 'href' (link to the "blob" view)
# for the pre-image and post-image of $diffinfo.  For a combined diff the
# $from entries are array references with one element per parent; @parents
# supplies the hash_base for each of them.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # without a name recorded for this parent, use the result's name
                        my $parent_file = $diffinfo->{'from_file'}[$i];
                        $parent_file = $diffinfo->{'to_file'}
                                unless defined $parent_file;
                        $from->{'file'}[$i] = $parent_file;

                        if ($diffinfo->{'status'}[$i] eq "A") {
                                # new (added) file: nothing to link to
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        } else {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") {
                        # new (added) file: nothing to link to
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3711
3712## ......................................................................
3713## parse to array of hashes functions
3714
# List refs of the given classes, most recently committed first.
#
# Parameters:
#   $limit   - when true, at most $limit+1 refs are requested
#   @classes - ref namespaces below "refs/"; defaults to get_branch_refs()
#
# Returns a list of hash references (a reference to the list in scalar
# context), each with 'fullname', 'name', 'id', 'title', 'epoch' and
# 'age'.  Returns nothing when the git command cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = get_branch_refs() unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;

        # the same for every line, so built once
        my $strip_refs = join '|', map { quotemeta } get_branch_refs();

        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $name, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
                $ref_item{'fullname'}  = $name;
                # $1 is only meaningful when the substitution matched;
                # otherwise it would still hold the committer captured above
                my $ref_dir = ($name =~ s!^refs/($strip_refs|remotes)/!!) ? $1 : '';
                $ref_item{'name'} = $name;
                # for refs neither in 'heads' nor 'remotes' we want to
                # show their ref dir
                if ($ref_dir ne '' and $ref_dir ne 'heads' and $ref_dir ne 'remotes') {
                    $ref_item{'name'} .= ' (' . $ref_dir . ')';
                }

                $ref_item{'id'}    = $hash;
                $ref_item{'title'} = $title || '(no commit message)';
                $ref_item{'epoch'} = $epoch;
                if ($epoch) {
                        $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                } else {
                        $ref_item{'age'} = "unknown";
                }

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3760
# List the refs below refs/tags, most recently created first.
#
# With a true $limit at most $limit+1 tags are requested.  Returns a list
# of hash references (a reference to the list in scalar context), each
# with 'fullname', 'name', 'type', 'id', 'reftype' and 'refid'; tag
# objects also get 'subject', and tags and commits get 'epoch' and 'age'.
# Returns nothing when the git command cannot be started.
sub git_get_tags_list {
        my $limit = shift;
        my @tagslist;

        my @count_opt = $limit ? ('--count='.($limit+1)) : ();
        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count_opt, '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my ($creator, $epoch, $tz) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my %ref_item = (
                        'fullname' => $name,
                        'type'     => $type,
                        'id'       => $id,
                );
                $name =~ s!^refs/tags/!!;
                $ref_item{'name'} = $name;

                if ($type eq "tag") {
                        # tag object: report what it points at
                        @ref_item{'subject', 'reftype', 'refid'} = ($title, $reftype, $refid);
                } else {
                        # the ref points directly at the object
                        @ref_item{'reftype', 'refid'} = ($type, $id);
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = $epoch
                                ? age_string(time - $epoch)
                                : "unknown";
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3809
3810## ----------------------------------------------------------------------
3811## filesystem-related functions
3812
# Return the GECOS field, up to its first ',' or ';', of the user owning
# $path, passed through to_utf8().  Returns undef when $path cannot be
# stat()ed or the owning uid has no passwd entry with a GECOS field.
sub get_file_owner {
        my $path = shift;

        # stat() gives an empty list on failure; do not go on to look up
        # an undefined uid (which would be treated as uid 0)
        my @st = stat($path);
        return undef unless @st;

        my $st_uid = $st[4];
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3825
# Print the contents of $filename to the currently selected output handle,
# each line passed through to_utf8().
# The file is expected to exist; when it cannot be opened nothing is
# printed.
sub insert_file {
        my $filename = shift;

        # do not read from a handle that was never opened
        open my $fd, '<', $filename or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3834
3835## ......................................................................
3836## mimetype related functions
3837
# Look up the MIME type of $filename in the map file $mimemap, whose lines
# have the form "<mimetype> <ext> <ext> ..." ('#' starts a comment line).
# The extension is the text after the last '.' in $filename.
# Returns the MIME type, or undef if the map file is not readable, the
# file name has no extension, or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        while (my $line = <$mh>) {
                next if $line =~ m/^\s*#/; # skip comments
                # split ' ' ignores leading whitespace, so an indented entry
                # does not end up with an empty string as its MIME type
                my ($mimetype, @exts) = split(' ', $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        # use the capture only if this match succeeded; otherwise $1 would
        # still hold whatever an earlier, unrelated match left behind
        my ($ext) = $filename =~ /\.([^.]*)$/
                or return undef;
        return $mimemap{$ext};
}
3857
# Guess the MIME type of $filename from its extension.  The configured
# $mimetypes_file is consulted first (a relative path is taken relative to
# the current project directory), then /etc/mime.types.
# Returns undef for names without a '.' or when no map knows the extension.
sub mimetype_guess {
        my ($filename) = @_;
        return undef unless $filename =~ /\./;

        my $guess;
        if ($mimetypes_file) {
                # absolute paths are used as-is, anything else lives in the project
                my $map_path = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $guess = mimetype_guess_file($filename, $map_path);
        }
        unless ($guess) {
                $guess = mimetype_guess_file($filename, '/etc/mime.types');
        }
        return $guess;
}
3874
# Determine the MIME type of a blob given an open handle $fd on its contents
# and (optionally) its file name.  The extension maps are tried first; after
# that the -T text heuristic on the handle and a few well-known image
# extensions decide, with 'application/octet-stream' as the last resort.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case: without a handle there is nothing to inspect
        if (!$fd) {
                return $default_blob_plain_mimetype;
        }

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;

        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3901
# Return the Content-Type value for a blob.  $type, when given, is used
# instead of guessing via blob_mimetype(); 'text/plain' gets a charset
# parameter appended if $default_text_plain_charset is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return $type . "; charset=$default_text_plain_charset";
}
3912
3913# guess file syntax for syntax highlighting; return undef if no highlighting
3914# the name of syntax can (in the future) depend on syntax highlighter used
# Parameters: $highlight (true when highlighting is enabled) and $file_name.
# The base name, with a trailing '.in' removed, is looked up in
# %highlight_basename; failing that, its extension is looked up in
# %highlight_ext.  Returns the syntax name or undef.
sub guess_file_syntax {
        my ($highlight, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # take the extension from this match only: reading $1 after a failed
        # match would pick up a capture left over from an unrelated regexp
        my ($ext) = $basename =~ /\.([^.]*)$/;
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3929
3930# run highlighter and return FD of its output,
3931# or return original FD if no highlighting
# Parameters: $fd (open handle on the blob), $highlight (true when
# highlighting is enabled) and $syntax (syntax name, or undef to let the
# highlighter decide via --force).  The blob read is the one named by the
# global $hash.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        if (!$highlight) {
                return $fd;
        }

        close $fd;

        my $syntax_arg = defined($syntax) ? "--syntax $syntax" : "--force";

        # shell pipeline: blob contents | perl filter that decodes lines which
        # are not valid UTF-8 using $fallback_encoding | highlighter
        my $cat_cmd = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $recode_cmd =
                quote_command($^X, '-CO', '-MEncode=decode,FB_DEFAULT', '-pse',
                    '$_ = decode($fe, $_, FB_DEFAULT) if !utf8::decode($_);',
                    '--', "-fe=$fallback_encoding");
        my $highlight_cmd = quote_command($highlight_bin).
                  " --replace-tabs=8 --fragment $syntax_arg";

        my $pipeline = join(" | ", $cat_cmd, $recode_cmd, $highlight_cmd) . " |";
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3947
3948## ======================================================================
3949## functions printing HTML: header, footer, error page
3950
# Build the page title from the site name and, as far as they are defined,
# the project filter or the project, the action and the file name.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (!defined $project) {
                # project-less page: optionally mention the active filter
                $title .= " - projects in '" . esc_path($project_filter) . "'"
                        if defined $project_filter;
                return $title;
        }

        $title .= " - " . to_utf8($project);
        defined $action
                or return $title;

        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)
        defined $file_name
                or return $title;

        $title .= " - " . esc_path($file_name);
        # show directories with a trailing slash in tree view
        $title .= "/"
                if ($action eq "tree" && $file_name !~ m|/$|);

        return $title;
}
3973
# Choose the content type for HTML pages.
sub get_content_type_html {
        # 'application/xhtml+xml' is sent only when the UA names it explicitly
        # in its Accept header (and does not give it a zero preference);
        # everything else gets plain old 'text/html'.  This is needed because
        # MSIE sometimes globs '*/*', pretending to support xhtml+xml but
        # choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');
        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;

        return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3987
# Print the <link rel="alternate"> elements for the page head.  With a
# project selected these are the RSS and Atom feeds, each in a plain and a
# '--no-merges' variant; otherwise links to the projects list and the OPML
# feed list.  Generated URLs are attribute-escaped before being emitted.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my $title = esc_attr("$project - $href_params{'-title'} - $format feed");
                        $href_params{'action'} = $type;

                        # one link for the full feed, one for the feed without merges
                        foreach my $variant ([undef, ''], ['--no-merges', ' (no merges)']) {
                                my ($extra_options, $title_suffix) = @$variant;
                                $href_params{'extra_options'} = $extra_options;
                                # href() output goes into an attribute, so escape it
                                my $href = esc_attr(href(%href_params));
                                print "<link ".
                                      "rel=\"alternate\" ".
                                      "title=\"$title$title_suffix\" ".
                                      "href=\"$href\" ".
                                      "type=\"application/$type+xml\" ".
                                      "/>\n";
                        }
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name),
                       esc_attr(href(project=>undef, action=>"project_index")));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name),
                       esc_attr(href(project=>undef, action=>"opml")));
        }
}
4033
# Print the <link> elements of the page head: stylesheets, feed links
# (only for a '200 OK' page) and the favicon.
sub print_header_links {
        my ($status) = @_;

        # backwards compatibility: a $stylesheet defined in a config file
        # replaces the @stylesheets list; empty list entries are skipped
        my @sheets = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
        }
}
4053
# Print one breadcrumb link per path component passed in.  Each link leads
# to the project list filtered by the path accumulated so far and is
# followed by " / ".
sub print_nav_breadcrumbs_path {
        my $dirprefix = undef;
        # iterate over the arguments instead of testing the truth of each
        # shifted value, which would stop at a component named "0"
        foreach my $part (@_) {
                next unless defined $part && length $part;
                $dirprefix .= "/" if defined $dirprefix;
                $dirprefix .= $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => $dirprefix,
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
4065
# Print the breadcrumb trail: the extra breadcrumbs and the home link,
# then either the project path with the current action (plus the optional
# -action_extra text, printed as given) or the project filter path.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $action_extra = $opts{-action_extra};

        foreach my $crumb (@extra_breadcrumbs, [ $home_link_str => $home_link ]) {
                my ($label, $url) = @{$crumb}[0, 1];
                print $cgi->a({-href => esc_url($url)}, $label) . " / ";
        }

        if (defined $project) {
                my @path = split '/', $project;
                my $leaf = pop @path;
                print_nav_breadcrumbs_path(@path);
                print $cgi->a({-href => href(action=>"summary")}, esc_html($leaf));

                if (defined $action) {
                        # the action becomes a link only when something follows it
                        my $shown = defined $action_extra
                                ? $cgi->a({-href => href(action=>$action)}, $action)
                                : $action;
                        print " / $shown";
                }
                print " / $action_extra"
                        if defined $action_extra;
                print "\n";
        } elsif (defined $project_filter) {
                print_nav_breadcrumbs_path(split '/', $project_filter);
        }
}
4093
# Print the search form.  The hash searched from is $hash_base, else $hash,
# else "HEAD".  With the 'pathinfo' feature the project is part of the form
# action URL; otherwise it is passed in a hidden "p" field.
# Side effect: an undefined global $searchtext is set to "".
sub print_search_form {
        $searchtext = "" unless defined $searchtext;

        my $search_hash = defined $hash_base ? $hash_base
                        : defined $hash      ? $hash
                        :                      "HEAD";

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        my $form_url = $use_pathinfo
                ? $my_uri . "/" . esc_url($project)
                : $my_uri;

        # every CGI call below is kept in scalar context and in the original order
        my $head = $cgi->start_form(-method => "get", -action => $form_url);
        $head .= "<div class=\"search\">\n";
        if (!$use_pathinfo) {
                $head .= $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n";
        }
        $head .= $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n";
        $head .= $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n";
        $head .= $cgi->popup_menu(-name => 'st', -default => 'commit',
                                  -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']);
        $head .= " " . $cgi->a({-href => href(action=>"search_help"),
                                -title => "search help" }, "?") . " search:\n";

        my $tail = $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n";
        $tail .= "<span title=\"Extended regular expression\">";
        $tail .= $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                -checked => $search_use_regexp);
        $tail .= "</span>" . "</div>";
        $tail .= $cgi->end_form() . "\n";

        print $head, $tail;
}
4129
# Print the HTTP header (unless -no_http_header is set) and the top of the
# page: XML/DOCTYPE preamble, <head>, optional site header file, logo,
# breadcrumbs and, for project pages with the 'search' feature, the search
# form.  Parameters: status line (default "200 OK"), expiry, then options.
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        if ($ENV{'MOD_PERL'}) {
                $mod_perl_version = " $ENV{'MOD_PERL'}";
        }
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # relative stylesheet, favicon etc. URLs only resolve correctly with
        # path_info if the document states its base URL
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $cgi->img({-src => esc_url($logo),
                                         -width => 72, -height => 27,
                                         -alt => "git",
                                         -class => "logo"}));
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        if ($have_search && defined $project) {
                print_search_form();
        }
}
4188
# Print the bottom of the page: the footer div (project description and
# RSS/Atom links, or OPML/TXT links when no project is selected), timing
# information when the 'timed' feature is on, the optional site footer
# file, the JavaScript includes and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                if (defined $descr) {
                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
                }

                my %href_params = get_feed_info();
                if (!%href_params) {
                        $feed_class .= ' generic';
                }
                $href_params{'-title'} ||= 'log';

                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        } else {
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                # the URLs are built from the current request, so escape them
                # before embedding them in the inline script
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. esc_attr(href(action=>"blame_data", -replay=>1)) .qq!",\n!.
                      qq!           "!. esc_attr(href()) .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!;
                if (gitweb_check_feature('javascript-actions')) {
                        print qq!       fixLinks();\n!;
                }
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                print qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4267
4268# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
4269# Example: die_error(404, 'Hash not found')
4270# By convention, use the following status codes (as defined in RFC 2616):
4271# 400: Invalid or missing CGI parameters, or
4272#      requested object exists but has wrong type.
4273# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
4274#      this server or project.
4275# 404: Requested object/revision/project doesn't exist.
4276# 500: The server isn't configured properly, or
4277#      an internal error occurred (e.g. failed assertions caused by bugs), or
4278#      an unknown error occurred (e.g. the git binary died unexpectedly).
4279# 503: The server is currently unavailable (because it is overloaded,
4280#      or down for maintenance).  Generally, this is a temporary state.
# Print a complete error page (header, "<status> - <message>", optional
# extra HTML, footer) and then jump to DONE_GITWEB, unless the
# -error_handler option is set, in which case the sub simply returns.
# The message is HTML-escaped; $extra is printed as given.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # a code missing from the table must not reach git_header_html() as
        # undef: it would then fall back to "200 OK" for an error page
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4311
4312## ----------------------------------------------------------------------
4313## functions printing or outputting HTML: navigation
4314
# Print the page navigation bar.  $current is shown as plain text, $suppress
# is left out, $head / $treehead / $treebase supply hashes for the links, and
# $extra (pager or formats) is printed on a second line.  Entries from the
# 'actions' feature are inserted after the entry named by their position.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters for every entry
        my %arg;
        $arg{$_} = {action=>$_} foreach @navs;

        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                push @with_head, qw(shortlog log)
                        if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x);
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # placeholders that may appear in the links of custom actions
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        my @actions = gitweb_get_feature('actions');
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # put the new label right after every entry equal to $pos
                my @expanded;
                foreach my $nav (@navs) {
                        push @expanded, $nav;
                        push @expanded, $label if $nav eq $pos;
                }
                @navs = @expanded;

                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @links;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @links, $nav;
                        next;
                }
                push @links,
                        $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @links);
        print "<br/>\n$extra<br/>\n</div>\n";
}
4364
# returns a submenu for the navigation of the refs views (tags, heads,
4366# remotes) with the current view disabled and the remotes view only
4367# available if the feature is enabled
# $current names the view shown as plain text; every other view becomes
# a link.  The result is a single " | "-separated string.
sub format_ref_views {
        my ($current) = @_;

        my @views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @views, 'remotes';
        }

        my @items;
        foreach my $view (@views) {
                push @items, ($view eq $current)
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view);
        }
        return join(" | ", @items);
}
4377
# Return the "first / prev / next" pager.  The entries are links when
# $page > 0 (first, prev) or $has_next_link is true (next), plain text
# otherwise.  $action is accepted but not used here.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        # start from the inactive labels and upgrade them to links
        my ($first, $prev, $next) = ("first", "prev", "next");

        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                  -accesskey => "p", -title => "Alt-p"}, "prev");
        }
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
4403
4404## ......................................................................
4405## functions printing or outputting HTML: div
4406
# Print a <div class="header"> holding one link to $action (with $hash and
# $hash_base added when they are true).  The link text is $title, or
# $action when no title is given; it is printed as given.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (action => $action);
        $args{'hash'}      = $hash      if $hash;
        $args{'hash_base'} = $hash_base if $hash_base;

        my $label = $title || $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
4420
# Return one "metadata_url" table row with $name in the first cell and
# $url in the second.  Both values are inserted as given.
sub format_repo_url {
        my ($name, $url) = @_;
        return '<tr class="metadata_url"><td>' . $name .
               '</td><td>' . $url . "</td></tr>\n";
}
4425
4426# Group output by placing it in a DIV element and adding a header.
4427# Options for start_div() can be provided by passing a hash reference as the
4428# first parameter to the function.
4429# Options to git_print_header_div() can be provided by passing an array
4430# reference. This must follow the options to start_div if they are present.
4431# The content can be a scalar, which is output as-is, a scalar reference, which
4432# is output after html escaping, an IO handle passed either as *handle or
4433# *handle{IO}, or a function reference. In the latter case all following
4434# parameters will be taken as argument to the content function call.
# Argument order: optional hash reference (start_div options), optional
# array reference (git_print_header_div arguments), the content, then any
# arguments for a content function.
sub git_print_section {
        # the two leading options are recognised by their reference type
        my $div_args    = (ref($_[0]) eq 'HASH')  ? shift(@_) : undef;
        my $header_args = (ref($_[0]) eq 'ARRAY') ? shift(@_) : undef;
        my $content     = shift(@_);

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        my $kind = ref($content);
        if ($kind eq 'CODE') {
                # whatever is left in @_ belongs to the content function
                $content->(@_);
        } elsif ($kind eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($kind eq 'GLOB' or $kind eq 'IO::Handle') {
                print <$content>;
        } elsif (!$kind && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4463
# Format a parsed date (hash reference) as HTML: the RFC 2822 string,
# wrapped in a span when the 'javascript-timezone' feature supplies a class,
# followed by the local time in parentheses.  Local hours before 6 are
# marked with the "atnight" class.
sub format_timestamp_html {
        my ($date) = @_;

        # only the third value of the feature (the CSS class) matters here
        my $datetime_class = (gitweb_get_feature('javascript-timezone'))[2];

        my $stamp = $date->{'rfc2822'};
        $stamp = qq!<span class="$datetime_class">$stamp</span>!
                if $datetime_class;

        my ($hour, $minute, $tz) = @{$date}{qw(hour_local minute_local tz_local)};
        my $clock_format = ($hour < 6)
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';

        return $stamp . ' ' . sprintf($clock_format, $hour, $minute, $tz);
}
4484
4485# Outputs the author name and date in long form
# Parameters: the commit hash reference, then options.  -tag selects the
# enclosing element (default 'div').  The element contains the author name
# as a search link, the author date in brackets and the avatar.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $name_html   = format_search_author($author, "author", esc_html($author));
        my $when_html   = format_timestamp_html(\%ad);
        my $avatar_html = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">$name_html [$when_html]$avatar_html</$tag>\n";
}
4499
4500# Outputs table rows containing the full author or committer information,
4501# in the format expected for 'commit' view (& similar).
4502# Parameters are a commit hash reference, followed by the list of people
4503# to output information for. If the list is empty it defaults to both
4504# author and committer.
# For every person two rows are printed: name and e-mail (both search
# links) next to a double-size avatar spanning both rows, then the date.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        # an empty list means "everybody"
        @people = ('author', 'committer') if !@people;

        for my $who (@people) {
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link  = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');
                my $when   = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>$name_link $email_link" .
                      "</td><td rowspan=\"2\">$avatar</td></tr>\n" .
                      "<tr><td></td><td>$when</td></tr>\n";
        }
}
4527
# Print the "page_path" div: a link to the tree root followed by one tree
# link per directory of $name.  The last component links to blob_plain when
# $type is 'blob', to the tree when $type is 'tree', and is plain text
# otherwise.  $hb is the hash base used in all links.
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth value: a directory
                        # named "0" is a valid, non-empty prefix
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # link to the path that was passed in (and is shown in the
                # title), not to the global $file_name
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4565
# Print the lines of a commit message ($log is an array reference, which is
# modified: the title and leading empty lines are shifted off).
# Options:
#   -remove_title      drop the first line of the message
#   -remove_signoff    do not print signoff-style and "link:" lines
#   -final_empty_line  end the output with a single empty line
# Runs of empty lines are collapsed into one, and no empty line is printed
# right after a signoff or link line.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $skip_blank_line = 0;
        foreach my $line (@$log) {
                if ($line =~ m/^\s*([A-Z][-A-Za-z]*-[Bb]y|C[Cc]): /) {
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                                $skip_blank_line = 1;
                        }
                        next;
                }

                # "Link: <url>" style lines.  The pattern is anchored at the
                # start of the line, like the signoff pattern above, so that
                # ordinary sentences mentioning "link: http://..." are printed
                # in full; text after the URL is kept instead of dropped.
                if (my ($label, $url, $rest) =
                    $line =~ m,^\s*([a-z]*link): (https?://\S+)(.*)$,i) {
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($label) . ": " .
                                        "<a href=\"" . esc_html($url) . "\">" . esc_html($url) . "</a>" .
                                        esc_html($rest) .
                                        "</span><br/>\n";
                                $skip_blank_line = 1;
                        }
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($skip_blank_line);
                        $skip_blank_line = 1;
                } else {
                        $skip_blank_line = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $skip_blank_line;
        }
}
4617
# Return the target of a symbolic link (what the link points to), which
# is the whole contents of blob $hash as printed by 'cat-file blob';
# return nothing if the command cannot be started or fails.
sub git_get_link_target {
        my $hash = shift;

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;

        # slurp everything in one go; record separator is restored
        # as soon as the do-block is left
        my $link_target = do {
                local $/ = undef;
                <$fd>;
        };

        # failure on close means that the command itself failed
        close $fd
                or return;

        return $link_target;
}
4635
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return nothing (undef in scalar context) if it is not possible,
# which includes absolute links and links leading outside top directory.
#
# $link_target - contents of symbolic link
# $basedir     - directory the link is in; empty or undefined means
#                top (root) tree
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # compare against empty string explicitly, because directory
        # named '0' is false in boolean context
        my $path;
        if (defined $basedir && $basedir ne '') {
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and ''; do not use plain truth test here,
                # as it would also discard path component named '0'
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        if (@path_parts) {
                                pop @path_parts;
                        } else {
                                # link leads outside repository (outside top dir)
                                return;
                        }
                } else {
                        push @path_parts, $part;
                }
        }
        $path = join('/', @path_parts);

        return $path;
}
4675
# Print the cells of one tree entry (one row of git_tree); the encompassing
# <tr> element has to be provided by the caller.
#
# $t          - hashref describing the entry; keys read here are 'mode',
#               'type', 'hash', 'name' and (optionally) 'size'
# $basedir    - prefix put verbatim in front of entry name to get file_name
# $hash_base  - passed as hash_base to links; may be undefined
# $have_blame - if true, "blame" link is printed for blobs
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my $type = $t->{'type'};
        my $name = $t->{'name'};
        my $path = "$basedir$name";

        # hash_base parameter is added to links only if we have it
        my %base_param = defined $hash_base ? ('hash_base' => $hash_base) : ();

        # The cells of a row are: mode, [size,] list, link.  Where mode is
        # the mode of the entry, list is the name of the entry (an href),
        # and link holds the action links of the entry.

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        if ($type eq "blob") {
                print "<td class=\"list\">" .
                      $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                             file_name=>$path, %base_param),
                               -class => "list"}, esc_path($name));

                # for symbolic link show also what it points to
                my $link_target;
                $link_target = git_get_link_target($t->{'hash'})
                        if S_ISLNK(oct $t->{'mode'});
                if ($link_target) {
                        my $norm_target = normalize_link_target($link_target, $basedir);
                        # target is made a link only if it could be normalized
                        my $target_html = defined $norm_target
                                ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                         file_name=>$norm_target),
                                           -title => $norm_target}, esc_path($link_target))
                                : esc_path($link_target);
                        print " -> " . $target_html;
                }

                # action links, joined with " | " below
                my @actions = (
                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                               file_name=>$path, %base_param)},
                                "blob"),
                );
                if ($have_blame) {
                        push @actions,
                             $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                    file_name=>$path, %base_param)},
                                     "blame");
                }
                if (defined $hash_base) {
                        push @actions,
                             $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                    hash=>$t->{'hash'}, file_name=>$path)},
                                     "history");
                }
                push @actions,
                     $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                            file_name=>$path)},
                             "raw");

                print "</td>\n" .
                      "<td class=\"link\">" . join(" | ", @actions) . "</td>\n";

        } elsif ($type eq "tree") {
                my @actions = (
                        $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                               file_name=>$path,
                                               %base_param)},
                                "tree"),
                );
                if (defined $hash_base) {
                        push @actions,
                             $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                    file_name=>$path)},
                                     "history");
                }

                print "<td class=\"list\">" .
                      $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                             file_name=>$path,
                                             %base_param)},
                              esc_path($name)) .
                      "</td>\n";
                print "<td class=\"link\">" . join(" | ", @actions) . "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                my $history = '';
                if (defined $hash_base) {
                        $history = $cgi->a({-href => href(action=>"history",
                                                          hash_base=>$hash_base,
                                                          file_name=>$path)},
                                           "history");
                }

                print "<td class=\"list\">" .
                      esc_path($name) .
                      "</td>\n";
                print "<td class=\"link\">" . $history . "</td>\n";
        }
}
4768
4769## ......................................................................
4770## functions printing large fragments of HTML
4771
# Fill in pre-image filenames for merge (combined) diff.
#
# Sets $diff->{'from_file'} to a list with one slot per parent; the slot is
# looked up with git_get_path_by_hash() for parents where the file was
# renamed ('R') or copied ('C'), and left undefined for all other parents.
# Returns $diff itself.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $last_parent = $diff->{'nparents'} - 1;

        # start with list of the right length, holding only undefined values
        $diff->{'from_file'} = [ ];
        $diff->{'from_file'}[$last_parent] = undef;

        foreach my $i (0 .. $last_parent) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $diff->{'from_file'}[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4788
# is current raw difftree line of file deletion, i.e. is 'to_id' of
# $diffinfo (hashref of parsed raw diff format) the null object id;
# both the 40 hexdigit (SHA-1) and the 64 hexdigit (SHA-256) form
# of the null id are recognized
sub is_deleted {
        my $diffinfo = shift;

        return $diffinfo->{'to_id'} eq ('0' x 40)
            || $diffinfo->{'to_id'} eq ('0' x 64);
}
4795
# Check whether patch and [previous] difftree raw line are about the
# same post-image file, i.e. whether both are defined and their 'to_file'
# entries are equal.
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        # nothing to compare unless we have both of them
        my $have_both = defined($diffinfo) && defined($patchinfo);

        return $have_both
                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4806
4807
# Print list of changed files (difftree) as HTML table, one row per file.
#
# $difftree - arrayref of raw difftree lines; each of them is parsed
#             with parsed_difftree_line()
# $hash     - hash of commit being shown; used as hash_base in links
#             to post-image (result) files
# @parents  - hashes of parent commit(s); the first one is used as hash_base
#             in links to pre-image files of ordinary diff, and more than
#             one parent selects "combined" CSS class of the table
#
# A line is shown in combined diff layout if its parsed form has 'nparents'
# key.  Global $action decides if row links to "patch" anchor on the same
# page ('commitdiff' view), or to "diff" ('blobdiff' action, other views).
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1; # rows alternate between "dark" and "light" class
        my $patchno = 0;   # number of patch, used in "patchN" anchors
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent, and gather what to put in last cell
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # all-zeros mode means that there is no file on given side,
                # and then variables for that side are left undefined
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # file exists only in parent, so links use $parent as hash_base
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # 'to_id' and 'to_file' describe the file in the result (child)
                        # commit, so hash_base has to be $hash, like in the link in the
                        # first cell; new name might not exist in $parent at all
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
5115
# Print context lines, and after them removed/added lines, side by side:
# each block has "old" column on the left and "new" column on the right.
# $ctx, $rem and $add are arrayrefs of already formatted lines.
sub print_sidebyside_diff_lines {
        my ($ctx, $rem, $add) = @_;

        # helpers wrapping given lines in the markup of single column
        my $old_column = sub { return ('<div class="old">', @{$_[0]}, '</div>') };
        my $new_column = sub { return ('<div class="new">', @{$_[0]}, '</div>') };

        # context block goes before add/rem block, with the same
        # lines in both columns
        if (@$ctx) {
                print join('',
                        '<div class="chunk_block ctx">',
                        $old_column->($ctx),
                        $new_column->($ctx),
                        '</div>');
        }

        my @block;
        if (!@$add) {
                # pure removal: only "old" column
                @block = ('<div class="chunk_block rem">', $old_column->($rem));
        } elsif (!@$rem) {
                # pure addition: only "new" column
                @block = ('<div class="chunk_block add">', $new_column->($add));
        } else {
                # change: both columns
                @block = ('<div class="chunk_block chg">',
                          $old_column->($rem), $new_column->($add));
        }
        print join('', @block, '</div>');
}
5161
# Print lines of inline (unified) diff: all context lines first, then
# all removed lines, and then all added lines.
# $ctx, $rem and $add are arrayrefs of already formatted lines.
sub print_inline_diff_lines {
        my ($ctx, $rem, $add) = @_;

        my @lines = (@{$ctx}, @{$rem}, @{$add});
        print @lines;
}
5168
# Format one removed line together with the added line that replaces it,
# wrapping the part that differs between the two in a 'marked' region.
# The approach follows contrib/diff-highlight: strip the longest common
# prefix and the longest common suffix; what remains is the change.
#
# $rem, $add   - raw diff lines, still carrying their leading +/- columns
# $num_parents - number of leading +/- status columns to skip
#
# Returns the pair (formatted removed line, formatted added line).
sub format_rem_add_lines_pair {
        my ($rem, $add, $num_parents) = @_;

        # Tabs must be expanded before the lines are cut into characters,
        # or the offsets computed below would not match the escaped text.
        chomp $rem;
        chomp $add;
        $rem = untabify($rem);
        $add = untabify($add);

        my @rem_chars = split(//, $rem);
        my @add_chars = split(//, $add);
        my $min_len = (scalar(@rem_chars) < scalar(@add_chars))
                ? scalar(@rem_chars)
                : scalar(@add_chars);

        # Common prefix.  The per-parent +/- columns are skipped, not compared.
        my $prefix_len = $num_parents;
        my $prefix_has_nonspace;
        while ($prefix_len < $min_len &&
               $rem_chars[$prefix_len] eq $add_chars[$prefix_len]) {
                $prefix_has_nonspace = 1 if ($rem_chars[$prefix_len] !~ /\s/);
                $prefix_len++;
        }

        # Common suffix, counted from the end; it may not overlap the prefix.
        my $suffix_len = 0;
        my $suffix_has_nonspace;
        while ($prefix_len + $suffix_len < $min_len &&
               $rem_chars[-1 - $suffix_len] eq $add_chars[-1 - $suffix_len]) {
                $suffix_has_nonspace = 1 if ($rem_chars[-1 - $suffix_len] !~ /\s/);
                $suffix_len++;
        }

        # Mark the changed part only if the two lines share something that is
        # not whitespace.  Marking completely different lines would only make
        # the output harder to read, especially in multi-line changes.
        my ($esc_rem, $esc_add);
        if ($prefix_has_nonspace || $suffix_has_nonspace) {
                my $rem_end = scalar(@rem_chars) - $suffix_len;
                my $add_end = scalar(@add_chars) - $suffix_len;
                $esc_rem = esc_html_hl_regions($rem, 'marked',
                        [$prefix_len, $rem_end], -nbsp=>1);
                $esc_add = esc_html_hl_regions($add, 'marked',
                        [$prefix_len, $add_end], -nbsp=>1);
        } else {
                $esc_rem = esc_html($rem, -nbsp=>1);
                $esc_add = esc_html($add, -nbsp=>1);
        }

        # the escaped lines are handed over as scalar references
        return format_diff_line(\$esc_rem, 'rem'),
               format_diff_line(\$esc_add, 'add');
}
5220
# HTML-format the context, removed and added lines of one diff block.
#
# $ctx, $rem, $add - array references of raw diff lines
# $num_parents     - number of parents; more than one means combined diff
#
# When every removed line pairs up with an added line, the pairs are sent
# through format_rem_add_lines_pair(); otherwise each line is passed to
# format_diff_line() on its own.
#
# Returns three array references: formatted context, removed, added lines.
sub format_ctx_rem_add_lines {
        my ($ctx, $rem, $add, $num_parents) = @_;

        # Pairwise highlighting needs a removed line for every added line.
        my $can_highlight = (@$add > 0 && @$add == @$rem) ? 1 : 0;

        # In a combined diff, highlight only if each pair is a change against
        # the same version, e.g.
        #
        #    - a
        #   -  b
        #    + c
        #   +  d
        #
        # Otherwise the highlighting would be confusing.
        if ($can_highlight && $num_parents > 1) {
                foreach my $idx (0 .. $#$add) {
                        my $rem_columns = substr($rem->[$idx], 0, $num_parents);
                        my $add_columns = substr($add->[$idx], 0, $num_parents);

                        # a '-' column on the removed side has to be
                        # a '+' column on the added side
                        (my $expected = $rem_columns) =~ tr/-/+/;
                        next if ($expected eq $add_columns);

                        $can_highlight = 0;
                        last;
                }
        }

        my (@fmt_rem, @fmt_add);
        if ($can_highlight) {
                foreach my $idx (0 .. $#$add) {
                        my ($rem_html, $add_html) = format_rem_add_lines_pair(
                                $rem->[$idx], $add->[$idx], $num_parents);
                        push @fmt_rem, $rem_html;
                        push @fmt_add, $add_html;
                }
        } else {
                @fmt_rem = map { format_diff_line($_, 'rem') } @$rem;
                @fmt_add = map { format_diff_line($_, 'add') } @$add;
        }

        my @fmt_ctx = map { format_diff_line($_, 'ctx') } @$ctx;

        return (\@fmt_ctx, \@fmt_rem, \@fmt_add);
}
5272
# Format the collected context / removed / added lines and print them in
# the requested layout.
#
# $ctx, $rem, $add - array references of raw diff lines
# $diff_style      - 'sidebyside' selects the two-column layout
# $num_parents     - number of parents; more than one means combined diff
sub print_diff_lines {
        my ($ctx, $rem, $add, $diff_style, $num_parents) = @_;
        my $is_combined = ($num_parents > 1);

        ($ctx, $rem, $add) =
                format_ctx_rem_add_lines($ctx, $rem, $add, $num_parents);

        # Side-by-side is used only when asked for and never for a combined
        # diff; the 'inline' style and any unknown style name print inline.
        my $printer = ($diff_style eq 'sidebyside' && !$is_combined)
                ? \&print_sidebyside_diff_lines
                : \&print_inline_diff_lines;

        $printer->($ctx, $rem, $add);
}
5288
# Print one diff chunk: its header line followed by its body.
#
# $diff_style  - layout name, handed on to print_diff_lines()
# $num_parents - number of parents, handed on to print_diff_lines()
# $from, $to   - handed on to format_diff_line() for the chunk header
# @chunk       - list of [ $class, $line ] pairs making up the chunk
#
# Body lines are collected into context / removed / added accumulators,
# which are flushed through print_diff_lines() at block boundaries.
sub print_diff_chunk {
        my ($diff_style, $num_parents, $from, $to, @chunk) = @_;

        return unless @chunk;

        # An 'incomplete' line may follow a removed, an added or a context
        # line: give it the class of the line right before it.
        foreach my $idx (1 .. $#chunk) {
                next unless ($chunk[$idx][0] eq 'incomplete');
                $chunk[$idx][0] = $chunk[$idx-1][0];
        }

        # accumulators, and the accumulator each line class is collected in
        my (@ctx, @rem, @add);
        my %bucket_for = ('ctx' => \@ctx, 'rem' => \@rem, 'add' => \@add);

        # class of the line handled by the previous iteration
        my $prev_class = '';

        # the trailing ["", ""] entry is a sentinel that forces the last flush
        foreach my $entry (@chunk, ["", ""]) {
                my ($class, $line) = @$entry;

                # the chunk header goes straight to the output
                if ($class && $class eq 'chunk_header') {
                        print format_diff_line($line, $class, $from, $to);
                        next;
                }

                # Flush the accumulators
                #  - at the end of the chunk (sentinel), or
                #  - when context resumes after some removed/added lines, or
                #  - when both removed and added lines are held and the class
                #    changes (otherwise add/rem lines could get reordered).
                if (!$class ||
                    ((@rem || @add) && $class eq 'ctx') ||
                    (@rem && @add && $class ne $prev_class)) {
                        print_diff_lines(\@ctx, \@rem, \@add,
                                         $diff_style, $num_parents);
                        @$_ = () foreach (\@ctx, \@rem, \@add);
                }

                # sentinel reached (its line is empty): nothing left to collect
                last unless $line;

                # lines of any other class are not collected
                push @{$bucket_for{$class}}, $line
                        if (exists $bucket_for{$class});

                $prev_class = $class;
        }
}
5346
# Read patch text ("git diff" output) from $fd and print it as an HTML
# patchset, one <div class="patch"> per patch.
#
# $fd           - filehandle the patch text is read from
# $diff_style   - layout name, handed on to print_diff_chunk()
# $difftree     - array reference; its entries are given to
#                 parsed_difftree_line(), one entry per raw difftree line
# $hash         - accepted but not used by this routine
# @hash_parents - parent ids; more than one means a combined diff
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

        my $num_parents = scalar @hash_parents;
        my $is_combined = ($num_parents > 1);
        my $patch_idx = 0;      # index into @$difftree
        my $patch_number = 0;   # number of patch blocks printed so far
        my ($patch_line, $diffinfo, $to_name);
        my (%from, %to);
        my @chunk;              # [ class, line ] pairs of the current chunk

        # Prints the placeholder block for a raw difftree entry that has no
        # patch text of its own; uses the current $patch_idx and $diffinfo.
        my $print_simplified_patch = sub {
                print qq{<div class="patch" id="patch} . ($patch_idx+1) . qq{">\n} .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"
        };

        print qq{<div class="patchset">\n};

        # skip everything in front of the first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # take the name of the resulting file from the "git diff" header
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which is not needed
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which is not needed
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # does this patch still belong to the current raw line?
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # yes: continuation of a split patch
                        print qq{<div class="patch cont">\n};
                } else {
                        # no: move on to the next raw line (except the very
                        # first time, when none has been read yet) and parse it
                        $patch_idx++ if defined $diffinfo;
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # Compact combined diff output can leave patches out.
                        # Walk the raw lines, printing a placeholder for each,
                        # until the one matching this patch's file name.
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        $print_simplified_patch->();

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # fills in %from and %to
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # First patch for the raw line at $patch_idx; @$difftree
                        # is indexed from 0 while patches are numbered from 1.
                        print qq{<div class="patch" id="patch} . ($patch_idx+1) . qq{">\n};
                }

                # "git diff" header line; $patch_line is chomp-ed
                # and starts with "diff " at this point
                $patch_number++;
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # extended diff header: everything up to "--- " or the next patch
                print qq{<div class="diff extended_header">\n};
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # input ran out: close the patch here, because leaving the
                # loop with 'last' does not run the continue block below
                if (! $patch_line) {
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                # patch without a body, the next one starts right away
                next PATCH if ($patch_line =~ m/^diff /);

                # from-file/to-file header: the "---" line just read
                # and the line that follows it
                my $from_line = $patch_line;
                $patch_line = <$fd>;
                chomp $patch_line;

                print format_diff_from_to_header($from_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch body: collect lines, printing a chunk whenever
                # the header of the next chunk shows up
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        my $class = diff_line_class($patch_line, \%from, \%to);

                        if ($class eq 'chunk_header') {
                                print_diff_chunk($diff_style, $num_parents, \%from, \%to, @chunk);
                                @chunk = ();
                        }

                        push @chunk, [ $class, $patch_line ];
                }

        } continue {
                # print whatever is left of the last chunk and close the patch
                if (@chunk) {
                        print_diff_chunk($diff_style, $num_parents, \%from, \%to, @chunk);
                        @chunk = ();
                }
                print "</div>\n"; # class="patch"
        }

        # For the compact combined (--cc) format, with chunk and patch
        # simplification, the patchset may be empty while raw lines remain
        # unprocessed; print a placeholder for each of them.
        $patch_idx++ if ($patch_number > 0);
        while ($patch_idx < @$difftree) {
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # anchor for the "patch" links in the difftree / whatchanged part
                $print_simplified_patch->();

                $patch_number++;
                $patch_idx++;
        }

        if ($patch_number == 0) {
                if ($is_combined) {
                        print qq{<div class="diff nodifferences">Trivial merge</div>\n};
                } else {
                        print qq{<div class="diff nodifferences">No differences found</div>\n};
                }
        }

        print "</div>\n"; # class="patchset"
}
5509
5510# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5511
# Print the project search form: a text field, an "re" checkbox, a submit
# button, and a link that lists all projects again.
#
# $searchtext        - value put into the search text field
# $search_use_regexp - value for the -checked state of the "re" checkbox
#
# Reads the globals $project_filter, $cgi and $my_uri.
sub git_project_search_form {
        my ($searchtext, $search_use_regexp) = @_;

        # mention an active project filter in the tooltip and in the link text
        my $limit = $project_filter ? " in '$project_filter/'" : '';

        print qq{<div class="projsearch">\n};
        print $cgi->start_form(-method => 'get', -action => $my_uri) .
              $cgi->hidden(-name => 'a', -value => 'project_list')  . "\n";
        if (defined $project_filter) {
                print $cgi->hidden(-name => 'pf', -value => $project_filter). "\n";
        }

        my $text_field = $cgi->textfield(
                -name  => 's',
                -value => $searchtext,
                -title => "Search project by name and description$limit",
                -size  => 60);
        my $re_checkbox = $cgi->checkbox(
                -name    => 'sr',
                -value   => 1,
                -label   => 're',
                -checked => $search_use_regexp);
        my $submit_button = $cgi->submit(-name => 'btnS', -value => 'Search');
        my $form_end = $cgi->end_form();
        my $list_all_link = $cgi->a(
                {-href => href(project => undef, searchtext => undef,
                               project_filter => $project_filter)},
                esc_html("List all projects$limit"));

        print $text_field . "\n" .
              qq{<span title="Extended regular expression">} .
              $re_checkbox .
              "</span>\n" .
              $submit_button .
              $form_end . "\n" .
              $list_all_link . "<br />\n";
        print "</div>\n";
}
5539
# Tell whether a project entry still lacks any of the given fields.
#
# $project_info - hash reference describing one project
# @keys         - field names to look for
#
# Returns 1 if at least one of @keys does not exist in %$project_info
# (a key whose value is undef still counts as present); otherwise returns
# nothing, i.e. an empty list in list context and undef in scalar context.
sub project_info_needs_filling {
        my ($project_info, @keys) = @_;

        my @missing = grep { !exists $project_info->{$_} } @keys;

        return 1 if @missing;
        return;
}
5553
# Fill in project info (age, description, owner, category, ctags) for each
# project of the list, either every field or only the requested ones.
#
# $projlist    - array reference of project hash references
# @wanted_keys - field names to fill; when empty, all fields are filled
#
# A project is dropped from the RETURNED list only when 'age' or
# 'age_string' has to be filled and git_get_last_activity() returns
# nothing for it; no other field leads to a project being dropped.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   ensures that the 'descr_long' and 'ctags' fields are filled
# * @project_list = fill_project_list_info(\@project_list)
#   ensures that all fields are filled (and invalid projects removed)
#
# NOTE: the hashes in @$projlist are modified in place, but @$projlist
# itself keeps all of its entries.
sub fill_project_list_info {
        my ($projlist, @wanted_keys) = @_;

        # $filter_set narrows a list of field names down to the wanted ones;
        # without @wanted_keys it lets every name through
        my %is_wanted = map { $_ => 1 } @wanted_keys;
        my $filter_set = @wanted_keys
                ? sub { return grep { $is_wanted{$_} } @_; }
                : sub { return @_; };

        my $show_ctags = gitweb_check_feature('ctags');
        my @filled;

 PROJECT:
        foreach my $pr (@$projlist) {
                my $path = $pr->{'path'};

                if (project_info_needs_filling($pr, $filter_set->('age', 'age_string'))) {
                        my @activity = git_get_last_activity($path);
                        # nothing returned: leave this project out of the result
                        @activity or next PROJECT;
                        ($pr->{'age'}, $pr->{'age_string'}) = @activity;
                }

                if (project_info_needs_filling($pr, $filter_set->('descr', 'descr_long'))) {
                        my $descr = to_utf8(git_get_project_description($path) || "");
                        $pr->{'descr_long'} = $descr;
                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }

                if (project_info_needs_filling($pr, $filter_set->('owner'))) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }

                # ctags are looked up only when the 'ctags' feature is on
                if ($show_ctags &&
                    project_info_needs_filling($pr, $filter_set->('ctags'))) {
                        $pr->{'ctags'} = git_get_project_ctags($path);
                }

                # categories are looked up only when grouping is configured
                if ($projects_list_group_categories &&
                    project_info_needs_filling($pr, $filter_set->('category'))) {
                        my $category = git_get_project_category($path) ||
                                       $project_list_default_category;
                        $pr->{'category'} = to_utf8($category);
                }

                push @filled, $pr;
        }

        return @filled;
}
5614
# Build a sort comparator that orders project hashes by the string value
# of field $key.  The returned sub reads sort's $a and $b.
sub order_str {
        my $key = shift;
        return sub { $a->{$key} cmp $b->{$key} };
}

# Build a sort comparator that orders project hashes numerically by field
# $key, placing entries where the field is undefined after all the others.
# The returned sub reads sort's $a and $b.
sub order_num_then_undef {
        my $key = shift;
        return sub {
                my ($left, $right) = ($a->{$key}, $b->{$key});

                return (defined $right ? 1 : 0) unless defined $left;
                return defined $right ? $left <=> $right : -1;
        };
}

# Return the projects of @$projlist sorted according to $order.
#
# $projlist - array reference of project hash references
# $order    - one of 'project', 'descr', 'owner' or 'age'
#
# For any other $order the projects are returned in their original order.
sub sort_projects_list {
        my ($projlist, $order) = @_;

        my %comparator_for = (
                'project' => order_str('path'),
                'descr'   => order_str('descr_long'),
                'owner'   => order_str('owner'),
                'age'     => order_num_then_undef('age'),
        );

        my $compare = $comparator_for{$order};
        return @$projlist unless defined $compare;
        return sort $compare @$projlist;
}
5642
# Group projects by the value of their 'category' field.
#
# $projlist  - array reference of project hash references
# $from, $to - first and last index to take from @$projlist; $from
#              defaults to 0, and $to is limited to the last valid index
#
# Returns a hash mapping each category to an array reference of its
# projects: as a hash in list context, as a hash reference otherwise.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        $from = 0 if (!defined $from);
        if (!defined $to || $to > $#$projlist) {
                $to = $#$projlist;
        }

        my %projects_in;
        foreach my $idx ($from .. $to) {
                my $project = $projlist->[$idx];
                push @{ $projects_in{ $project->{'category'} } }, $project;
        }

        return %projects_in if wantarray;
        return \%projects_in;
}
5659
# Print a 'sort by' <th> element.  All arguments are handed unchanged to
# format_sort_th(), which produces the markup.
sub print_sort_th {
        my $th_html = format_sort_th(@_);
        print $th_html;
}
5665
# Build a 'sort by' <th> element for a column of a sortable table.
#
# $name   - name of the ordering this column stands for
# $order  - name of the ordering currently in effect
# $header - text of the heading; defaults to $name with its first
#           letter upper-cased
#
# Returns the <th> markup: a plain heading when the table is already
# ordered by $name, otherwise a replay link that selects that ordering.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # already sorted by this column: no link
        return "<th>$header</th>\n" if ($order eq $name);

        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
5682
# Print the <tr> rows of the projects list table.
#
# $projlist    - array reference of project hash references
# $from, $to   - first and last index to print; $from defaults to 0 and
#                $to is limited to the last valid index
# $check_forks - when true, each row starts with a forks marker cell
#
# Reads the globals $cgi, $search_regexp, $omit_owner and $omit_age_column.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 if (!defined $from);
        if (!defined $to || $to > $#$projlist) {
                $to = $#$projlist;
        }

        my $row = 0;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];

                # URL of a given action for the project of this row
                my $action_href = sub {
                        return href(project=>$pr->{'path'}, action=>$_[0]);
                };

                # rows alternate between "dark" and "light", starting dark
                my $row_class = ($row++ % 2) ? 'light' : 'dark';
                print "<tr class=\"$row_class\">\n";

                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                my $nforks = scalar @{$pr->{'forks'}};
                                my $title = "$nforks forks";
                                # "+" links to the forks page only if there are forks
                                my $marker = ($nforks > 0)
                                        ? $cgi->a({-href => $action_href->("forks"),
                                                   -title => $title}, "+")
                                        : $cgi->span({-title => $title}, "+");
                                print $marker;
                        }
                        print "</td>\n";
                }

                # name and description cells, both linking to the summary page;
                # matches are highlighted while a search is in effect
                my $name_link = $cgi->a(
                        {-href => $action_href->("summary"),
                         -class => "list"},
                        esc_html_match_hl($pr->{'path'}, $search_regexp));
                my $descr_link = $cgi->a(
                        {-href => $action_href->("summary"),
                         -class => "list",
                         -title => $pr->{'descr_long'}},
                        $search_regexp
                        ? esc_html_match_hl_chopped($pr->{'descr_long'},
                                                    $pr->{'descr'}, $search_regexp)
                        : esc_html($pr->{'descr'}));
                print "<td>" . $name_link . "</td>\n" .
                      "<td>" . $descr_link . "</td>\n";

                if (!$omit_owner) {
                        print "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
                }
                if (!$omit_age_column) {
                        my $age_text = defined $pr->{'age_string'}
                                ? $pr->{'age_string'}
                                : "No commits";
                        print "<td class=\"". age_class($pr->{'age'}) . "\">" .
                              $age_text . "</td>\n";
                }

                # action links; "forks" is appended only for projects with forks info
                print "<td class=\"link\">" .
                      $cgi->a({-href => $action_href->("summary")}, "summary")   . " | " .
                      $cgi->a({-href => $action_href->("shortlog")}, "shortlog") . " | " .
                      $cgi->a({-href => $action_href->("log")}, "log") . " | " .
                      $cgi->a({-href => $action_href->("tree")}, "tree") .
                      ($pr->{'forks'} ? " | " . $cgi->a({-href => $action_href->("forks")}, "forks") : '') .
                      "</td>\n" .
                      "</tr>\n";
        }
}
5742
# Print the projects list table: optional tag cloud, optional header row
# with 'sort by' links, the project rows (optionally grouped by category)
# and an optional trailing row.
#
# $projlist   - array reference of project hash references
# $order      - name of the ordering; defaults to $default_projects_order
# $from, $to  - first and last index of the window of projects to show,
#               counted in the filtered and sorted list; $from defaults to
#               0 and $to is limited to the last valid index
# $extra      - if defined, printed as is (not escaped) in a last table row
# $no_header  - when true, the header row is left out
#
# Prints a "No such projects found" note instead of the table when the
# window is empty.
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
        # forks are not folded into their parent while searching or filtering
        $check_forks = undef
                if ($tagfilter || $search_regexp);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        # search_projects_list pre-fills required info
        @projects = search_projects_list(\@projects,
                                         'search_regexp' => $search_regexp,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $search_regexp);
        # fill the rest
        my @all_fields = ('descr', 'descr_long', 'ctags', 'category');
        push @all_fields, ('age', 'age_string') unless($omit_age_column);
        push @all_fields, 'owner' unless($omit_owner);
        @projects = fill_project_list_info(\@projects, @all_fields);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner') unless $omit_owner;
                print_sort_th('age', $order, 'Last Change') unless $omit_age_column;
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                my @window = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @window already holds just the requested range, so all of it
                # is grouped.  Passing $from/$to on would index the shortened
                # list with offsets meant for the full one and drop rows
                # whenever $from is greater than 0.
                my %categories = build_projlist_by_category(\@window);
                foreach my $cat (sort keys %categories) {
                        # projects with an empty category get no heading row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5833
# Print the body of the 'log' view: for each commit in the window a header,
# a links / authorship block and the full commit message.
#
# $commitlist - array reference of commit hash references
# $from, $to  - first and last index of @$commitlist to print; $from
#               defaults to 0 and $to is limited to the last valid index
# $refs       - handed to format_ref_marker() for every commit
# $extra      - if true, printed as is inside a trailing "page_nav" div
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # Start at $from, the way git_shortlog_body() does; the loop used to
        # start at 0 no matter what was asked for.
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                # skip entries that carry no commit data
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                # separate statements: the authorship is printed by the helper
                # itself, between the links block and the end of "title_text"
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5872
# Print the 'shortlog' table: one row per commit with its date, author,
# subject and action links.
#
# $commitlist - array reference of commit hash references
# $from, $to  - first and last index of @$commitlist to print; $from
#               defaults to 0 and $to is limited to the last valid index
# $refs       - handed to format_ref_marker() for every commit
# $extra      - if defined, printed as is in a last row spanning the table
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 if (!defined $from);
        if (!defined $to || $to > $#{$commitlist}) {
                $to = $#{$commitlist};
        }

        print qq{<table class="shortlog">\n};
        my $row = 0;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between "dark" and "light", starting dark
                my $row_class = ($row++ % 2) ? 'light' : 'dark';
                print "<tr class=\"$row_class\">\n";

                # the date is shown, the age is its tooltip
                # (git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .)
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") . " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") . " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");

                # snapshot links are appended only when there are any
                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links if (defined $snapshot_links);

                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5916
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	#
	# Prints the "history" table for one path: a row per commit of
	# @$commitlist in the inclusive index window $from..$to.  $file_name and
	# $ftype (used both as the action name and as the link text) describe the
	# path; $file_hash is compared with the path's hash in each listed commit
	# to decide whether a "diff to current" link is shown.  Uses the global
	# $hash_base for that link.  $extra, when defined, goes into a final
	# full-width row.
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	my $last_idx = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_idx if (!defined $to || $to > $last_idx);

	print "<table class=\"history\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		# empty entries are skipped and do not flip the row colour
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		my $row_class = $dark ? "dark" : "light";
		$dark = !$dark;
		print "<tr class=\"$row_class\">\n";

		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
	# shortlog:   format_author_html('td', \%co, 10)
		      format_author_html('td', \%co, 15, 3) . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my @links = (
			$cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype),
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
		);
		print "</td>\n" .
		      "<td class=\"link\">" .
		      join(" | ", @links);

		if ($ftype eq 'blob') {
			# the lookup is done for every blob row, even without $file_hash
			my $blob_parent = git_get_hash_by_path($commit, $file_name);
			my $differs = defined $file_hash && defined $blob_parent &&
			              $file_hash ne $blob_parent;
			if ($differs) {
				my $diff_href = href(action=>"blobdiff",
				                     hash=>$file_hash, hash_parent=>$blob_parent,
				                     hash_base=>$hash_base, hash_parent_base=>$commit,
				                     file_name=>$file_name);
				print " | " . $cgi->a({-href => $diff_href}, "diff to current");
			}
		}
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5976
sub git_tags_body {
	# uses global variable $project
	#
	# Prints the "tags" table: one row per entry of @$taglist in the
	# inclusive index window $from..$to.  Each entry is a hash ref from which
	# the keys 'subject', 'age', 'name', 'id', 'type', 'reftype', 'refid' and
	# 'fullname' are read.  $extra, when defined, is printed in a final row
	# spanning all five columns.
	my ($taglist, $from, $to, $extra) = @_;

	my $last_idx = $#{$taglist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"tags\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %tag = %{$taglist->[$idx]};
		my $comment = $tag{'subject'};

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# age column stays empty when the entry carries no age
		print defined $tag{'age'}
			? "<td><i>$tag{'age'}</i></td>\n"
			: "<td></td>\n";

		print "<td>" .
		      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
		               -class => "list name"}, esc_html($tag{'name'})) .
		      "</td>\n" .
		      "<td>";
		if (defined $comment) {
			# subject is shown shortened, linking to the tag itself
			my $comment_short = chop_str($comment, 30, 5);
			print format_subject_html($comment, $comment_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}

		# "selflink" column: only tag-type entries get a "tag" link
		my $selflink = $tag{'type'} eq "tag"
			? $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag")
			: "&nbsp;";
		print "</td>\n" .
		      "<td class=\"selflink\">" .
		      $selflink;

		# remaining links depend on the kind of object the tag refers to
		my @links = (
			$cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'}),
		);
		if ($tag{'reftype'} eq "commit") {
			push @links,
				$cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog"),
				$cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
		} elsif ($tag{'reftype'} eq "blob") {
			push @links,
				$cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		print "</td>\n" .
		      "<td class=\"link\">" . " | " .
		      join(" | ", @links);
		print "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
6039
sub git_heads_body {
	# uses global variable $project
	#
	# Prints the "heads" table: one row per entry of @$headlist in the
	# inclusive index window $from..$to.  Each entry is a hash ref from which
	# 'id', 'age', 'name' and 'fullname' are read.  The name cell of an entry
	# whose 'id' equals $head_at gets the "current_head" class.  $extra, when
	# defined, is printed in a final row spanning all three columns.
	my ($headlist, $head_at, $from, $to, $extra) = @_;

	my $last_idx = $#{$headlist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"heads\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %ref = %{$headlist->[$idx]};
		my $is_current = defined $head_at && $ref{'id'} eq $head_at;

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		my $name_cell_open = $is_current ? "<td class=\"current_head\">" : "<td>";
		my $name_link =
			$cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
			         -class => "list name"},esc_html($ref{'name'}));
		my @links = (
			$cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog"),
			$cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log"),
			$cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree"),
		);

		print "<td><i>$ref{'age'}</i></td>\n" .
		      $name_cell_open .
		      $name_link .
		      "</td>\n" .
		      "<td class=\"link\">" .
		      join(" | ", @links) .
		      "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
6077
# Display a single remote block
#
# Prints a small table with the URL(s) of remote $remote followed by the
# table of its heads.  $rdata is a hash ref from which the keys 'heads',
# 'fetch' and 'push' are read; either URL may be undefined.  When $limit is
# defined and smaller than the number of heads, a "..." link to the
# "remotes" action is passed to git_heads_body() as its extra row.  $head is
# passed through to git_heads_body() as the id of the current head.
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch && defined $push && $fetch eq $push) {
		# one URL serves both directions
		$urls_table .= format_repo_url("URL", $fetch);
	} elsif (defined $fetch || defined $push) {
		# Only compare the URLs when both exist (see above); a remote with
		# just one of them must not trigger an "uninitialized value"
		# warning, nor be labelled as a shared URL.
		$urls_table .= format_repo_url("Fetch URL", $fetch) if defined $fetch;
		$urls_table .= format_repo_url("Push URL", $push) if defined $push;
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
6111
# Display a list of remote names with the respective fetch and push URLs
#
# $remotedata is a hash ref keyed by remote name; each value is a hash ref
# from which 'fetch' and 'push' are read.  Remotes are listed sorted by
# name.  When $limit is true and smaller than the number of remotes, only
# the first $limit names are shown, followed by a "..." row linking to the
# "remotes" action.
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	# truncate the list to the first $limit names
	$#remotes = $limit - 1 if $limited;

	# Iterate with foreach rather than "while (my $remote = shift @remotes)":
	# the latter stops at the first remote whose name is false in boolean
	# context (e.g. a remote called "0"), silently dropping it and every
	# remote sorted after it.
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# a missing URL is shown as plain text instead of a link
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
6155
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
# $remotedata is a hash ref keyed by remote name.  When $limit is true and
# smaller than the number of remotes, the work is delegated to
# git_remotes_list(); otherwise fill_remote_heads() is called on the data
# and one section per remote is printed via git_remote_block().  $head is
# passed through to git_remote_block().
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;
	if ($limit and $limit < keys %$remotedata) {
		git_remotes_list($remotedata, $limit);
	} else {
		fill_remote_heads($remotedata);
		# Walk the remotes in sorted order, as git_remotes_list() does:
		# each() yields them in unspecified hash order and depends on
		# the hash's shared iterator state, so the page layout would not
		# be stable.
		foreach my $remote (sort keys %$remotedata) {
			my $rdata = $remotedata->{$remote};
			git_print_section({-class=>"remote", -id=>$remote},
				["remotes", $remote, $remote], sub {
					git_remote_block($remote, $rdata, $limit, $head);
				});
		}
	}
}
6172
sub git_search_message {
	# Renders one page of results for a commit message / author / committer
	# search.  %co is the parsed commit whose 'tree' and 'title' are used for
	# the page header.  Uses the globals $searchtype, $searchtext,
	# $search_use_regexp, $hash and $page.
	my %co = @_;

	# git-log option matching each supported search type
	my %grep_option_for = (
		'commit'    => "--grep=",
		'author'    => "--author=",
		'committer' => "--committer=",
	);
	my $greptype = $grep_option_for{$searchtype};
	$greptype .= $searchtext;

	# 101 entries are requested per page of 100: a 101st result is what
	# tells us below that a "next" page exists
	my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
	                               $greptype, '--regexp-ignore-case',
	                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

	# navigation entries are plain text when there is nowhere to go
	my @nav;
	if ($page > 0) {
		push @nav,
			$cgi->a({-href => href(-replay=>1, page=>undef)},
			        "first"),
			$cgi->a({-href => href(-replay=>1, page=>$page-1),
			         -accesskey => "p", -title => "Alt-p"}, "prev");
	} else {
		push @nav, "first", "prev";
	}

	my $next_link = '';
	if (@commitlist > 100) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
		push @nav, $next_link;
	} else {
		push @nav, "next";
	}
	my $paging_nav = join(" &sdot; ", @nav);

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);
	if ($page == 0 && !@commitlist) {
		print "<p>No match.</p>\n";
	} else {
		git_search_grep_body(\@commitlist, 0, 99, $next_link);
	}

	git_footer_html();
}
6222
sub git_search_changes {
	# Renders the results of a pickaxe search ("git log -S<text>"): one table
	# row per matching commit, listing the files reported for it.  %co is
	# first the parsed commit used for the page header and is then reused to
	# hold the commit whose row is currently open.  Uses the globals
	# $searchtext, $search_use_regexp, @diff_opts and $hash.
	my %co = @_;

	local $/ = "\n";
	open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
		'--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
		($search_use_regexp ? '--pickaxe-regex' : ())
			or die_error(500, "Open git-log failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	# Closes the file-list cell of the commit currently held in %co and
	# appends its "commit | tree" link cell; a no-op while %co is empty.
	my $finish_commit_row = sub {
		return unless %co;
		my @links = (
			$cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
			        "commit"),
			$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
			                       hash_base=>$co{'id'})},
			        "tree"),
		);
		print "</td>\n" .
		      "<td class=\"link\">" .
		      join(" | ", @links) .
		      "</td>\n" .
		      "</tr>\n";
	};

	print "<table class=\"pickaxe search\">\n";
	my $dark = 1;
	undef %co;
	my @files;
	while (my $line = <$fd>) {
		chomp $line;
		next unless $line;

		my %set = parse_difftree_raw_line($line);
		if (defined $set{'commit'}) {
			# a new commit starts: finish previous commit, open a new row
			$finish_commit_row->();

			print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
			$dark = !$dark;

			%co = parse_commit($set{'commit'});
			my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
			print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
			      "<td><i>$author</i></td>\n" .
			      "<td>" .
			      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
			              -class => "list subject"},
			              chop_and_escape_str($co{'title'}, 50) . "<br/>");
		} elsif (defined $set{'to_id'}) {
			# an all-zero target id is not linked
			next if ($set{'to_id'} =~ m/^0{40}$/);

			my $blob_href = href(action=>"blob", hash_base=>$co{'id'},
			                     hash=>$set{'to_id'}, file_name=>$set{'to_file'});
			print $cgi->a({-href => $blob_href,
			              -class => "list"},
			              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
			      "<br/>\n";
		}
	}
	close $fd;

	# finish last commit
	$finish_commit_row->();

	print "</table>\n";

	git_footer_html();
}
6305
sub git_search_files {
	# Renders the results of a "git grep" over the tree of commit %co: one
	# table row per matching file, containing one line per match (or a
	# "Binary file" marker).  Output is cut off after roughly 1000 result
	# lines.  Uses the globals $searchtext, $search_use_regexp,
	# $search_regexp and $hash.
	my %co = @_;

	local $/ = "\n";
	open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
		$search_use_regexp ? ('-E', '-i') : '-F',
		$searchtext, $co{'tree'}
			or die_error(500, "Open git-grep failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"grep_search\">\n";
	my $alternate = 1;
	my $matches = 0;
	# name of the file whose row is currently open; '' while no row is open
	my $lastfile = '';
	my $file_href;
	while (my $line = <$fd>) {
		chomp $line;
		my ($file, $lno, $ltext, $binary);
		last if ($matches++ > 1000);
		if ($line =~ /^Binary file (.+) matches$/) {
			$file = $1;
			$binary = 1;
		} else {
			# regular result lines are NUL-separated: file, line number, text
			($file, $lno, $ltext) = split(/\0/, $line, 3);
			# strip the leading "<tree>:" prefix; the id is quoted so it is
			# always matched literally
			$file =~ s/^\Q$co{'tree'}\E://;
		}
		if ($file ne $lastfile) {
			# compare against '' rather than testing truth, so that a file
			# named "0" still gets its row closed
			print "</td></tr>\n" if $lastfile ne '';
			# toggle the flag as the other table printers do; the former
			# "$alternate++" test was always true, so every row came out
			# "dark"
			if ($alternate) {
				print "<tr class=\"dark\">\n";
			} else {
				print "<tr class=\"light\">\n";
			}
			$alternate ^= 1;
			$file_href = href(action=>"blob", hash_base=>$co{'id'},
			                  file_name=>$file);
			print "<td class=\"list\">".
				$cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
			print "</td><td>\n";
			$lastfile = $file;
		}
		if ($binary) {
			print "<div class=\"binary\">Binary file</div>\n";
		} else {
			$ltext = untabify($ltext);
			# highlight the matched part of the line, if it can be located
			if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
				$ltext = esc_html($1, -nbsp=>1);
				$ltext .= '<span class="match">';
				$ltext .= esc_html($2, -nbsp=>1);
				$ltext .= '</span>';
				$ltext .= esc_html($3, -nbsp=>1);
			} else {
				$ltext = esc_html($ltext, -nbsp=>1);
			}
			print "<div class=\"pre\">" .
				$cgi->a({-href => $file_href.'#l'.$lno,
				        -class => "linenr"}, sprintf('%4i', $lno)) .
				' ' .  $ltext . "</div>\n";
		}
	}
	if ($lastfile ne '') {
		print "</td></tr>\n";
		if ($matches > 1000) {
			print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
		}
	} else {
		print "<div class=\"diff nodifferences\">No matches found</div>\n";
	}
	close $fd;

	print "</table>\n";

	git_footer_html();
}
6383
sub git_search_grep_body {
	# Prints the "commit_search" table: one row per commit of @$commitlist in
	# the inclusive index window $from..$to.  Below the commit subject every
	# comment line matching the global $search_regexp is shown, with the
	# match highlighted and surrounded by shortened context.  $extra, when
	# defined, is printed in a final row.
	my ($commitlist, $from, $to, $extra) = @_;

	my $last_idx = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"commit_search\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		# empty entries are skipped and do not flip the row colour
		next unless %co;

		my $commit = $co{'id'};
		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 15, 5) .
		      "<td>" .
		      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
		               -class => "list subject"},
		              chop_and_escape_str($co{'title'}, 50) . "<br/>");

		foreach my $line (@{$co{'comment'}}) {
			next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
			my ($lead, $match, $trail) = ($1, $2, $3);

			# shorten the match first, then give each side of it half of
			# what is left of 80 characters, capped at 30
			$match = chop_str($match, 70, 5, 'center');
			my $contextlen = int((80 - length($match))/2);
			$contextlen = 30 if ($contextlen > 30);
			$lead  = chop_str($lead,  $contextlen, 10, 'left');
			$trail = chop_str($trail, $contextlen, 10, 'right');

			print esc_html($lead) .
			      "<span class=\"match\">" . esc_html($match) . "</span>" .
			      esc_html($trail) . "<br />";
		}

		my @links = (
			$cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit"),
			$cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff"),
			$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree"),
		);
		print "</td>\n" .
		      "<td class=\"link\">" .
		      join(" | ", @links);
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
6443
6444## ======================================================================
6445## ======================================================================
6446## actions
6447
sub git_project_list {
	# "project list" action: prints the page listing the projects returned
	# by git_get_projects_list(), preceded by the optional $home_text file
	# and the project search form.  Fails with 400 on an unknown 'order'
	# parameter and with 404 when no projects are found.
	my $order = $input_params{'order'};
	# The pattern is anchored so that only the exact keywords are accepted;
	# unanchored, any value merely containing one of them (e.g. "damage")
	# passed this check.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project_filter, $strict_export);
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}

	git_project_search_form($searchtext, $search_use_regexp);
	git_project_list_body(\@list, $order);
	git_footer_html();
}
6470
sub git_forks {
	# "forks" action: prints the list of projects returned by
	# git_get_projects_list() for the current $project with a trailing
	# ".git" removed.  Fails with 400 on an unknown 'order' parameter and
	# with 404 when the list is empty.
	my $order = $input_params{'order'};
	# The pattern is anchored so that only the exact keywords are accepted;
	# unanchored, any value merely containing one of them (e.g. "damage")
	# passed this check.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my $filter = $project;
	$filter =~ s/\.git$//;
	my @list = git_get_projects_list($filter);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	git_print_header_div('summary', "$project forks");
	git_project_list_body(\@list, $order);
	git_footer_html();
}
6490
sub git_project_index {
	# "project index" action: prints a text/plain listing with one
	# "<path> <owner>" line per project, both fields quoted.  Fails with 404
	# when no projects are found.
	my @projects = git_get_projects_list($project_filter, $strict_export);
	die_error(404, "No projects found") unless @projects;

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
	my $quote_field = sub {
		my ($field) = @_;
		$field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
		$field =~ s/ /\+/g;
		return $field;
	};

	foreach my $pr (@projects) {
		# look the owner up only when the project entry lacks one
		$pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
			unless exists $pr->{'owner'};

		my $path  = $quote_field->($pr->{'path'});
		my $owner = $quote_field->($pr->{'owner'});

		print "$path $owner\n";
	}
}
6517
6518sub git_summary {
6519        my $descr = git_get_project_description($project) || "none";
6520        my %co = parse_commit("HEAD");
6521        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
6522        my $head = $co{'id'};
6523        my $remote_heads = gitweb_check_feature('remote_heads');
6524
6525        my $owner = git_get_project_owner($project);
6526
6527        my $refs = git_get_references();
6528        # These get_*_list functions return one more to allow us to see if
6529        # there are more ...
6530        my @taglist  = git_get_tags_list(16);
6531        my @headlist = git_get_heads_list(16);
6532        my %remotedata = $remote_heads ? git_get_remotes_list() : ();
6533        my @forklist;
6534        my $check_forks = gitweb_check_feature('forks');
6535
6536        if ($check_forks) {
6537                # find forks of a project
6538                my $filter = $project;
6539                $filter =~ s/\.git$//;
6540                @forklist = git_get_projects_list($filter);
6541                # filter out forks of forks
6542                @forklist = filter_forks_from_projects_list(\@forklist)
6543                        if (@forklist);
6544        }
6545
6546        git_header_html();
6547        git_print_page_nav('summary','', $head);
6548
6549        print "<div class=\"title\">&nbsp;</div>\n";
6550        print "<table class=\"projects_list\">\n" .
6551              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
6552        if ($owner and not $omit_owner) {
6553                print  "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
6554        }
6555        if (defined $cd{'rfc2822'}) {
6556                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
6557                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
6558        }
6559
6560        # use per project git URL list in $projectroot/$project/cloneurl
6561        # or make project git URL from git base URL and project name
6562        my $url_tag = "URL";
6563        my @url_list = git_get_project_url_list($project);
6564        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
6565        foreach my $git_url (@url_list) {
6566                next unless $git_url;
6567                print format_repo_url($url_tag, $git_url);
6568                $url_tag = "";
6569        }
6570
6571        # Tag cloud
6572        my $show_ctags = gitweb_check_feature('ctags');
6573        if ($show_ctags) {
6574                my $ctags = git_get_project_ctags($project);
6575                if (%$ctags) {
6576                        # without ability to add tags, don't show if there are none
6577                        my $cloud = git_populate_project_tagcloud($ctags);
6578                        print "<tr id=\"metadata_ctags\">" .
6579                              "<td>content tags</td>" .
6580                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
6581                              "</tr>\n";
6582                }
6583        }
6584
6585        print "</table>\n";
6586
6587        # If XSS prevention is on, we don't include README.html.
6588        # TODO: Allow a readme in some safe format.
6589        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
6590                print "<div class=\"title\">readme</div>\n" .
6591                      "<div class=\"readme\">\n";
6592                insert_file("$projectroot/$project/README.html");
6593                print "\n</div>\n"; # class="readme"
6594        }
6595
6596        # we need to request one more than 16 (0..15) to check if
6597        # those 16 are all
6598        my @commitlist = $head ? parse_commits($head, 17) : ();
6599        if (@commitlist) {
6600                git_print_header_div('shortlog');
6601                git_shortlog_body(\@commitlist, 0, 15, $refs,
6602                                  $#commitlist <=  15 ? undef :
6603                                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
6604        }
6605
6606        if (@taglist) {
6607                git_print_header_div('tags');
6608                git_tags_body(\@taglist, 0, 15,
6609                              $#taglist <=  15 ? undef :
6610                              $cgi->a({-href => href(action=>"tags")}, "..."));
6611        }
6612
6613        if (@headlist) {
6614                git_print_header_div('heads');
6615                git_heads_body(\@headlist, $head, 0, 15,
6616                               $#headlist <= 15 ? undef :
6617                               $cgi->a({-href => href(action=>"heads")}, "..."));
6618        }
6619
6620        if (%remotedata) {
6621                git_print_header_div('remotes');
6622                git_remotes_body(\%remotedata, 15, $head);
6623        }
6624
6625        if (@forklist) {
6626                git_print_header_div('forks');
6627                git_project_list_body(\@forklist, 'age', 0, 15,
6628                                      $#forklist <= 15 ? undef :
6629                                      $cgi->a({-href => href(action=>"forks")}, "..."),
6630                                      'no_header');
6631        }
6632
6633        git_footer_html();
6634}
6635
# Render the page for the tag object named by the global $hash:
# a header table linking to the tagged object, the authorship rows
# (when the parsed tag carries an 'author'), and the tag message.
# Dies with a 404 if parse_tag() yields nothing.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # Both cells of the "object" row point at the same view; the action
        # is the type of the tagged object.
        my $object_link = $cgi->a({-class => "list",
                                   -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                                  $tag{'object'});
        my $type_link = $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                                $tag{'type'});
        print qq!<div class="title_text">\n! .
              qq!<table class="object_header">\n! .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $object_link . "</td>\n" .
              qq!<td class="link">! . $type_link . "</td>\n" .
              "</tr>\n";

        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});

        print "</table>\n\n" .
              "</div>\n";

        # tag message, one escaped line per <br/>
        print qq!<div class="page_body">!;
        my $message = $tag{'comment'};
        for my $message_line (@$message) {
                chomp $message_line;
                print esc_html($message_line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6670
# Shared implementation of the three blame actions.
#
# Takes one optional argument, the output format:
#   'porcelain'   (default) - run "git blame -p" and render the full
#                             blame table server-side;
#   'incremental'           - print the plain file contents as a table
#                             skeleton (plus progress widgets);
#   'data'                  - stream raw "git blame --incremental" output
#                             as text/plain, followed by an END line.
# A 'porcelain' request with the 'javascript' input parameter set is
# upgraded to 'incremental'.
#
# Works on the globals $file_name, $hash_base and $hash; dies via
# die_error() if blame is disabled, no file name was given, the base
# commit cannot be resolved, or $hash does not name a blob.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $input_params{'javascript'}) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact comparison: a pattern match would accept any type
                # merely containing "blob" and warn on an undefined type
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }
        binmode $fd, ':utf8';

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # terminator line, optionally followed by elapsed time and
                # the number of git commands run
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        # row classes alternate per group of lines from the same commit
        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit and line-number cells carry empty links here
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        # read "<key> <value>" header lines until the
                        # TAB-prefixed content line; first value seen for
                        # a key wins, 'previous' lines are also counted
                        my $data;
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a group size is only present on the first line of
                        # a group, so this flips the color once per group
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell spanning the whole group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to blame of the parent commit
                        # when one is known, else of the blamed commit itself
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6903
# 'blame' action: ordinary blame, i.e. git_blame_common() in its
# default 'porcelain' format.
sub git_blame {
        git_blame_common('porcelain');
}
6907
# 'blame_incremental' action: git_blame_common() in 'incremental' format.
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6911
# 'blame_data' action: git_blame_common() in 'data' format, which
# streams the raw incremental blame output as text/plain.
sub git_blame_data {
        return git_blame_common('data');
}
6915
# 'tags' action: page header and navigation, then the tag table
# (omitted when git_get_tags_list() returns nothing), then the footer.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
        git_print_header_div('summary', $project);

        my @all_tags = git_get_tags_list();
        git_tags_body(\@all_tags) if @all_tags;

        git_footer_html();
}
6928
# 'heads' action: page header and navigation, then the heads table
# (omitted when git_get_heads_list() returns nothing), then the footer.
# The current HEAD hash is passed on to git_heads_body().
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
        git_print_header_div('summary', $project);

        my @all_heads = git_get_heads_list();
        git_heads_body(\@all_heads, $head) if @all_heads;

        git_footer_html();
}
6941
# Serves two views: a single remote (when the 'hash' input parameter
# names one) and the list of all remotes (when it is not given).
# Dies with 403 if the 'remote_heads' feature is off, 500 if remote
# information cannot be obtained, and 404 if nothing was found.
sub git_remotes {
        die_error(403, "Remote heads view is disabled")
                unless gitweb_check_feature('remote_heads');

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        if (!defined $remotedata) {
                die_error(500, "Unable to get remote information");
        }

        if (!%$remotedata) {
                my $not_found = defined $remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $not_found);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($remote ? '' : 'remotes'));

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                # overview of every remote
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        } else {
                # just the requested remote
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }

        git_footer_html();
}
6974
# 'blob_plain' (raw) action: send the blob named by $hash - or looked up
# from $file_name in $hash_base / the current HEAD - as the HTTP body.
#
# Takes one optional argument, a content type, which is handed to
# blob_contenttype() together with the open handle and $file_name.
#
# Dies with 400 if neither a hash nor a file name is available, 404 if
# the file cannot be found, and 500 if git-cat-file cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain; likewise textual <type>/<subtype>+xml
        # (e.g. image/svg+xml).  The subtype needs the "+" quantifier:
        # without it only a one-letter subtype could ever match.
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                # keep whatever followed the media type (e.g. charset)
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and emit it unencoded
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7036
# 'blob' action: HTML view of a single file.  The blob is taken from
# $hash, or looked up from $file_name in $hash_base / the current HEAD.
# Binary content that is neither text/* nor a gif/png/jpeg image is
# handed over to git_blob_plain(); images are shown through an <img>
# tag pointing at the blob_plain view; everything else is printed line
# by line with line-number anchors.
sub git_blob {
        my $expires;

        if (defined $hash) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d" if $hash =~ m/^[0-9a-fA-F]{40}$/;
        } elsif (defined $file_name) {
                my $base = $hash_base || git_get_head_hash($project);
                $hash = git_get_hash_by_path($base, $file_name, "blob")
                        or die_error(404, "Cannot find file");
        } else {
                die_error(400, "No file name defined");
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);

        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        unless ($mimetype =~ m!^(?:text/|image/(?:gif|png|jpeg)$)! || !-B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }

        # we can have blame only for text/* mimetype
        if ($have_blame) {
                $have_blame = ($mimetype =~ m!^text/!);
        }

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax);

        git_header_html(undef, $expires);
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                # alternative views of this blob, later joined with " | "
                my @nav_links;
                if (defined $file_name) {
                        if ($have_blame) {
                                push @nav_links,
                                        scalar($cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                       "blame"));
                        }
                        push @nav_links,
                                scalar($cgi->a({-href => href(action=>"history", -replay=>1)},
                                               "history")),
                                scalar($cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                               "raw")),
                                scalar($cgi->a({-href => href(action=>"blob",
                                                              hash_base=>"HEAD", file_name=>$file_name)},
                                               "HEAD"));
                } else {
                        push @nav_links,
                                scalar($cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                               "raw"));
                }
                my $formats_nav = join(" | ", @nav_links);
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: empty navigation, title is the hash
                print qq!<div class="page_nav">\n! .
                      "<br/><br/></div>\n" .
                      qq!<div class="title">! . esc_html($hash) . "</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print qq!<div class="page_body">\n!;

        if ($mimetype !~ m!^image/!) {
                # text: one <div> per line, each with a self-linking anchor
                my $line_count = 0;
                while (my $text = <$fd>) {
                        chomp $text;
                        ++$line_count;
                        $text = untabify($text);
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $line_count, esc_attr(href(-replay => 1)), $line_count, $line_count,
                               $highlight ? sanitize($text) : esc_html($text, -nbsp=>1);
                }
        } else {
                # image: delegate the actual bytes to the blob_plain view
                print qq!<img class="blob" type="! . esc_attr($mimetype) . qq!"!;
                if ($file_name) {
                        print qq! alt="! . esc_attr($file_name) .
                              qq!" title="! . esc_attr($file_name) . qq!"!;
                }
                print qq! src="! .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        }

        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
7128
# 'tree' action: directory listing for the tree named by $hash.  When
# $hash is not given it is looked up from $file_name inside $hash_base,
# or is $hash_base itself; $hash_base defaults to "HEAD".
# Dies with 404 if no tree can be determined or reading it fails, and
# with 500 if git-ls-tree cannot be started.
sub git_tree {
        $hash_base = "HEAD" unless defined $hash_base;
        if (!defined $hash) {
                $hash = defined $file_name
                        ? git_get_hash_by_path($hash_base, $file_name, "tree")
                        : $hash_base;
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        # read the NUL-separated ls-tree records, terminator stripped
        my @entries = ();
        {
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                chomp(@entries = <$fd>);
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                # FIXME: Should be available when we have no hash base as well.
                push @views_nav, $snapshot_links
                        if defined $snapshot_links;
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # not a usable commit: forget it and title the page by hash
                undef $hash_base;
                print qq!<div class="page_nav">\n!;
                print "<br/><br/></div>\n";
                print qq!<div class="title">! . esc_html($hash) . "</div>\n";
        }

        # directory prefix for entries, always ending in '/' when non-empty
        my $basedir = '';
        if (defined $file_name) {
                $basedir = $file_name;
                $basedir .= '/'
                        if $basedir ne '' && substr($basedir, -1) ne '/';
                git_print_page_path($file_name, 'tree', $hash_base);
        }

        print qq!<div class="page_body">\n!;
        print qq!<table class="tree">\n!;

        # rows alternate dark/light, starting with dark
        my $alternate = 1;

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                my $row_class = $alternate ? 'dark' : 'light';
                print qq!<tr class="$row_class">\n!;
                $alternate ^= 1;

                # strip the last path component; empty means the top tree
                my $parent_dir = $file_name;
                $parent_dir =~ s!/?[^/]+$!!;
                undef $parent_dir unless $parent_dir;

                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$parent_dir)},
                              "..");
                print "</td>\n";
                print qq!<td class="link"></td>\n!;

                print "</tr>\n";
        }

        for my $record (@entries) {
                my %t = parse_ls_tree_line($record, -z => 1, -l => $show_sizes);

                my $row_class = $alternate ? 'dark' : 'light';
                print qq!<tr class="$row_class">\n!;
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }

        print "</table>\n" .
              "</div>";
        git_footer_html();
}
7238
# Return a copy of the given name made safe for use in a file name:
# every '/' becomes '-', then every character other than alphanumerics,
# '_', '.' and '-' is dropped.
sub sanitize_for_filename {
    my ($name) = @_;

    $name =~ tr{/}{-};
    $name =~ s/[^[:alnum:]_.-]//g;

    return $name;
}
7247
# Build the base name "<project>-<version>" for a snapshot archive.
#
# Arguments: project path and the requested hash or ref name.
# The project part is the sanitized basename with any trailing ".git"
# removed; the version part depends on the form of $hash (hex id, tag
# ref, or other ref).  In list context the name is returned twice.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s,([^/])/*\.git$,$1,;
        $name = sanitize_for_filename(basename($name));

        my $ver = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                my $full_hash = git_get_full_hash($project, $hash);
                if ($full_hash =~ /^$hash/ && length($hash) > 7) {
                        $ver = git_get_short_hash($project, $hash);
                }
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $ver = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                my $strip_refs = join '|', map { quotemeta } get_branch_refs();
                if (my ($ref_dir, $ref_rest) =
                            $hash =~ m!^refs/($strip_refs|remotes)/(.*)$!) {
                        $ver = $ref_rest;

                        $ref_dir = sanitize_for_filename($ref_dir);
                        # for refs neither in heads nor remotes we want to
                        # add a ref dir to archive name
                        unless ($ref_dir eq '' or $ref_dir eq 'heads' or $ref_dir eq 'remotes') {
                                $ver = $ref_dir . '-' . $ver;
                        }
                }
                $ver .= '-' . git_get_short_hash($project, $hash);
        }

        # special case of sanitization for filename - we change
        # slashes to dots instead of dashes
        # in case of hierarchical branch names
        $ver =~ tr{/}{.};
        $ver =~ s/[^[:alnum:]_.-]//g;

        # name = project-version_string
        my $snapshot = join '-', $name, $ver;

        return wantarray ? ($snapshot, $snapshot) : $snapshot;
}
7294
# Answer a conditional GET with "304 Not Modified" when possible.
#
# $latest_epoch is the modification time (seconds since the epoch) of the
# content about to be served.  If the request has an If-Modified-Since
# header that can be parsed (HTTP::Date is tried first, then
# Time::ParseDate) and $latest_epoch is not newer than it, a 304 header
# is printed and control jumps to the DONE_GITWEB label.  In every other
# case the sub simply returns so the caller can send the full response.
sub exit_if_unmodified_since {
        my ($latest_epoch) = @_;
        our $cgi;

        my $header_value = $cgi->http('IF_MODIFIED_SINCE');
        return unless defined $header_value;

        # both date parsers are optional; without either $since stays undef
        my $since;
        if (eval { require HTTP::Date; 1; }) {
                $since = HTTP::Date::str2time($header_value);
        }
        elsif (eval { require Time::ParseDate; 1; }) {
                $since = Time::ParseDate::parsedate($header_value, GMT => 1);
        }
        return unless (defined $since && $latest_epoch <= $since);

        my %latest_date = parse_date($latest_epoch);
        print $cgi->header(
                -last_modified => $latest_date{'rfc2822'},
                -status => '304 Not Modified');
        goto DONE_GITWEB;
}
7316
# Send a snapshot archive of the tree-ish in $hash to the client.
#
# The archive format comes from $input_params{'snapshot_format'} and
# defaults to the first entry of @snapshot_fmts; it must be well-formed,
# known, not disabled and listed in @snapshot_fmts.  The archive is made
# by "git archive", optionally piped through the format's compressor, and
# is copied to STDOUT as raw bytes.
#
# Error responses (via die_error):
#   403 - snapshots, or the requested format, are not allowed
#   400 - malformed or unknown format, or the object is a blob
#   404 - the object does not exist
#   500 - the archive command could not be started
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # "^{}" peels tags, so a tag pointing at a blob is rejected as well
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";

        # %co is empty when $hash is not a commit; then there is no
        # modification time to compare against or to advertise
        my %co = parse_commit($hash);
        exit_if_unmodified_since($co{'committer_epoch'}) if %co;

        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # start the archiver before any header is printed, so that a
        # failure here can still be reported as a proper error response
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");
        binmode $fd, ':raw';

        # escape for use inside a quoted-string header parameter
        $filename =~ s/(["\\])/\\$1/g;
        my %latest_date;
        if (%co) {
                %latest_date = parse_date($co{'committer_epoch'}, $co{'committer_tz'});
        }

        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                %co ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        binmode STDOUT, ':raw';
        {
                # copy in fixed-size records instead of reading the whole
                # (binary) archive into memory as a list of "lines"
                local $/ = \65536;
                while (my $chunk = <$fd>) {
                        print $chunk;
                }
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7374
# Shared implementation of the paged commit-list views.
#
# Parameters:
#   $fmt_name  - view name, passed to format_paging_nav and git_print_page_nav
#   $body_subr - code ref that prints the list; it is called as
#                $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                             $file_name, $file_hash, $ftype)
#   $base      - revision to list from; defaults to the project's head
#   $parent    - optional; when defined the range "$parent..$base" is listed
#   $file_name - optional path to limit the listing to (uses --full-history)
#   $file_hash - optional object id of that path; when missing it is looked
#                up in the listed commits
#
# Pages hold 100 commits; 101 are requested so that the presence of a
# following page can be detected.  The global $page is set to 0 if it was
# undefined.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0     unless defined $page;
        my $refs = git_get_references();

        my $commit_hash = defined $parent ? "$parent..$base" : $base;
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }

        # a 101st commit means there is at least one more page
        my $has_next_page = @commitlist > 100;
        my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
        my $next_link = '';
        if ($has_next_page) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        # List-context call, as in git_commitdiff, so that $patch_max gets
        # the first returned value.
        # NOTE(review): presumably gitweb_get_feature returns a list of
        # feature values - confirm against its definition.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # negative limit is treated as "no limit" here
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project);
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
7448
# Commit log view: git_log_generic rendered by git_log_body, listing from
# $hash (optionally limited to the range $hash_parent..$hash).
sub git_log {
        my @range = ($hash, $hash_parent);
        return git_log_generic('log', \&git_log_body, @range);
}
7453
# Print the page for a single commit: navigation, a header table with
# authorship, commit id, tree and parent links, the commit message and
# the list of changed files.
#
# The commit is taken from $hash, falling back to $hash_base and then to
# "HEAD".  Responds with 404 if the commit cannot be parsed or reading
# git-diff-tree fails, and with 500 if git-diff-tree cannot be started.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # link to a commit, labelled with its 7-character abbreviation
        my $short_commit_link = sub {
                my ($id) = @_;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav = '(parent: ' . $short_commit_link->($parent) . ')';
        } else {
                # merge commit
                my @parent_links = map { $short_commit_link->($_) } @$parents;
                $formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        $parent = "--root" unless defined $parent;

        # raw list of changed files: against the single parent (or --root),
        # or in combined form (-c) for a merge
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        chomp(my @difftree = <$fd>);
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires;
        $expires = "+1d" if ($hash =~ m/^[0-9a-fA-F]{40}$/);

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        # header table: authorship, commit id, tree, parents
        print "<div class=\"title_text\">\n";
        print "<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";
        print "<tr><td>tree</td><td class=\"sha1\">";
        print $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                       class => "list"}, $co{'tree'});
        print "</td><td class=\"link\">";
        print $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links if defined $snapshot_links;
        print "</td></tr>\n";

        for my $par (@$parents) {
                my $id_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$par),
                                 class => "list"}, $par);
                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit");
                my $diff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
                print "<tr><td>parent</td>" .
                      "<td class=\"sha1\">" . $id_link . "</td>" .
                      "<td class=\"link\">" . $commit_link . " | " . $diff_link . "</td>" .
                      "</tr>\n";
        }
        print "</table></div>\n";

        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7567
# Work out the type of the requested object and redirect (302) to the
# action named after that type.
#
# The object is identified either by
#   - $hash, or $hash_base alone (type from "git cat-file -t"), or
#   - $hash_base together with $file_name (type and hash from "git ls-tree").
# Responds 404 when the object, base or path does not exist, and 400
# when neither combination of parameters is available.
sub git_object {
        my $type;

        if ($hash || ($hash_base && !defined $file_name)) {
                # - hash or hash_base alone
                my $object_id = $hash || $hash_base;

                # stderr is discarded; a failing command is reported as 404
                my $cat_file = quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null';
                open my $fd, "-|", $cat_file
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");

        } elsif ($hash_base && defined $file_name) {
                # - hash_base and file_name
                $file_name =~ s,/+$,,;

                if (system(git_cmd(), "cat-file", '-e', $hash_base) != 0) {
                        die_error(404, "Base object does not exist");
                }

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $entry = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                die_error(404, "File or directory for given base does not exist")
                        unless ($entry && $entry =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/);
                ($type, $hash) = ($2, $3);

        } else {
                die_error(400, "Not enough information to find object");
        }

        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7614
# Show the difference between two versions of a single file.
#
# $format (first argument, default 'html') selects the output:
#   'html'  - full gitweb page, patch rendered by git_patchset_body
#   'plain' - text/plain patch served as "<file name>.patch"
# Any other value yields a 400 response.
#
# Both $hash_base and $hash_parent_base are required.  The file is then
# identified either by $file_name (optionally with $file_parent) or by a
# full 40-digit $hash that is matched against the "to" id of the raw diff.
# Missing parameters, no matching entry and ambiguous matches are reported
# through die_error.  $file_name, $file_parent, $hash and $hash_parent are
# filled in from the raw diff entry when they were not given.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /^[0-9a-fA-F]{40}$/) {
                        # try to find filename from $hash; only a complete
                        # object id can be compared with the raw output

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status code, like every other die_error call here
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # escape for use inside a quoted-string header parameter,
                # the same way git_snapshot does
                my $patch_name = $file_name . '.patch';
                $patch_name =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # In the patch header (everything up to the "+++" line)
                # replace a/<id> and b/<id> by the file names; the ids are
                # matched literally, not as regular expressions.
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is copied through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7749
# Plain-text variant of git_blobdiff.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
7753
# Navigation fragment for switching between diff styles.
#
# The fragment is meant to be appended to an existing navigation bar, so
# every entry is preceded by " | " (giving " | foo | bar", not "foo | bar").
# The style named by $diff_style (default 'inline') is shown as plain text,
# every other style as a link that replays the current request with a
# different diff_style.  For combined diffs ($is_combined true) the empty
# string is returned.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # styles in display order, and their human-readable labels
        my @style_order = ('inline', 'sidebyside');
        my %label_of = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my $nav = '';
        foreach my $style (@style_order) {
                my $entry;
                if ($style eq $diff_style) {
                        $entry = $label_of{$style};
                } else {
                        $entry = $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                         $label_of{$style});
                }
                $nav .= " | " . $entry;
        }
        return $nav;
}
7774
# Show the changes introduced by a commit (or between two commits).
#
# Named parameters:
#   -format => 'html' (default), 'plain' or 'patch'
#   -single => true to emit exactly one patch ('patch' format, and only
#              when no $hash_parent is given)
#
# The commit is taken from $hash, falling back to $hash_base and then to
# "HEAD"; $hash_parent optionally names the commit to diff against.  For a
# merge without $hash_parent the combined diff ('--cc') is used and
# $hash_parent is set accordingly.
#
#   'html'  - full gitweb page with file list and rendered patch set
#   'plain' - text/plain: mail-like header, commit message and the output
#             of "git diff-tree -p"
#   'patch' - text/plain: output of "git format-patch --stdout"; requires
#             the 'patches' feature (403 otherwise), whose value limits the
#             number of patches when it is positive
# Unknown formats yield a 400 response, unknown commits a 404.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of them
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit: offer the other combined-diff flavour
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                if ($hash_parent) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                # the title is already in the header; print the log only
                # if the message has more than that one line
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # (a lookup of tag references used to be made here, but its
                # result was never read)
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";
                # escape for use inside a quoted-string header parameter,
                # the same way git_snapshot does
                $filename =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";
                # escape for use inside a quoted-string header parameter
                $filename =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit second commit (or for a combined
                # diff) the commit's own parents are passed on
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # headers are already out, so a failure can only be
                # reported inside the body
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
8002
# 'commitdiff_plain' action: delegate to git_commitdiff(), asking for
# its 'plain' output format.
sub git_commitdiff_plain {
        my @options = (-format => 'plain');
        return git_commitdiff(@options);
}
8006
# format-patch-style patches
#
# 'patch' action: delegate to git_commitdiff() with the 'patch' format
# and the -single flag set (presumably limiting output to one commit;
# the flag is interpreted by git_commitdiff()).
sub git_patch {
        my @options = (-format => 'patch', -single => 1);
        return git_commitdiff(@options);
}
8011
# 'patches' action: same as git_patch(), but without the -single flag.
sub git_patches {
        my @options = (-format => 'patch');
        return git_commitdiff(@options);
}
8015
# 'history' action: run the generic log view in 'history' mode, with
# git_history_body() as the body renderer and the request's
# $hash_base, $hash_parent_base, $file_name and $hash as arguments.
sub git_history {
        my @log_args = ($hash_base, $hash_parent_base, $file_name, $hash);
        return git_log_generic('history', \&git_history_body, @log_args);
}
8021
# 'search' action: validate the request, then hand over to the search
# implementation matching $searchtype.
#
# Reads and may set the request globals $searchtype (defaults to
# 'commit'), $hash (defaults to the project's head hash) and $page
# (defaults to 0).  Errors out with:
#   403 - the search feature (or pickaxe/grep, when requested) is disabled
#   400 - $searchtext is undefined, or $searchtype is not recognized
#   404 - $hash does not parse as a commit
sub git_search {
        $searchtype = 'commit' unless $searchtype;

        # check if appropriate features are enabled
        if (!gitweb_check_feature('search')) {
                die_error(403, "Search is disabled");
        }
        # pickaxe may take all resources of your box and run for several minutes
        # with every query - so decide by yourself how public you make this feature
        if ($searchtype eq 'pickaxe' && !gitweb_check_feature('pickaxe')) {
                die_error(403, "Pickaxe search is disabled");
        }
        # grep search might be potentially CPU-intensive, too
        if ($searchtype eq 'grep' && !gitweb_check_feature('grep')) {
                die_error(403, "Grep search is disabled");
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => sub implementing it
        my %search_sub_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );
        my $search_sub = $search_sub_for{$searchtype};
        if (defined $search_sub) {
                $search_sub->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
8066
# 'search_help' action: print a static help page describing the
# available search types.  The "grep" and "pickaxe" entries are only
# printed when the corresponding feature is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('', '', $hash, $hash, $hash);

        # general introduction and the always-available "commit" search
        print <<'EOT';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
EOT

        if (gitweb_check_feature('grep')) {
                print <<'EOT';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
EOT
        }

        print <<'EOT';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
EOT

        if (gitweb_check_feature('pickaxe')) {
                print <<'EOT';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
EOT
        }

        print "</dl>\n";
        git_footer_html();
}
8110
# 'shortlog' action: run the generic log view in 'shortlog' mode, with
# git_shortlog_body() as the body renderer and the request's $hash and
# $hash_parent as arguments.
sub git_shortlog {
        my @log_args = ($hash, $hash_parent);
        return git_log_generic('shortlog', \&git_shortlog_body, @log_args);
}
8115
8116## ......................................................................
8117## feeds (RSS, Atom; OPML)
8118
# Print a web feed (RSS 2.0 or Atom) for the current project.
#
# Parameters:
#   $format - 'rss' or 'atom' (default 'atom'); anything else results in
#             a 400 error.
#
# Uses the request globals $hash and $file_name to select what is fed:
# the log of HEAD, the log of a given revision, or the history of a
# path.  Up to 150 commits are parsed; the first 20 are always shown,
# later ones only while their author date is within the last 48 hours.
#
# Output is the HTTP header followed by the XML document.  For HEAD
# requests only the header is printed.  Commits whose git-diff-tree
# invocation cannot be started or finishes with an error are skipped.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
            $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                exit_if_unmodified_since($latest_epoch);
                %latest_date = parse_date($latest_epoch, $latest_commit{'committer_tz'});
        }
        print $cgi->header(
                -type => $content_type,
                -charset => 'utf-8',
                %latest_date ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        # (the request method may be undefined, e.g. outside a web server)
        my $request_method = $cgi->request_method();
        return if (defined $request_method && $request_method eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (!defined $descr) {
                # no description available: fall back to a generic one
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        # escape in both cases: the fallback contains the project name
        $descr = esc_html($descr);
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        # URLs are interpolated directly into XML text and attribute
        # values below, so markup-significant characters must be escaped
        $alt_url = esc_html($alt_url);
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      esc_html($cgi->self_url()) . '" />' . "\n" .
                      "<id>" . esc_html(href(-full=>1)) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for my $i (0 .. $#commitlist) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                # (escaped because it is interpolated into XML, see $alt_url)
                my $co_url = esc_html(href(-full=>1, action=>"commitdiff", hash=>$commit));
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        # $line aliases the commit's own comment array, so
                        # escape into the output instead of assigning back
                        print esc_html($line) . "\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
8356
# 'rss' action: produce the feed via git_feed() in RSS format.
sub git_rss {
        my $format = 'rss';
        return git_feed($format);
}
8360
# 'atom' action: produce the feed via git_feed() in Atom format.
sub git_atom {
        my $format = 'atom';
        return git_feed($format);
}
8364
# 'opml' action: print an OPML 1.0 document with one <outline> per
# project, pointing at the project's RSS feed and its summary page.
#
# The project list comes from git_get_projects_list(), restricted by
# the globals $project_filter and $strict_export; an empty list is a
# 404 error.  Projects without a resolvable head hash, or whose head
# does not parse as a commit, are left out.
sub git_opml {
        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # only mention the subdirectory when the listing is filtered
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my $proj_path = $pr->{'path'};
                my $head = git_get_head_hash($proj_path);
                next if !defined $head;

                # NOTE(review): sets the global $git_dir, presumably so that
                # parse_commit() below operates on this project - confirm
                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next if !%co;

                my $path = esc_html(chop_str($proj_path, 25, 5));
                # the URLs end up inside XML attribute values, so they need
                # the same escaping as the text/title attributes
                my $rss  = esc_html(href('project' => $proj_path, 'action' => 'rss', -full => 1));
                my $html = esc_html(href('project' => $proj_path, 'action' => 'summary', -full => 1));
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}