gitweb / gitweb.perlon commit Merge git://ozlabs.org/~paulus/gitk (09bb4eb)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use 5.008;
  11use strict;
  12use warnings;
  13use CGI qw(:standard :escapeHTML -nosticky);
  14use CGI::Util qw(unescape);
  15use CGI::Carp qw(fatalsToBrowser set_message);
  16use Encode;
  17use Fcntl ':mode';
  18use File::Find qw();
  19use File::Basename qw(basename);
  20use Time::HiRes qw(gettimeofday tv_interval);
  21binmode STDOUT, ':utf8';
  22
  23our $t0 = [ gettimeofday() ];
  24our $number_of_git_cmds = 0;
  25
  26BEGIN {
  27        CGI->compile() if $ENV{'MOD_PERL'};
  28}
  29
  30our $version = "++GIT_VERSION++";
  31
  32our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  33sub evaluate_uri {
  34        our $cgi;
  35
  36        our $my_url = $cgi->url();
  37        our $my_uri = $cgi->url(-absolute => 1);
  38
  39        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  40        # needed and used only for URLs with nonempty PATH_INFO
  41        our $base_url = $my_url;
  42
  43        # When the script is used as DirectoryIndex, the URL does not contain the name
  44        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  45        # have to do it ourselves. We make $path_info global because it's also used
  46        # later on.
  47        #
  48        # Another issue with the script being the DirectoryIndex is that the resulting
  49        # $my_url data is not the full script URL: this is good, because we want
  50        # generated links to keep implying the script name if it wasn't explicitly
  51        # indicated in the URL we're handling, but it means that $my_url cannot be used
  52        # as base URL.
  53        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  54        # to build the base URL ourselves:
  55        our $path_info = $ENV{"PATH_INFO"};
  56        if ($path_info) {
  57                if ($my_url =~ s,\Q$path_info\E$,, &&
  58                    $my_uri =~ s,\Q$path_info\E$,, &&
  59                    defined $ENV{'SCRIPT_NAME'}) {
  60                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  61                }
  62        }
  63
  64        # target of the home link on top of all pages
  65        our $home_link = $my_uri || "/";
  66}
  67
  68# core git executable to use
  69# this can just be "git" if your webserver has a sensible PATH
  70our $GIT = "++GIT_BINDIR++/git";
  71
  72# absolute fs-path which will be prepended to the project path
  73#our $projectroot = "/pub/scm";
  74our $projectroot = "++GITWEB_PROJECTROOT++";
  75
  76# fs traversing limit for getting project list
  77# the number is relative to the projectroot
  78our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  79
  80# string of the home link on top of all pages
  81our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  82
  83# name of your site or organization to appear in page titles
  84# replace this with something more descriptive for clearer bookmarks
  85our $site_name = "++GITWEB_SITENAME++"
  86                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  87
  88# html snippet to include in the <head> section of each page
  89our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
  90# filename of html text to include at top of each page
  91our $site_header = "++GITWEB_SITE_HEADER++";
  92# html text to include at home page
  93our $home_text = "++GITWEB_HOMETEXT++";
  94# filename of html text to include at bottom of each page
  95our $site_footer = "++GITWEB_SITE_FOOTER++";
  96
  97# URI of stylesheets
  98our @stylesheets = ("++GITWEB_CSS++");
  99# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
 100our $stylesheet = undef;
 101# URI of GIT logo (72x27 size)
 102our $logo = "++GITWEB_LOGO++";
 103# URI of GIT favicon, assumed to be image/png type
 104our $favicon = "++GITWEB_FAVICON++";
 105# URI of gitweb.js (JavaScript code for gitweb)
 106our $javascript = "++GITWEB_JS++";
 107
 108# URI and label (title) of GIT logo link
 109#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 110#our $logo_label = "git documentation";
 111our $logo_url = "http://git-scm.com/";
 112our $logo_label = "git homepage";
 113
 114# source of projects list
 115our $projects_list = "++GITWEB_LIST++";
 116
 117# the width (in characters) of the projects list "Description" column
 118our $projects_list_description_width = 25;
 119
 120# group projects by category on the projects list
 121# (enabled if this variable evaluates to true)
 122our $projects_list_group_categories = 0;
 123
 124# default category if none specified
 125# (leave the empty string for no category)
 126our $project_list_default_category = "";
 127
 128# default order of projects list
 129# valid values are none, project, descr, owner, and age
 130our $default_projects_order = "project";
 131
 132# show repository only if this file exists
 133# (only effective if this variable evaluates to true)
 134our $export_ok = "++GITWEB_EXPORT_OK++";
 135
 136# show repository only if this subroutine returns true
 137# when given the path to the project, for example:
 138#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 139our $export_auth_hook = undef;
 140
 141# only allow viewing of repositories also shown on the overview page
 142our $strict_export = "++GITWEB_STRICT_EXPORT++";
 143
 144# list of git base URLs used for URL to where fetch project from,
 145# i.e. full URL is "$git_base_url/$project"
 146our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 147
 148# default blob_plain mimetype and default charset for text/plain blob
 149our $default_blob_plain_mimetype = 'text/plain';
 150our $default_text_plain_charset  = undef;
 151
 152# file to use for guessing MIME types before trying /etc/mime.types
 153# (relative to the current git repository)
 154our $mimetypes_file = undef;
 155
 156# assume this charset if line contains non-UTF-8 characters;
 157# it should be valid encoding (see Encoding::Supported(3pm) for list),
 158# for which encoding all byte sequences are valid, for example
 159# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 160# could be even 'utf-8' for the old behavior)
 161our $fallback_encoding = 'latin1';
 162
 163# rename detection options for git-diff and git-diff-tree
 164# - default is '-M', with the cost proportional to
 165#   (number of removed files) * (number of new files).
 166# - more costly is '-C' (which implies '-M'), with the cost proportional to
 167#   (number of changed files + number of removed files) * (number of new files)
 168# - even more costly is '-C', '--find-copies-harder' with cost
 169#   (number of files in the original tree) * (number of new files)
 170# - one might want to include '-B' option, e.g. '-B', '-M'
 171our @diff_opts = ('-M'); # taken from git_commit
 172
 173# Disables features that would allow repository owners to inject script into
 174# the gitweb domain.
 175our $prevent_xss = 0;
 176
 177# Path to the highlight executable to use (must be the one from
 178# http://www.andre-simon.de due to assumptions about parameters and output).
 179# Useful if highlight is not installed on your webserver's PATH.
 180# [Default: highlight]
 181our $highlight_bin = "++HIGHLIGHT_BIN++";
 182
 183# information about snapshot formats that gitweb is capable of serving
 184our %known_snapshot_formats = (
 185        # name => {
 186        #       'display' => display name,
 187        #       'type' => mime type,
 188        #       'suffix' => filename suffix,
 189        #       'format' => --format for git-archive,
 190        #       'compressor' => [compressor command and arguments]
 191        #                       (array reference, optional)
 192        #       'disabled' => boolean (optional)}
 193        #
 194        'tgz' => {
 195                'display' => 'tar.gz',
 196                'type' => 'application/x-gzip',
 197                'suffix' => '.tar.gz',
 198                'format' => 'tar',
 199                'compressor' => ['gzip', '-n']},
 200
 201        'tbz2' => {
 202                'display' => 'tar.bz2',
 203                'type' => 'application/x-bzip2',
 204                'suffix' => '.tar.bz2',
 205                'format' => 'tar',
 206                'compressor' => ['bzip2']},
 207
 208        'txz' => {
 209                'display' => 'tar.xz',
 210                'type' => 'application/x-xz',
 211                'suffix' => '.tar.xz',
 212                'format' => 'tar',
 213                'compressor' => ['xz'],
 214                'disabled' => 1},
 215
 216        'zip' => {
 217                'display' => 'zip',
 218                'type' => 'application/x-zip',
 219                'suffix' => '.zip',
 220                'format' => 'zip'},
 221);
 222
 223# Aliases so we understand old gitweb.snapshot values in repository
 224# configuration.
 225our %known_snapshot_format_aliases = (
 226        'gzip'  => 'tgz',
 227        'bzip2' => 'tbz2',
 228        'xz'    => 'txz',
 229
 230        # backward compatibility: legacy gitweb config support
 231        'x-gzip' => undef, 'gz' => undef,
 232        'x-bzip2' => undef, 'bz2' => undef,
 233        'x-zip' => undef, '' => undef,
 234);
 235
 236# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 237# are changed, it may be appropriate to change these values too via
 238# $GITWEB_CONFIG.
 239our %avatar_size = (
 240        'default' => 16,
 241        'double'  => 32
 242);
 243
 244# Used to set the maximum load that we will still respond to gitweb queries.
 245# If server load exceed this value then return "503 server busy" error.
 246# If gitweb cannot determined server load, it is taken to be 0.
 247# Leave it undefined (or set to 'undef') to turn off load checking.
 248our $maxload = 300;
 249
 250# configuration for 'highlight' (http://www.andre-simon.de/)
 251# match by basename
 252our %highlight_basename = (
 253        #'Program' => 'py',
 254        #'Library' => 'py',
 255        'SConstruct' => 'py', # SCons equivalent of Makefile
 256        'Makefile' => 'make',
 257);
 258# match by extension
 259our %highlight_ext = (
 260        # main extensions, defining name of syntax;
 261        # see files in /usr/share/highlight/langDefs/ directory
 262        map { $_ => $_ }
 263                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
 264        # alternate extensions, see /etc/highlight/filetypes.conf
 265        'h' => 'c',
 266        map { $_ => 'sh'  } qw(bash zsh ksh),
 267        map { $_ => 'cpp' } qw(cxx c++ cc),
 268        map { $_ => 'php' } qw(php3 php4 php5 phps),
 269        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
 270        map { $_ => 'make'} qw(mak mk),
 271        map { $_ => 'xml' } qw(xhtml html htm),
 272);
 273
 274# You define site-wide feature defaults here; override them with
 275# $GITWEB_CONFIG as necessary.
 276our %feature = (
 277        # feature => {
 278        #       'sub' => feature-sub (subroutine),
 279        #       'override' => allow-override (boolean),
 280        #       'default' => [ default options...] (array reference)}
 281        #
 282        # if feature is overridable (it means that allow-override has true value),
 283        # then feature-sub will be called with default options as parameters;
 284        # return value of feature-sub indicates if to enable specified feature
 285        #
 286        # if there is no 'sub' key (no feature-sub), then feature cannot be
 287        # overridden
 288        #
 289        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 290        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 291        # is enabled
 292
 293        # Enable the 'blame' blob view, showing the last commit that modified
 294        # each line in the file. This can be very CPU-intensive.
 295
 296        # To enable system wide have in $GITWEB_CONFIG
 297        # $feature{'blame'}{'default'} = [1];
 298        # To have project specific config enable override in $GITWEB_CONFIG
 299        # $feature{'blame'}{'override'} = 1;
 300        # and in project config gitweb.blame = 0|1;
 301        'blame' => {
 302                'sub' => sub { feature_bool('blame', @_) },
 303                'override' => 0,
 304                'default' => [0]},
 305
        # Enable the 'snapshot' link, providing a compressed archive of any
        # tree. This can potentially generate high traffic if you have a
        # large project.
 309
 310        # Value is a list of formats defined in %known_snapshot_formats that
 311        # you wish to offer.
 312        # To disable system wide have in $GITWEB_CONFIG
 313        # $feature{'snapshot'}{'default'} = [];
 314        # To have project specific config enable override in $GITWEB_CONFIG
 315        # $feature{'snapshot'}{'override'} = 1;
 316        # and in project config, a comma-separated list of formats or "none"
 317        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 318        'snapshot' => {
 319                'sub' => \&feature_snapshot,
 320                'override' => 0,
 321                'default' => ['tgz']},
 322
 323        # Enable text search, which will list the commits which match author,
 324        # committer or commit text to a given string.  Enabled by default.
 325        # Project specific override is not supported.
 326        #
 327        # Note that this controls all search features, which means that if
 328        # it is disabled, then 'grep' and 'pickaxe' search would also be
 329        # disabled.
 330        'search' => {
 331                'override' => 0,
 332                'default' => [1]},
 333
 334        # Enable grep search, which will list the files in currently selected
 335        # tree containing the given string. Enabled by default. This can be
 336        # potentially CPU-intensive, of course.
 337        # Note that you need to have 'search' feature enabled too.
 338
 339        # To enable system wide have in $GITWEB_CONFIG
 340        # $feature{'grep'}{'default'} = [1];
 341        # To have project specific config enable override in $GITWEB_CONFIG
 342        # $feature{'grep'}{'override'} = 1;
 343        # and in project config gitweb.grep = 0|1;
 344        'grep' => {
 345                'sub' => sub { feature_bool('grep', @_) },
 346                'override' => 0,
 347                'default' => [1]},
 348
 349        # Enable the pickaxe search, which will list the commits that modified
 350        # a given string in a file. This can be practical and quite faster
 351        # alternative to 'blame', but still potentially CPU-intensive.
 352        # Note that you need to have 'search' feature enabled too.
 353
 354        # To enable system wide have in $GITWEB_CONFIG
 355        # $feature{'pickaxe'}{'default'} = [1];
 356        # To have project specific config enable override in $GITWEB_CONFIG
 357        # $feature{'pickaxe'}{'override'} = 1;
 358        # and in project config gitweb.pickaxe = 0|1;
 359        'pickaxe' => {
 360                'sub' => sub { feature_bool('pickaxe', @_) },
 361                'override' => 0,
 362                'default' => [1]},
 363
 364        # Enable showing size of blobs in a 'tree' view, in a separate
 365        # column, similar to what 'ls -l' does.  This cost a bit of IO.
 366
 367        # To disable system wide have in $GITWEB_CONFIG
 368        # $feature{'show-sizes'}{'default'} = [0];
 369        # To have project specific config enable override in $GITWEB_CONFIG
 370        # $feature{'show-sizes'}{'override'} = 1;
 371        # and in project config gitweb.showsizes = 0|1;
 372        'show-sizes' => {
 373                'sub' => sub { feature_bool('showsizes', @_) },
 374                'override' => 0,
 375                'default' => [1]},
 376
 377        # Make gitweb use an alternative format of the URLs which can be
 378        # more readable and natural-looking: project name is embedded
 379        # directly in the path and the query string contains other
 380        # auxiliary information. All gitweb installations recognize
 381        # URL in either format; this configures in which formats gitweb
 382        # generates links.
 383
 384        # To enable system wide have in $GITWEB_CONFIG
 385        # $feature{'pathinfo'}{'default'} = [1];
 386        # Project specific override is not supported.
 387
 388        # Note that you will need to change the default location of CSS,
 389        # favicon, logo and possibly other files to an absolute URL. Also,
 390        # if gitweb.cgi serves as your indexfile, you will need to force
 391        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 392        'pathinfo' => {
 393                'override' => 0,
 394                'default' => [0]},
 395
 396        # Make gitweb consider projects in project root subdirectories
 397        # to be forks of existing projects. Given project $projname.git,
 398        # projects matching $projname/*.git will not be shown in the main
 399        # projects list, instead a '+' mark will be added to $projname
 400        # there and a 'forks' view will be enabled for the project, listing
 401        # all the forks. If project list is taken from a file, forks have
 402        # to be listed after the main project.
 403
 404        # To enable system wide have in $GITWEB_CONFIG
 405        # $feature{'forks'}{'default'} = [1];
 406        # Project specific override is not supported.
 407        'forks' => {
 408                'override' => 0,
 409                'default' => [0]},
 410
 411        # Insert custom links to the action bar of all project pages.
 412        # This enables you mainly to link to third-party scripts integrating
 413        # into gitweb; e.g. git-browser for graphical history representation
 414        # or custom web-based repository administration interface.
 415
 416        # The 'default' value consists of a list of triplets in the form
 417        # (label, link, position) where position is the label after which
 418        # to insert the link and link is a format string where %n expands
 419        # to the project name, %f to the project path within the filesystem,
 420        # %h to the current hash (h gitweb parameter) and %b to the current
 421        # hash base (hb gitweb parameter); %% expands to %.
 422
 423        # To enable system wide have in $GITWEB_CONFIG e.g.
 424        # $feature{'actions'}{'default'} = [('graphiclog',
 425        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 426        # Project specific override is not supported.
 427        'actions' => {
 428                'override' => 0,
 429                'default' => []},
 430
        # Allow gitweb to scan project content tags of the project repository,
        # and display the popular Web 2.0-ish "tag cloud" near the projects
        # list.  Note that this is something COMPLETELY different from the
        # normal Git tags.
 435
 436        # gitweb by itself can show existing tags, but it does not handle
 437        # tagging itself; you need to do it externally, outside gitweb.
 438        # The format is described in git_get_project_ctags() subroutine.
 439        # You may want to install the HTML::TagCloud Perl module to get
 440        # a pretty tag cloud instead of just a list of tags.
 441
 442        # To enable system wide have in $GITWEB_CONFIG
 443        # $feature{'ctags'}{'default'} = [1];
 444        # Project specific override is not supported.
 445
 446        # In the future whether ctags editing is enabled might depend
 447        # on the value, but using 1 should always mean no editing of ctags.
 448        'ctags' => {
 449                'override' => 0,
 450                'default' => [0]},
 451
 452        # The maximum number of patches in a patchset generated in patch
 453        # view. Set this to 0 or undef to disable patch view, or to a
 454        # negative number to remove any limit.
 455
 456        # To disable system wide have in $GITWEB_CONFIG
 457        # $feature{'patches'}{'default'} = [0];
 458        # To have project specific config enable override in $GITWEB_CONFIG
 459        # $feature{'patches'}{'override'} = 1;
 460        # and in project config gitweb.patches = 0|n;
 461        # where n is the maximum number of patches allowed in a patchset.
 462        'patches' => {
 463                'sub' => \&feature_patches,
 464                'override' => 0,
 465                'default' => [16]},
 466
 467        # Avatar support. When this feature is enabled, views such as
 468        # shortlog or commit will display an avatar associated with
 469        # the email of the committer(s) and/or author(s).
 470
 471        # Currently available providers are gravatar and picon.
 472        # If an unknown provider is specified, the feature is disabled.
 473
 474        # Gravatar depends on Digest::MD5.
 475        # Picon currently relies on the indiana.edu database.
 476
 477        # To enable system wide have in $GITWEB_CONFIG
 478        # $feature{'avatar'}{'default'} = ['<provider>'];
 479        # where <provider> is either gravatar or picon.
 480        # To have project specific config enable override in $GITWEB_CONFIG
 481        # $feature{'avatar'}{'override'} = 1;
 482        # and in project config gitweb.avatar = <provider>;
 483        'avatar' => {
 484                'sub' => \&feature_avatar,
 485                'override' => 0,
 486                'default' => ['']},
 487
 488        # Enable displaying how much time and how many git commands
 489        # it took to generate and display page.  Disabled by default.
 490        # Project specific override is not supported.
 491        'timed' => {
 492                'override' => 0,
 493                'default' => [0]},
 494
 495        # Enable turning some links into links to actions which require
 496        # JavaScript to run (like 'blame_incremental').  Not enabled by
 497        # default.  Project specific override is currently not supported.
 498        'javascript-actions' => {
 499                'override' => 0,
 500                'default' => [0]},
 501
 502        # Enable and configure ability to change common timezone for dates
 503        # in gitweb output via JavaScript.  Enabled by default.
 504        # Project specific override is not supported.
 505        'javascript-timezone' => {
 506                'override' => 0,
 507                'default' => [
 508                        'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
 509                                     # or undef to turn off this feature
 510                        'gitweb_tz', # name of cookie where to store selected timezone
 511                        'datetime',  # CSS class used to mark up dates for manipulation
 512                ]},
 513
 514        # Syntax highlighting support. This is based on Daniel Svensson's
 515        # and Sham Chukoury's work in gitweb-xmms2.git.
 516        # It requires the 'highlight' program present in $PATH,
 517        # and therefore is disabled by default.
 518
 519        # To enable system wide have in $GITWEB_CONFIG
 520        # $feature{'highlight'}{'default'} = [1];
 521
 522        'highlight' => {
 523                'sub' => sub { feature_bool('highlight', @_) },
 524                'override' => 0,
 525                'default' => [0]},
 526
 527        # Enable displaying of remote heads in the heads list
 528
 529        # To enable system wide have in $GITWEB_CONFIG
 530        # $feature{'remote_heads'}{'default'} = [1];
 531        # To have project specific config enable override in $GITWEB_CONFIG
 532        # $feature{'remote_heads'}{'override'} = 1;
 533        # and in project config gitweb.remote_heads = 0|1;
 534        'remote_heads' => {
 535                'sub' => sub { feature_bool('remote_heads', @_) },
 536                'override' => 0,
 537                'default' => [0]},
 538);
 539
 540sub gitweb_get_feature {
 541        my ($name) = @_;
 542        return unless exists $feature{$name};
 543        my ($sub, $override, @defaults) = (
 544                $feature{$name}{'sub'},
 545                $feature{$name}{'override'},
 546                @{$feature{$name}{'default'}});
 547        # project specific override is possible only if we have project
 548        our $git_dir; # global variable, declared later
 549        if (!$override || !defined $git_dir) {
 550                return @defaults;
 551        }
 552        if (!defined $sub) {
 553                warn "feature $name is not overridable";
 554                return @defaults;
 555        }
 556        return $sub->(@defaults);
 557}
 558
 559# A wrapper to check if a given feature is enabled.
 560# With this, you can say
 561#
 562#   my $bool_feat = gitweb_check_feature('bool_feat');
 563#   gitweb_check_feature('bool_feat') or somecode;
 564#
 565# instead of
 566#
 567#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 568#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 569#
 570sub gitweb_check_feature {
 571        return (gitweb_get_feature(@_))[0];
 572}
 573
 574
 575sub feature_bool {
 576        my $key = shift;
 577        my ($val) = git_get_project_config($key, '--bool');
 578
 579        if (!defined $val) {
 580                return ($_[0]);
 581        } elsif ($val eq 'true') {
 582                return (1);
 583        } elsif ($val eq 'false') {
 584                return (0);
 585        }
 586}
 587
 588sub feature_snapshot {
 589        my (@fmts) = @_;
 590
 591        my ($val) = git_get_project_config('snapshot');
 592
 593        if ($val) {
 594                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 595        }
 596
 597        return @fmts;
 598}
 599
 600sub feature_patches {
 601        my @val = (git_get_project_config('patches', '--int'));
 602
 603        if (@val) {
 604                return @val;
 605        }
 606
 607        return ($_[0]);
 608}
 609
 610sub feature_avatar {
 611        my @val = (git_get_project_config('avatar'));
 612
 613        return @val ? @val : @_;
 614}
 615
 616# checking HEAD file with -e is fragile if the repository was
 617# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 618# and then pruned.
 619sub check_head_link {
 620        my ($dir) = @_;
 621        my $headfile = "$dir/HEAD";
 622        return ((-e $headfile) ||
 623                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 624}
 625
 626sub check_export_ok {
 627        my ($dir) = @_;
 628        return (check_head_link($dir) &&
 629                (!$export_ok || -e "$dir/$export_ok") &&
 630                (!$export_auth_hook || $export_auth_hook->($dir)));
 631}
 632
 633# process alternate names for backward compatibility
 634# filter out unsupported (unknown) snapshot formats
 635sub filter_snapshot_fmts {
 636        my @fmts = @_;
 637
 638        @fmts = map {
 639                exists $known_snapshot_format_aliases{$_} ?
 640                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 641        @fmts = grep {
 642                exists $known_snapshot_formats{$_} &&
 643                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 644}
 645
# If it is set to a code reference, that code is run once per request,
# allowing configuration that changes with each request to be updated,
# while the rest of the config file is run only once.
 649#
 650# Otherwise, if it is false then gitweb would process config file only once;
 651# if it is true then gitweb config would be run for each request.
 652our $per_request_config = 1;
 653
 654# read and parse gitweb config file given by its parameter.
 655# returns true on success, false on recoverable error, allowing
 656# to chain this subroutine, using first file that exists.
 657# dies on errors during parsing config file, as it is unrecoverable.
 658sub read_config_file {
 659        my $filename = shift;
 660        return unless defined $filename;
 661        # die if there are errors parsing config file
 662        if (-e $filename) {
 663                do $filename;
 664                die $@ if $@;
 665                return 1;
 666        }
 667        return;
 668}
 669
 670our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
 671sub evaluate_gitweb_config {
 672        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 673        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 674        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";
 675
 676        # Protect agains duplications of file names, to not read config twice.
 677        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so
 678        # there possibility of duplication of filename there doesn't matter.
 679        $GITWEB_CONFIG = ""        if ($GITWEB_CONFIG eq $GITWEB_CONFIG_COMMON);
 680        $GITWEB_CONFIG_SYSTEM = "" if ($GITWEB_CONFIG_SYSTEM eq $GITWEB_CONFIG_COMMON);
 681
 682        # Common system-wide settings for convenience.
 683        # Those settings can be ovverriden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
 684        read_config_file($GITWEB_CONFIG_COMMON);
 685
 686        # Use first config file that exists.  This means use the per-instance
 687        # GITWEB_CONFIG if exists, otherwise use GITWEB_SYSTEM_CONFIG.
 688        read_config_file($GITWEB_CONFIG) and return;
 689        read_config_file($GITWEB_CONFIG_SYSTEM);
 690}
 691
 692# Get loadavg of system, to compare against $maxload.
 693# Currently it requires '/proc/loadavg' present to get loadavg;
 694# if it is not present it returns 0, which means no load checking.
 695sub get_loadavg {
 696        if( -e '/proc/loadavg' ){
 697                open my $fd, '<', '/proc/loadavg'
 698                        or return 0;
 699                my @load = split(/\s+/, scalar <$fd>);
 700                close $fd;
 701
 702                # The first three columns measure CPU and IO utilization of the last one,
 703                # five, and 10 minute periods.  The fourth column shows the number of
 704                # currently running processes and the total number of processes in the m/n
 705                # format.  The last column displays the last process ID used.
 706                return $load[0] || 0;
 707        }
 708        # additional checks for load average should go here for things that don't export
 709        # /proc/loadavg
 710
 711        return 0;
 712}
 713
 714# version of the core git binary
 715our $git_version;
 716sub evaluate_git_version {
 717        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 718        $number_of_git_cmds++;
 719}
 720
 721sub check_loadavg {
 722        if (defined $maxload && get_loadavg() > $maxload) {
 723                die_error(503, "The load average on the server is too high");
 724        }
 725}
 726
 727# ======================================================================
 728# input validation and dispatch
 729
 730# input parameters can be collected from a variety of sources (presently, CGI
 731# and PATH_INFO), so we define an %input_params hash that collects them all
 732# together during validation: this allows subsequent uses (e.g. href()) to be
 733# agnostic of the parameter origin
 734
 735our %input_params = ();
 736
 737# input parameters are stored with the long parameter name as key. This will
 738# also be used in the href subroutine to convert parameters to their CGI
 739# equivalent, and since the href() usage is the most frequent one, we store
 740# the name -> CGI key mapping here, instead of the reverse.
 741#
 742# XXX: Warning: If you touch this, check the search form for updating,
 743# too.
 744
 745our @cgi_param_mapping = (
 746        project => "p",
 747        action => "a",
 748        file_name => "f",
 749        file_parent => "fp",
 750        hash => "h",
 751        hash_parent => "hp",
 752        hash_base => "hb",
 753        hash_parent_base => "hpb",
 754        page => "pg",
 755        order => "o",
 756        searchtext => "s",
 757        searchtype => "st",
 758        snapshot_format => "sf",
 759        extra_options => "opt",
 760        search_use_regexp => "sr",
 761        ctag => "by_tag",
 762        diff_style => "ds",
 763        # this must be last entry (for manipulation from JavaScript)
 764        javascript => "js"
 765);
 766our %cgi_param_mapping = @cgi_param_mapping;
 767
 768# we will also need to know the possible actions, for validation
 769our %actions = (
 770        "blame" => \&git_blame,
 771        "blame_incremental" => \&git_blame_incremental,
 772        "blame_data" => \&git_blame_data,
 773        "blobdiff" => \&git_blobdiff,
 774        "blobdiff_plain" => \&git_blobdiff_plain,
 775        "blob" => \&git_blob,
 776        "blob_plain" => \&git_blob_plain,
 777        "commitdiff" => \&git_commitdiff,
 778        "commitdiff_plain" => \&git_commitdiff_plain,
 779        "commit" => \&git_commit,
 780        "forks" => \&git_forks,
 781        "heads" => \&git_heads,
 782        "history" => \&git_history,
 783        "log" => \&git_log,
 784        "patch" => \&git_patch,
 785        "patches" => \&git_patches,
 786        "remotes" => \&git_remotes,
 787        "rss" => \&git_rss,
 788        "atom" => \&git_atom,
 789        "search" => \&git_search,
 790        "search_help" => \&git_search_help,
 791        "shortlog" => \&git_shortlog,
 792        "summary" => \&git_summary,
 793        "tag" => \&git_tag,
 794        "tags" => \&git_tags,
 795        "tree" => \&git_tree,
 796        "snapshot" => \&git_snapshot,
 797        "object" => \&git_object,
 798        # those below don't need $project
 799        "opml" => \&git_opml,
 800        "project_list" => \&git_project_list,
 801        "project_index" => \&git_project_index,
 802);
 803
 804# finally, we have the hash of allowed extra_options for the commands that
 805# allow them
 806our %allowed_options = (
 807        "--no-merges" => [ qw(rss atom log shortlog history) ],
 808);
 809
 810# fill %input_params with the CGI parameters. All values except for 'opt'
 811# should be single values, but opt can be an array. We should probably
 812# build an array of parameters that can be multi-valued, but since for the time
 813# being it's only this one, we just single it out
 814sub evaluate_query_params {
 815        our $cgi;
 816
 817        while (my ($name, $symbol) = each %cgi_param_mapping) {
 818                if ($symbol eq 'opt') {
 819                        $input_params{$name} = [ $cgi->param($symbol) ];
 820                } else {
 821                        $input_params{$name} = $cgi->param($symbol);
 822                }
 823        }
 824}
 825
 826# now read PATH_INFO and update the parameter list for missing parameters
 827sub evaluate_path_info {
 828        return if defined $input_params{'project'};
 829        return if !$path_info;
 830        $path_info =~ s,^/+,,;
 831        return if !$path_info;
 832
 833        # find which part of PATH_INFO is project
 834        my $project = $path_info;
 835        $project =~ s,/+$,,;
 836        while ($project && !check_head_link("$projectroot/$project")) {
 837                $project =~ s,/*[^/]*$,,;
 838        }
 839        return unless $project;
 840        $input_params{'project'} = $project;
 841
 842        # do not change any parameters if an action is given using the query string
 843        return if $input_params{'action'};
 844        $path_info =~ s,^\Q$project\E/*,,;
 845
 846        # next, check if we have an action
 847        my $action = $path_info;
 848        $action =~ s,/.*$,,;
 849        if (exists $actions{$action}) {
 850                $path_info =~ s,^$action/*,,;
 851                $input_params{'action'} = $action;
 852        }
 853
 854        # list of actions that want hash_base instead of hash, but can have no
 855        # pathname (f) parameter
 856        my @wants_base = (
 857                'tree',
 858                'history',
 859        );
 860
 861        # we want to catch, among others
 862        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 863        my ($parentrefname, $parentpathname, $refname, $pathname) =
 864                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);
 865
 866        # first, analyze the 'current' part
 867        if (defined $pathname) {
 868                # we got "branch:filename" or "branch:dir/"
 869                # we could use git_get_type(branch:pathname), but:
 870                # - it needs $git_dir
 871                # - it does a git() call
 872                # - the convention of terminating directories with a slash
 873                #   makes it superfluous
 874                # - embedding the action in the PATH_INFO would make it even
 875                #   more superfluous
 876                $pathname =~ s,^/+,,;
 877                if (!$pathname || substr($pathname, -1) eq "/") {
 878                        $input_params{'action'} ||= "tree";
 879                        $pathname =~ s,/$,,;
 880                } else {
 881                        # the default action depends on whether we had parent info
 882                        # or not
 883                        if ($parentrefname) {
 884                                $input_params{'action'} ||= "blobdiff_plain";
 885                        } else {
 886                                $input_params{'action'} ||= "blob_plain";
 887                        }
 888                }
 889                $input_params{'hash_base'} ||= $refname;
 890                $input_params{'file_name'} ||= $pathname;
 891        } elsif (defined $refname) {
 892                # we got "branch". In this case we have to choose if we have to
 893                # set hash or hash_base.
 894                #
 895                # Most of the actions without a pathname only want hash to be
 896                # set, except for the ones specified in @wants_base that want
 897                # hash_base instead. It should also be noted that hand-crafted
 898                # links having 'history' as an action and no pathname or hash
 899                # set will fail, but that happens regardless of PATH_INFO.
 900                if (defined $parentrefname) {
 901                        # if there is parent let the default be 'shortlog' action
 902                        # (for http://git.example.com/repo.git/A..B links); if there
 903                        # is no parent, dispatch will detect type of object and set
 904                        # action appropriately if required (if action is not set)
 905                        $input_params{'action'} ||= "shortlog";
 906                }
 907                if ($input_params{'action'} &&
 908                    grep { $_ eq $input_params{'action'} } @wants_base) {
 909                        $input_params{'hash_base'} ||= $refname;
 910                } else {
 911                        $input_params{'hash'} ||= $refname;
 912                }
 913        }
 914
 915        # next, handle the 'parent' part, if present
 916        if (defined $parentrefname) {
 917                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 918                # someproject/blobdiff/oldrev..newrev:/filename
 919                if ($parentpathname) {
 920                        $parentpathname =~ s,^/+,,;
 921                        $parentpathname =~ s,/$,,;
 922                        $input_params{'file_parent'} ||= $parentpathname;
 923                } else {
 924                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 925                }
 926                # we assume that hash_parent_base is wanted if a path was specified,
 927                # or if the action wants hash_base instead of hash
 928                if (defined $input_params{'file_parent'} ||
 929                        grep { $_ eq $input_params{'action'} } @wants_base) {
 930                        $input_params{'hash_parent_base'} ||= $parentrefname;
 931                } else {
 932                        $input_params{'hash_parent'} ||= $parentrefname;
 933                }
 934        }
 935
 936        # for the snapshot action, we allow URLs in the form
 937        # $project/snapshot/$hash.ext
 938        # where .ext determines the snapshot and gets removed from the
 939        # passed $refname to provide the $hash.
 940        #
 941        # To be able to tell that $refname includes the format extension, we
 942        # require the following two conditions to be satisfied:
 943        # - the hash input parameter MUST have been set from the $refname part
 944        #   of the URL (i.e. they must be equal)
 945        # - the snapshot format MUST NOT have been defined already (e.g. from
 946        #   CGI parameter sf)
 947        # It's also useless to try any matching unless $refname has a dot,
 948        # so we check for that too
 949        if (defined $input_params{'action'} &&
 950                $input_params{'action'} eq 'snapshot' &&
 951                defined $refname && index($refname, '.') != -1 &&
 952                $refname eq $input_params{'hash'} &&
 953                !defined $input_params{'snapshot_format'}) {
 954                # We loop over the known snapshot formats, checking for
 955                # extensions. Allowed extensions are both the defined suffix
 956                # (which includes the initial dot already) and the snapshot
 957                # format key itself, with a prepended dot
 958                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 959                        my $hash = $refname;
 960                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 961                                next;
 962                        }
 963                        my $sfx = $1;
 964                        # a valid suffix was found, so set the snapshot format
 965                        # and reset the hash parameter
 966                        $input_params{'snapshot_format'} = $fmt;
 967                        $input_params{'hash'} = $hash;
 968                        # we also set the format suffix to the one requested
 969                        # in the URL: this way a request for e.g. .tgz returns
 970                        # a .tgz instead of a .tar.gz
 971                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 972                        last;
 973                }
 974        }
 975}
 976
 977our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 978     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 979     $searchtext, $search_regexp);
 980sub evaluate_and_validate_params {
 981        our $action = $input_params{'action'};
 982        if (defined $action) {
 983                if (!validate_action($action)) {
 984                        die_error(400, "Invalid action parameter");
 985                }
 986        }
 987
 988        # parameters which are pathnames
 989        our $project = $input_params{'project'};
 990        if (defined $project) {
 991                if (!validate_project($project)) {
 992                        undef $project;
 993                        die_error(404, "No such project");
 994                }
 995        }
 996
 997        our $file_name = $input_params{'file_name'};
 998        if (defined $file_name) {
 999                if (!validate_pathname($file_name)) {
1000                        die_error(400, "Invalid file parameter");
1001                }
1002        }
1003
1004        our $file_parent = $input_params{'file_parent'};
1005        if (defined $file_parent) {
1006                if (!validate_pathname($file_parent)) {
1007                        die_error(400, "Invalid file parent parameter");
1008                }
1009        }
1010
1011        # parameters which are refnames
1012        our $hash = $input_params{'hash'};
1013        if (defined $hash) {
1014                if (!validate_refname($hash)) {
1015                        die_error(400, "Invalid hash parameter");
1016                }
1017        }
1018
1019        our $hash_parent = $input_params{'hash_parent'};
1020        if (defined $hash_parent) {
1021                if (!validate_refname($hash_parent)) {
1022                        die_error(400, "Invalid hash parent parameter");
1023                }
1024        }
1025
1026        our $hash_base = $input_params{'hash_base'};
1027        if (defined $hash_base) {
1028                if (!validate_refname($hash_base)) {
1029                        die_error(400, "Invalid hash base parameter");
1030                }
1031        }
1032
1033        our @extra_options = @{$input_params{'extra_options'}};
1034        # @extra_options is always defined, since it can only be (currently) set from
1035        # CGI, and $cgi->param() returns the empty array in array context if the param
1036        # is not set
1037        foreach my $opt (@extra_options) {
1038                if (not exists $allowed_options{$opt}) {
1039                        die_error(400, "Invalid option parameter");
1040                }
1041                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
1042                        die_error(400, "Invalid option parameter for this action");
1043                }
1044        }
1045
1046        our $hash_parent_base = $input_params{'hash_parent_base'};
1047        if (defined $hash_parent_base) {
1048                if (!validate_refname($hash_parent_base)) {
1049                        die_error(400, "Invalid hash parent base parameter");
1050                }
1051        }
1052
1053        # other parameters
1054        our $page = $input_params{'page'};
1055        if (defined $page) {
1056                if ($page =~ m/[^0-9]/) {
1057                        die_error(400, "Invalid page parameter");
1058                }
1059        }
1060
1061        our $searchtype = $input_params{'searchtype'};
1062        if (defined $searchtype) {
1063                if ($searchtype =~ m/[^a-z]/) {
1064                        die_error(400, "Invalid searchtype parameter");
1065                }
1066        }
1067
1068        our $search_use_regexp = $input_params{'search_use_regexp'};
1069
1070        our $searchtext = $input_params{'searchtext'};
1071        our $search_regexp;
1072        if (defined $searchtext) {
1073                if (length($searchtext) < 2) {
1074                        die_error(403, "At least two characters are required for search parameter");
1075                }
1076                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
1077        }
1078}
1079
# path to the current git repository
our $git_dir;

# Point $git_dir at the requested project below $projectroot; it is
# left untouched when no project was requested.
sub evaluate_git_dir {
        our $git_dir;
        if ($project) {
                $git_dir = "$projectroot/$project";
        }
}
1085
our (@snapshot_fmts, $git_avatar);

# Set up the per-request feature globals: @snapshot_fmts (the snapshot
# formats from the 'snapshot' feature, passed through
# filter_snapshot_fmts) and $git_avatar (the avatar provider).
sub configure_gitweb_features {
        # list of supported snapshot formats
        our @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # the avatar feature must name a known provider whose
        # dependencies are available; in any other case $git_avatar is
        # reset to the empty string
        our ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'gravatar') {
                # gravatar depends on Digest::MD5
                my $have_md5 = eval { require Digest::MD5; 1; };
                $git_avatar = '' if !$have_md5;
        } elsif ($git_avatar ne 'picon') {
                # 'picon' has no dependencies; anything else is unknown
                $git_avatar = '';
        }
}
1105
# Custom error handler registered with CGI::Carp, so that a plain
# 'die <message>' is shown as an Internal Server Error page.
# The message passed in is already HTML escaped.
sub handle_errors_html {
        my ($msg) = @_;

        # Switch back to a plain text message first, which disables
        # handle_errors_html: an error raised inside die_error itself
        # would otherwise lead to an infinite loop.
        set_message("Error occured when inside die_error:\n$msg");

        # When called as an error handler you cannot jump out of
        # die_error, and as the subroutine set via CGI::Carp::set_message
        # runs _after_ the HTTP headers were written, die_error must not
        # write them itself.
        my @handler_opts = (-error_handler => 1, -no_http_header => 1);
        die_error(undef, undef, $msg, @handler_opts);
}
set_message(\&handle_errors_html);
1120
# Select the action to run and call its handler from %actions.
# When no action was requested it is derived from the other parameters:
# the type of the object named by $hash, or by "$hash_base:$file_name",
# else 'summary' if a project is given and 'project_list' otherwise.
# Unknown actions, and actions that need a project when none was given,
# are rejected with a 400 error.
sub dispatch {
        if (!defined $action) {
                if (defined $hash) {
                        $action = git_get_type($hash);
                        # no type means there is nothing to show; report
                        # that instead of a misleading "Unknown action"
                        # (assumes git_get_type() yields a false value for
                        # a missing object -- TODO confirm)
                        $action or die_error(404, "Object does not exist");
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name");
                        $action or die_error(404, "File or directory does not exist");
                } elsif (defined $project) {
                        $action = 'summary';
                } else {
                        $action = 'project_list';
                }
        }
        if (!defined($actions{$action})) {
                die_error(400, "Unknown action");
        }
        if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
            !$project) {
                die_error(400, "Project needed");
        }
        $actions{$action}->();
}
1143
# Restart the per-request statistics: the start time $t0 (only if
# timing is in use, i.e. $t0 is defined) and the git command counter.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1149
# true until the first request of this process has been served
our $first_request = 1;

# Serve a single request: evaluate the URI and configuration, check the
# load, collect and validate the parameters, then dispatch the action.
sub run_request {
        reset_timer();

        evaluate_uri();

        # configuration and git version are evaluated once per process ...
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }
        # ... unless per-request configuration is asked for: either as a
        # code reference to call, or as a true value meaning "re-read the
        # config file" (which the first request has just done above)
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }
        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1180
# tells run() whether to stop after the current request;
# a plain CGI script serves exactly one
our $is_last_request = sub { 1 };
# optional hooks called by run() around the request loop
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
# class used to create the request object
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: requests are created by CGI::Fast, and
# the process keeps serving until it has handled 100 of them.
sub configure_as_fcgi {
        require CGI::Fast;
        our $CGI = 'CGI::Fast';

        # let each child service 100 requests
        my $served = 0;
        our $is_last_request = sub {
                $served += 1;
                return $served > 100;
        };
}
# Choose the mode of operation from the script name and the command
# line: a name ending in '.fcgi' or the --fastcgi option selects
# FastCGI, and --nproc=N additionally runs N processes under
# FCGI::ProcManager, if that module is available.
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # handler for --nproc: install the process manager hooks
        my $use_proc_manager = sub {
                my ($opt_name, $n_processes) = @_;
                return unless eval { require FCGI::ProcManager; 1; };
                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $n_processes,
                });
                our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1215
# Main loop: set up the mode of operation, then create and serve
# request objects until no more arrive or $is_last_request says stop.
# The optional hooks are called before listening and around each request.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                last REQUEST if ($is_last_request->());
        }

 DONE_GITWEB:
        1;
}
1240
run();

# A pure CGI script serving a single request simply exits here.
# Otherwise the code is wrapped in a subroutine processing requests
# (e.g. mod_perl with ModPerl::Registry, or PSGI with
# Plack::App::WrapCGI), and control goes back to that wrapper.
exit unless defined caller;
return;
1251
1252## ======================================================================
1253## action links
1254
# Build a gitweb URL from the given parameters (long parameter names as
# in %cgi_param_mapping); 'project' defaults to the current project.
# Depending on the 'pathinfo' feature as many parameters as possible
# are put in the path part of the URL, the rest in the query string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot;
                # links without an action are common, so the action has to
                # be checked for definedness before it is compared
                my $is_snapshot = defined $params{'action'} &&
                                  $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly; the ordered list is used
        # (not the hash) so that the query string has a stable order
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1384
1385
1386## ======================================================================
1387## validation, quoting/unquoting and escaping
1388
# Return the given action name if it is one of the keys of %actions,
# undef otherwise (also for an empty or missing name).
sub validate_action {
        my ($name) = @_;
        return undef unless $name;
        return exists $actions{$name} ? $name : undef;
}
1394
# Return the given project name if it may be shown, undef otherwise.
# The name must be a valid pathname naming a directory below
# $projectroot that passes check_export_ok(); with $strict_export it
# must also be found by project_in_list().
sub validate_project {
        my $name = shift || return undef;
        my $path = "$projectroot/$name";

        return undef unless validate_pathname($name);
        return undef unless -d $path;
        return undef unless check_export_ok($path);
        return undef if $strict_export && !project_in_list($name);

        return $name;
}
1406
# Return the given pathname if it is acceptable, undef otherwise.
# Rejected are false values (empty string, "0"), paths with an empty,
# '.' or '..' component, and paths containing a null character.
sub validate_pathname {
        my ($path) = @_;
        return undef unless $path;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # an empty element is refused as well, which catches doubled
        # slashes and leading or trailing ones
        my $bad_component = ($path =~ m!(^|/)(|\.|\.\.)(/|$)!);
        # no null characters
        my $has_null = ($path =~ m!\0!);

        if ($bad_component || $has_null) {
                return undef;
        }
        return $path;
}
1422
# Return the given ref name if it is acceptable, undef otherwise.
# Accepted are full 40-digit hexadecimal object names, and valid
# pathnames that also obey the git-check-ref-format restrictions
# checked below.
sub validate_refname {
        my $input = shift || return undef;

        # textual hashes are O.K.
        # (anchored with \A and \z: a plain '$' would also accept a hash
        # followed by a newline, which would then skip all other checks)
        if ($input =~ m/\A[0-9a-fA-F]{40}\z/) {
                return $input;
        }
        # it must be correct pathname
        $input = validate_pathname($input)
                or return undef;
        # restrictions on ref name according to git-check-ref-format
        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
                return undef;
        }
        return $input;
}
1439
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# A string that is already in character form is returned unchanged;
# octets that are not well-formed UTF-8 are decoded according to
# $fallback_encoding instead.  Returns undef for undef.
sub to_utf8 {
        my $str = shift;
        return undef unless defined $str;

        # utf8::decode() converts in place and returns false, leaving
        # the string alone, when the octets are not well-formed UTF-8;
        # that is the test needed here.  utf8::valid() only checks the
        # internal consistency of the scalar, so it cannot tell whether
        # the fallback encoding is required.
        if (utf8::is_utf8($str) || utf8::decode($str)) {
                return $str;
        } else {
                return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
        }
}
1453
# URI-escape a query parameter value; undef is passed through.
# Unsafe characters are quoted, spaces become '+'.  The slash is kept
# as is even though that is not correct, because quoted slashes look
# too horrible in bookmarks.
sub esc_param {
        my ($value) = @_;
        defined $value
                or return undef;

        $value =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $value =~ tr/ /+/;
        return $value;
}
1463
# URI-escape a string for use in the path_info part of a URL; undef is
# passed through.  The rules differ slightly from those for parameters:
# path_info doesn't treat '+' as space (specially), so both are kept,
# but '?' must be escaped.
sub esc_path_info {
        my ($fragment) = @_;
        defined $fragment
                or return undef;

        $fragment =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

        return $fragment;
}
1474
# Quote unsafe characters in a whole URL; undef is passed through.
# Characters that have a meaning in a URL (such as '?', '&', '=' and
# ';') cannot be quoted here; spaces become '+'.
sub esc_url {
        my ($url) = @_;
        defined $url
                or return undef;

        $url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $url =~ tr/ /+/;
        return $url;
}
1483
# quote unsafe characters in HTML attributes
sub esc_attr {
	# for XHTML conformance escaping '"' to '&quot;' is not enough,
	# so the value gets the complete esc_html() treatment
	my @args = @_;
	return esc_html(@args);
}
1490
# Escape a string for inclusion in HTML: decode it with to_utf8(),
# HTML-escape it, and make control characters visible with quot_cec().
# With a true '-nbsp' option every space becomes '&nbsp;'.
# Returns undef for undefined input.
sub esc_html {
	my ($text, %opts) = @_;

	return undef unless defined $text;

	$text = to_utf8($text);
	$text = $cgi->escapeHTML($text);
	$text =~ s/ /&nbsp;/g if $opts{'-nbsp'};

	# TAB is the only control character that is passed through as is
	$text =~ s|([[:cntrl:]])|(($1 eq "\t") ? $1 : quot_cec($1))|eg;

	return $text;
}
1506
# Escape a filename for inclusion in HTML.  Works like esc_html(), but
# every control character, TAB included, is made visible with
# quot_cec().  With a true '-nbsp' option every space becomes '&nbsp;'.
# Returns undef for undefined input.
sub esc_path {
	my ($path, %opts) = @_;

	return undef unless defined $path;

	$path = to_utf8($path);
	$path = $cgi->escapeHTML($path);
	$path =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$path =~ s|([[:cntrl:]])|quot_cec($1)|eg;

	return $path;
}
1522
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0):
# the string is decoded with to_utf8() and every control character
# except TAB, LF and CR is replaced by its quot_cec() representation.
# Returns undef for undefined input.
sub sanitize {
	my $str = shift;

	return undef unless defined $str;

	$str = to_utf8($str);
	# index() instead of a nested pattern match: a successful inner
	# match would reset $1, and the character that was meant to be
	# kept would be replaced by undef
	$str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
	return $str;
}
1533
# Make control characters "printable", using character escape codes (CEC)
#
# $cntrl is the single character to represent.  Characters without a
# named escape are written as a backslash followed by two hexadecimal
# digits.  Unless the '-nohtml' option is true, the result is wrapped
# in <span class="cntrl">.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# zero-padded, so that e.g. chr(1) is shown as '\01' and not as
	# a backslash followed by a space and '1'
	my $chr = ( (exists $es{$cntrl})
		    ? $es{$cntrl}
		    : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1558
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR)
#
# $cntrl is the single character to represent; the result is a decimal
# character reference.  Unless the '-nohtml' option is true, it is
# wrapped in <span class="cntrl">.
sub quot_upr {
	my $cntrl = shift;
	my %opts = @_;

	my $ord = ord($cntrl);
	# The pictures for the C0 controls sit at U+2400 + code, but DEL
	# (0x7f), which [[:cntrl:]] matches as well, has its picture at
	# U+2421 (SYMBOL FOR DELETE).
	my $codepoint = ($ord == 0x7f) ? 0x2421 : 0x2400 + $ord;

	my $chr = sprintf('&#%04d;', $codepoint);
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1572
# git may return quoted and escaped filenames

# Helper for unquote(): translate the text that followed a backslash
# (one to three octal digits, or a single other character) into the
# character it stands for.
sub unq {
	my ($seq) = @_;

	# octal char sequence
	return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

	my %es = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# C escape sequence, aka character escape code; anything else is
	# a quoted ordinary character and stands for itself
	return exists $es{$seq} ? $es{$seq} : $seq;
}

# Undo the quoting of a filename: a name enclosed in double quotes has
# the quotes removed and its backslash escapes expanded; any other
# name is returned unchanged.
sub unquote {
	my ($name) = @_;

	# only names wrapped in double quotes need unquoting
	if ($name =~ m/^"(.*)"$/) {
		$name = $1;
		$name =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	}

	return $name;
}
1608
# escape tabs (convert tabs to spaces)
#
# Each tab is replaced by as many spaces as are needed to reach the
# next column that is a multiple of 8.
sub untabify {
	my ($text) = @_;

	# Expand one tab per pass, leftmost first, so that $-[0] (the
	# offset of the tab) already reflects all earlier expansions.
	1 while $text =~ s/\t/' ' x (8 - $-[0] % 8)/e;

	return $text;
}
1622
# Count the entries returned by git_get_projects_list() whose 'path'
# equals $project; the result is 0 when the list is empty.
sub project_in_list {
	my ($wanted) = @_;
	my @projects = git_get_projects_list();

	return 0 unless @projects;

	my $hits = grep { $_->{'path'} eq $wanted } @projects;
	return $hits;
}
1628
1629## ----------------------------------------------------------------------
1630## HTML aware string manipulation
1631
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Arguments: string, $len, optional $add_len (default 10) and optional
# $where ('left', 'center' or 'right', default 'right'), which tells
# where the string is cut.  The returned string is decoded by to_utf8().
sub chop_str {
	my $str = shift;
	my $len = shift;
	my $add_len = shift || 10;
	my $where = shift || 'right'; # 'left' | 'center' | 'right'

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# allow only $len chars, but don't cut a word if it would fit in $add_len
	# if it doesn't fit, cut it if it's still longer than the dots we would add

	# when chopping in the middle, distribute $len into left and right part
	# return early if chopping wouldn't make string shorter
	if ($where eq 'center') {
		return $str if ($len + 5 >= length($str)); # filler is length 5
		$len = int($len/2);
	} else {
		return $str if ($len + 4 >= length($str)); # filler is length 4
	}

	# regexps: ending and beginning with word part up to $add_len;
	# /s lets '.' match a newline too, so that strings with embedded
	# newlines do not make the matches below fail
	my $endre = qr/.{$len}\w{0,$add_len}/s;
	my $begre = qr/\w{0,$add_len}.{$len}/s;

	# The results of every match are taken from its return value and
	# checked: after a failed match $1 and $2 would still hold the
	# captures of an earlier, unrelated match.
	if ($where eq 'left') {
		my ($lead, $body) = $str =~ m/\A(.*?)($begre)\z/s
			or return $str;
		$lead = " ..." if length($lead) > 4;
		return "$lead$body";

	} elsif ($where eq 'center') {
		my ($left, $rest) = $str =~ m/\A($endre)(.*)\z/s
			or return $str;
		my ($mid, $right) = $rest =~ m/\A(.*?)($begre)\z/s;
		# when the left part swallowed so much that fewer than $len
		# characters remain, there is nothing left to cut out
		return $str unless defined $right;
		$mid = " ... " if length($mid) > 5;
		return "$left$mid$right";

	} else {
		my ($body, $tail) = $str =~ m/\A($endre)(.*)\z/s
			or return $str;
		$tail = "... " if length($tail) > 4;
		return "$body$tail";
	}
}
1691
# takes the same arguments as chop_str, but also wraps a <span> around the
# result with a title attribute if it does get chopped. Additionally, the
# string is HTML-escaped.
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);
	# chop_str() returns a decoded string; decode the original the same
	# way, or a string with non-ASCII characters would never compare
	# equal and would always be treated as chopped
	$str = to_utf8($str);
	if ($chopped eq $str) {
		return esc_html($chopped);
	} else {
		# the full text goes into the title attribute, with control
		# characters replaced by '?'
		$str =~ s/[[:cntrl:]]/?/g;
		return $cgi->span({-title=>$str}, esc_html($chopped));
	}
}
1706
1707## ----------------------------------------------------------------------
1708## functions returning short strings
1709
# CSS class for given age value (in seconds): "noage" for an undefined
# age, "age0" below two hours, "age1" below two days, "age2" otherwise
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if $age < 60*60*2;
	return "age1"  if $age < 60*60*24*2;
	return "age2";
}
1724
# convert age in seconds to "nn units ago" string
#
# A unit is used once the age is larger than two of that unit; ages of
# two seconds or less give " right now".
sub age_string {
	my ($age) = @_;

	# [ exclusive lower bound, divisors applied in turn, unit name ],
	# largest unit first
	my @scales = (
		[ 60*60*24*365*2,      [ 60, 60, 24, 365 ],      "years"  ],
		[ 60*60*24*(365/12)*2, [ 60, 60, 24, (365/12) ], "months" ],
		[ 60*60*24*7*2,        [ 60, 60, 24, 7 ],        "weeks"  ],
		[ 60*60*24*2,          [ 60, 60, 24 ],           "days"   ],
		[ 60*60*2,             [ 60, 60 ],               "hours"  ],
		[ 60*2,                [ 60 ],                   "min"    ],
		[ 2,                   [],                       "sec"    ],
	);

	foreach my $scale (@scales) {
		my ($bound, $divisors, $unit) = @$scale;
		next unless $age > $bound;

		my $count = $age;
		$count /= $_ foreach @$divisors;
		return int($count) . " $unit ago";
	}

	return " right now";
}
1756
# file type bit patterns used in addition to the S_IF* constants
# imported from Fcntl
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference
#
# True when the file type bits of the (numeric) $mode are S_IFGITLINK.
sub S_ISGITLINK {
	my ($mode) = @_;

	my $type_bits = $mode & S_IFMT();
	return $type_bits == S_IFGITLINK;
}
1768
# convert file mode in octal to symbolic file mode string
#
# The argument is a string of octal digits; the result is a ten
# character string in the style of "ls -l", with 'm' as the type
# letter for a submodule.
sub mode_str {
	my $mode = oct shift;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# git cares only about the executable bit
	return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1790
# convert file mode in octal to file type string
#
# An argument that does not consist of octal digits only is returned
# unchanged.
sub file_type {
	my ($mode) = @_;

	return $mode if $mode !~ m/^[0-7]+$/;

	my $bits = oct $mode;
	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT);
	return "symlink"   if S_ISLNK($bits);
	return "file"      if S_ISREG($bits);
	return "unknown";
}
1813
# convert file mode in octal to file type description string
#
# Like file_type(), except that a regular file with the owner execute
# bit set is described as "executable".  An argument that does not
# consist of octal digits only is returned unchanged.
sub file_type_long {
	my ($mode) = @_;

	return $mode if $mode !~ m/^[0-7]+$/;

	my $bits = oct $mode;
	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT);
	return "symlink"   if S_ISLNK($bits);
	return "unknown"   unless S_ISREG($bits);

	return ($bits & S_IXUSR) ? "executable" : "file";
}
1840
1841
1842## ----------------------------------------------------------------------
1843## functions returning short HTML fragments, or transforming HTML fragments
1844## which don't belong to other sections
1845
# format line of commit message.
#
# The line is HTML-escaped (spaces become &nbsp;), and every word made
# of 8 to 40 hexadecimal digits is turned into a link to the "object"
# action for that id.
sub format_log_line_html {
	my ($line) = @_;

	my $html = esc_html($line, -nbsp=>1);
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{
		my $object_id = $1;
		$cgi->a({-href => href(action=>"object", hash=>$object_id),
					-class => "text"}, $object_id);
	}eg;

	return $html;
}
1858
# format marker of refs pointing to given object

# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
#
# $refs is a hash reference mapping an object id to an array reference of
# ref names, $id is the object to look up.  Returns an HTML fragment, or
# the empty string when no ref points to $id.
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	if (defined $refs->{$id}) {
		foreach my $refname (@{$refs->{$id}}) {
			# Work on a copy: the loop variable aliases the element
			# of the caller's array, and stripping "^{}" from it in
			# place would make a later call for the same id lose
			# the "indirect" marker.
			my $ref = $refname;

			# this code exploits the fact that non-lightweight tags are the
			# only indirect objects, and that they are the only objects for which
			# we want to use tag instead of shortlog as action
			my ($type, $name);
			my $indirect = ($ref =~ s/\^\{\}$//);
			# e.g. tags/v2.6.11 or heads/next
			if ($ref =~ m!^(.*?)s?/(.*)$!) {
				$type = $1;
				$name = $2;
			} else {
				$type = "ref";
				$name = $ref;
			}

			my $class = $type;
			$class .= " indirect" if $indirect;

			my $dest_action = "shortlog";

			if ($indirect) {
				$dest_action = "tag" unless $action eq "tag";
			} elsif ($action =~ /^(history|(short)?log)$/) {
				$dest_action = $action;
			}

			my $dest = "";
			$dest .= "refs/" unless $ref =~ m!^refs/!;
			$dest .= $ref;

			# ref names may contain characters such as '<', '>' and
			# '&', so the link text has to be escaped like every
			# other piece of repository data
			my $link = $cgi->a({
				-href => href(
					action=>$dest_action,
					hash=>$dest
				)}, esc_html($name));

			$markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
				$link . "</span>";
		}
	}

	if ($markers) {
		return ' <span class="refs">'. $markers . '</span>';
	} else {
		return "";
	}
}
1918
# format, perhaps shortened and with markers, title line
#
# $long is the full subject, $short its possibly shortened form, $href
# the link target and $extra an optional HTML fragment appended after
# the link.  When $short is shorter than $long, the link shows $short
# and carries $long (control characters replaced by '?') as its title.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr = (-href => $href, -class => "list subject");
	my $label = $long;

	if (length($short) < length($long)) {
		$long =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($long);
		$label = $short;
	}

	return $cgi->a(\%attr, esc_html($label)) . $extra;
}
1934
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines (currently gravatar only), which
# are free to use it as preferred. Since only one avatar engine is used for any
# given page, there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
#
# The email is lowercased first; the complete url is kept in
# %avatar_cache under the lowercased email.
sub picon_url {
	my $email = lc shift;

	$avatar_cache{$email} ||= do {
		my ($user, $domain) = split('@', $email);
		"http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
		"$domain/$user/" .
		"users+domains+unknown/up/single";
	};

	return $avatar_cache{$email};
}
1956
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
#
# The email is lowercased before it is hashed; $size is appended to
# the cached prefix as the value of the "s" query parameter.
sub gravatar_url {
	my ($email, $size) = @_;
	$email = lc $email;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
				Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
1969
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
#
# Options: -size (a key of %avatar_size, 'default' when missing or
# unknown), -pad_before and -pad_after (put "&nbsp;" before / after
# the image).  Returns the empty string when no avatar url is available.
sub git_get_avatar {
	my ($email, %opts) = @_;

	my $size_name = $opts{-size} || 'default';
	my $size = $avatar_size{$size_name} || $avatar_size{'default'};

	my $url = "";
	if ($git_avatar eq 'gravatar') {
		$url = gravatar_url($email, $size);
	} elsif ($git_avatar eq 'picon') {
		$url = picon_url($email);
	}
	# Other providers can be added by extending the if chain, defining $url
	# as needed. If no variant puts something in $url, we assume avatars
	# are completely disabled/unavailable.
	return "" unless $url;

	my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
	my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

	return $pre_white .
	       qq{<img width="$size" class="avatar" src="} . esc_url($url) .
	       qq{" alt="" />} .
	       $post_white;
}
1998
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype is 'author' or 'committer' and picks both the kind of
# search and the wording of the link title.  When the 'search' feature
# is off, $displaytext is returned unchanged.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	return $displaytext unless gitweb_check_feature('search');

	my $performed = $searchtype eq 'author'    ? "authored"
	              : $searchtype eq 'committer' ? "committed"
	              :                              "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype), class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
2021
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str).
#
# The element content is the avatar (padded after) followed by the
# name, both passed through format_search_author().
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar    = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $content   = format_search_author($co->{'author_name'}, "author",
	                                     $avatar . $name_html);

	return "<$tag class=\"author\">" . $content . "</$tag>";
}
2035
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# The paths in $line are replaced by escaped file names taken from
# $from and $to, which become links when the side has a 'href'.
# Returns a complete <div class="diff header"> element.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# file name of one side behind $prefix, as a link if possible
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = $prefix . esc_path($side->{'file'});
		return $text unless $side->{'href'}; # added or deleted file
		return $cgi->a({-href => $side->{'href'}, -class => "path"}, $text);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2071
# format extended diff header line, before patch itself
#
# Paths of "copy/rename from/to" lines are replaced by escaped file
# names from $from / $to, a trailing six-digit mode gets a description
# of the file type, and the object ids of an "index" line are
# abbreviated to 7 characters.  File names and ids become links when
# the corresponding 'href' is present.  Returns the line followed by
# "<br/>\n".
sub format_extended_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# escaped file name of one side, as a link if the side has a href
	my $path_html = sub {
		my ($side) = @_;
		my $file = esc_path($side->{'file'});
		$file = '' unless defined $file;
		return $file unless $side->{'href'};
		return $cgi->a({-href=>$side->{'href'}, -class=>"path"}, $file);
	};

	# match <path>
	# The substitution removes the path git printed, so the file name
	# is always put back, even without a href; otherwise the line
	# would end up with no path at all.
	if ($line =~ s!^((copy|rename) from ).*$!$1!) {
		$line .= $path_html->($from);
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1!) {
		$line .= $path_html->($to);
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		$line = 'index ';
		my $last = $diffinfo->{'nparents'} - 1;
		foreach my $i (0 .. $last) {
			if ($from->{'href'}[$i]) {
				$line .= $cgi->a({-href=>$from->{'href'}[$i],
				                  -class=>"hash"},
				                 substr($diffinfo->{'from_id'}[$i],0,7));
			} else {
				$line .= '0' x 7;
			}
			# separator
			$line .= ',' if ($i < $last);
		}
		$line .= '..';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                 substr($diffinfo->{'to_id'},0,7));
		} else {
			$line .= '0' x 7;
		}

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff
		my ($from_link, $to_link);
		if ($from->{'href'}) {
			$from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			                     substr($diffinfo->{'from_id'},0,7));
		} else {
			$from_link = '0' x 7;
		}
		if ($to->{'href'}) {
			$to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                   substr($diffinfo->{'to_id'},0,7));
		} else {
			$to_link = '0' x 7;
		}
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		# the ids are data, not patterns: match them literally
		$line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2137
# format from-file/to-file diff header
#
# Produces one <div class="diff from_file"> per from-line (one for an
# ordinary diff, one per parent for a combined diff) followed by a
# single <div class="diff to_file">.  Lines for /dev/null get no extra
# formatting.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my @divs;

	#assert($from_line =~ m/^---/) if DEBUG;
	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit)
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $line = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				my $diff_link =
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$i],
					                     hash_parent_base=>$parents[$i],
					                     file_parent=>$from->{'file'}[$i],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . ($i+1)},
					        $i+1);
				my $file_link =
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
					        esc_path($from->{'file'}[$i]));
				$line = '--- ' . $diff_link . '/' . $file_link;
			}
			push @divs, qq!<div class="diff from_file">$line</div>\n!;
		}

	} else {
		# ordinary (single parent) diff
		my $line = $from_line;
		# no extra formatting for "^--- /dev/null"
		if ($line =~ m!^--- "?a/!) {
			my $path = esc_path($from->{'file'});
			$path = $cgi->a({-href=>$from->{'href'}, -class=>"path"}, $path)
				if $from->{'href'};
			$line = '--- a/' . $path;
		}
		push @divs, qq!<div class="diff from_file">$line</div>\n!;
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	my $line = $to_line;
	# no extra formatting for "^+++ /dev/null"
	if ($line =~ m!^\+\+\+ "?b/!) {
		my $path = esc_path($to->{'file'});
		$path = $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $path)
			if $to->{'href'};
		$line = '+++ b/' . $path;
	}
	push @divs, qq!<div class="diff to_file">$line</div>\n!;

	return join('', @divs);
}
2203
# create note for patch simplified by combined diff
#
# Returns a "diff --cc" header div naming the resulting file (as a
# link to its blob unless the file was deleted) followed by a
# "Simple merge" div.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $file = esc_path($diffinfo->{'to_file'});
	if (!is_deleted($diffinfo)) {
		$file = $cgi->a({-href => href(action=>"blob",
		                               hash_base=>$hash,
		                               hash=>$diffinfo->{'to_id'},
		                               file_name=>$diffinfo->{'to_file'}),
		                 -class => "path"},
		                $file);
	}

	return join('',
		"<div class=\"diff header\">",
		"diff --cc ",
		$file,
		"</div>\n",                           # class="diff header"
		"<div class=\"diff nodifferences\">",
		"Simple merge",
		"</div>\n");                          # class="diff nodifferences"
}
2228
# Classify a line of diff output; returns "chunk_header", "incomplete",
# "ctx", "add", "rem" or the empty string.
#
# $from and $to are optional.  When both are given and $from->{'href'}
# is an array reference, the line belongs to a combined diff and has
# one sign column per element of that array; otherwise one column.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	# ordinary diff
	my $num_sign = 1;
	# combined diff
	if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
		$num_sign = scalar @{$from->{'href'}};
	}

	return "chunk_header" if $line =~ m/^\@\@{$num_sign} /;
	return "incomplete"   if $line =~ m/^\\/;
	# context has to be tested before add/rem, or we would have to
	# use more complicated regexp, for example
	# qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
	return "ctx"          if $line =~ m/^ {$num_sign}/;
	return "add"          if $line =~ m/^[+ ]{$num_sign}/;
	return "rem"          if $line =~ m/^[- ]{$num_sign}/;

	# fallback
	return "";
}
2257
# assumes that $from and $to are defined and correctly filled,
# and that $line holds a line of chunk header for unified diff
#
# The "-start,count" and "+start,count" ranges become links to the
# starting line ("#l<start>") of the corresponding 'href' when it is
# present; the text after the closing "@@" is HTML-escaped and put
# into its own "section" span.
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# the line counts are captured by the pattern but not needed here
	my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	$from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
	                      -class=>"list"}, $from_text)
		if $from->{'href'};
	$to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
	                      -class=>"list"}, $to_text)
		if $to->{'href'};

	return '<span class="chunk_info">@@ ' . $from_text . ' ' . $to_text . ' @@</span>' .
	       '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
}
2281
# Format chunk header line of combined diff as HTML.
#
# Assumes that $from and $to are defined and correctly filled, and that
# $line holds a chunk header of combined diff: a run of '@', the ranges
# separated by spaces, another run of '@', and optional section text.
# $from->{'href'} is indexed per range here; $to->{'href'} is used as is.
# Ranges with a true href are turned into links to their starting line.
sub format_cc_diff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

        # each range is a sign followed by "<start>[,<lines>]";
        # only the starting line is needed, for link anchors
        my @range_text = split(' ', $ranges);
        my @range_start;
        foreach my $range (@range_text) {
                # trailing 0 supplies the default when a part is missing
                my ($start, $nlines) = (split(',', substr($range, 1)), 0);
                push @range_start, $start;
        }

        # the last range is the 'to' side, all the preceding ones are 'from'
        my $to_text  = pop @range_text;
        my $to_start = pop @range_start;

        my $html = "<span class=\"chunk_info\">$prefix ";
        foreach my $i (0 .. $#range_text) {
                my $href = $from->{'href'}[$i];
                my $text = $range_text[$i];
                if ($href) {
                        $text = $cgi->a({-href=>"$href#l$range_start[$i]",
                                         -class=>"list"}, $text);
                }
                $html .= $text;
                $html .= " ";
        }

        my $to_html = $to_text;
        if ($to->{'href'}) {
                $to_html = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                    -class=>"list"}, $to_text);
        }
        $html .= $to_html;

        $html .= " $prefix</span>" .
                 "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
        return $html;
}
2320
# Process one line of patch (diff) body; not to be used for diff headers.
#
# Returns a pair: class of the line, as found by diff_line_class(), and
# the line formatted as HTML (but not wrapped in any element).  Chunk
# headers get dedicated formatting when both $from and $to are given;
# every other line is chomped, untabified and escaped.
sub process_diff_line {
        my ($line, $from, $to) = @_;

        # classification is done on the line as it was passed in
        my $diff_class = diff_line_class($line, $from, $to);

        chomp $line;
        $line = untabify($line);

        if ($from && $to) {
                if ($line =~ m/^\@{2} /) {
                        # chunk header of ordinary (unified) diff
                        my $header = format_unidiff_chunk_header($line, $from, $to);
                        return $diff_class, $header;
                }
                if ($line =~ m/^\@{3}/) {
                        # chunk header of combined diff
                        my $header = format_cc_diff_chunk_header($line, $from, $to);
                        return $diff_class, $header;
                }
        }

        return $diff_class, esc_html($line, -nbsp=>1);
}
2343
# Generate snapshot link(s) for the tree/commit given by $hash, depending
# on how many entries there are in @snapshot_fmts:
#  * none:    returns undef
#  * one:     a single "_snapshot_" link, with format name in its tooltip
#  * several: "snapshot (_tbz2_ _zip_)", i.e. one link per format, each
#             bearing display name of the format
sub format_snapshot_links {
        my ($hash) = @_;
        my $num_fmts = @snapshot_fmts;

        # no formats: there is nothing to link to
        return undef if ($num_fmts == 0);

        if ($num_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                my ($fmt) = @snapshot_fmts;
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        my @links;
        foreach my $fmt (@snapshot_fmts) {
                push @links, $cgi->a({
                        -href => href(
                                action=>"snapshot",
                                hash=>$hash,
                                snapshot_format=>$fmt
                        )
                }, $known_snapshot_formats{$fmt}{'display'});
        }
        return "snapshot (" . join(' ', @links) . ")";
}
2378
2379## ......................................................................
2380## functions returning values to be passed, perhaps after some
2381## transformation, to other functions; e.g. returning arguments to href()
2382
# Return hash to be passed to href() to generate gitweb URL of a feed;
# description of the link is returned under the '-title' key.
#
# Optional argument is the feed format, 'Atom' by default; its lowercased
# form becomes the 'action'.  Returns nothing when no project is selected,
# or when current action is one of tags, heads, forks, tag, search.
sub get_feed_info {
        my $format = shift || 'Atom';
        my %res = (action => lc($format));

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use 'refs/heads/' prefix (fullname) to differentiate
        # from tag links; this is what makes detecting branch links possible.
        # $hash_base is examined first, $hash second.
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                next unless (defined $ref && $ref =~ m!^refs/heads/(.*)$!);
                $branch = $1;
                last;
        }

        # find log type for feed description (title)
        my $title;
        if (defined $file_name) {
                $title  = "history of $file_name";
                $title .= "/" if ($action eq 'tree');
                $title .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $title = "log of $branch";
        } else {
                $title = 'log';
        }

        $res{-title} = $title;
        $res{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
        $res{'file_name'} = $file_name;

        return %res;
}
2418
2419## ----------------------------------------------------------------------
2420## git utility subroutines, invoking git commands
2421
# Return, as a list, beginning of git command line: path to the core git
# executable ($GIT) followed by --git-dir parameter for current $git_dir.
# Every call is counted in $number_of_git_cmds.
sub git_cmd {
        $number_of_git_cmds++;
        return ($GIT, "--git-dir=$git_dir");
}
2427
# Quote the given arguments for passing them to the shell: every argument
# is wrapped in single quotes, with embedded ' and ! characters taken out
# of the quotes and backslash-escaped; arguments are joined with spaces.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $arg (@_) {
                # work on a copy, caller's values must stay intact
                (my $word = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$word'";
        }
        return join(' ', @quoted);
}
2436
# Get HEAD ref of given project as hash; the only argument is the project,
# and the result is whatever git_get_full_hash() gives for 'HEAD'.
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2441
# Resolve object name to its hash; all the arguments (project, object
# name, ...) are handed over to git_get_hash() unchanged.
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2445
# Like git_get_full_hash(), but '--short=7' is appended to the arguments
# handed over to git_get_hash(), where it ends up among rev-parse options.
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2449
# Run 'git rev-parse --verify -q [<options>] <hash>' in given project and
# return first line of its output, without the line terminator; returns
# undef if the command could not be started or printed nothing.
#
# Global $git_dir is pointed at "$projectroot/$project" for the duration
# of the call; previous value is restored afterwards only if it was defined.
sub git_get_hash {
        my ($project, $hash, @options) = @_;
        my $saved_git_dir = $git_dir;
        my $retval;

        # git_cmd() uses $git_dir, so it has to be set before command is built
        $git_dir = "$projectroot/$project";
        my @cmd = (git_cmd(), 'rev-parse',
                   '--verify', '-q', @options, $hash);
        if (open(my $fd, '-|', @cmd)) {
                $retval = <$fd>;
                chomp $retval if defined $retval;
                close $fd;
        }

        $git_dir = $saved_git_dir
                if (defined $saved_git_dir);
        return $retval;
}
2466
# Get type of given object: first line printed by 'git cat-file -t <hash>',
# without the line terminator.  Returns nothing if the command could not
# be started, or if closing the pipe reports failure.
sub git_get_type {
        my ($hash) = @_;

        my @cmd = (git_cmd(), "cat-file", '-t', $hash);
        open(my $fd, "-|", @cmd)
                or return;
        my $type = <$fd>;
        close($fd)
                or return;

        chomp $type;
        return $type;
}
2477
# repository configuration, as cached by git_get_project_config():
# $config_file is "$git_dir/config" of the repository that %config was
# last filled for (empty string before the first read), and %config holds
# variables returned by git_parse_project_config('gitweb')
our $config_file = '';
our %config;
2481
# Store $value under $key in hash referenced by $hash, keeping values that
# are already there: first value for a key is stored directly (not as
# [ <value> ]), second one turns the entry into anonymous array reference
# holding both, and any further value is appended to that array.
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                if (ref $hash->{$key}) {
                        # already multi-valued
                        push @{$hash->{$key}}, $value;
                } else {
                        # second value: promote to array reference
                        $hash->{$key} = [ $hash->{$key}, $value ];
                }
        } else {
                $hash->{$key} = $value;
        }
}
2495
# Return hash of git project configuration, as listed by
# 'git config -z -l' for current $git_dir; optionally limited to some
# section, e.g. 'gitweb'.
#
# $section_regexp, if given, is a regexp (without anchors) that has to
# match section part of variable name, up to the first dot.
# Variables occurring more than once are stored as array reference, see
# hash_set_multi().  Returns nothing if the command could not be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile section filter once per call.  This is as cheap as the /o
        # modifier inside the loop, but unlike /o it does not keep using
        # the pattern of the very first call when called again with
        # another section (or from a persistent interpreter).
        my $section_re = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # with '-z' entries are terminated with NUL character
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # name is separated from value by the first newline;
                # $value stays undefined if there is no newline at all
                my ($key, $value) = split(/\n/, $keyval, 2);

                hash_set_multi(\%config, $key, $value)
                        if (!defined $section_re || $key =~ $section_re);
        }
        close $fh;

        return %config;
}
2518
# Convert config value to boolean.
#
# True are: no value at all (undef), a decimal number greater than zero,
# and 'true' or 'yes' in any letter case; leading and trailing whitespace
# is ignored.  Everything else is false (never an error).
# Returns 1 for true and 0 for false, in any context.
sub config_to_bool {
        my $val = shift;

        return 1 if !defined $val;             # section.key

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        # The number has to be compared numerically: string like '00' is
        # true as far as Perl is concerned, but it is not a number > 0.
        return 1 if ($val =~ /^\d+$/ && $val != 0);   # section.key = 1
        return 1 if ($val =~ /^(?:true|yes)$/i);      # section.key = true
        return 0;
}
2534
# Convert config value to simple decimal number.
#
# Leading and trailing whitespace is stripped first.  A value made of
# digits followed by one of 'k', 'm' or 'g' (in any letter case) is
# multiplied by 1024, 1048576, or 1073741824 respectively; any other
# value is returned as it is (after stripping).
sub config_to_int {
        my $val = shift;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier = (
                'k' =>       1024,
                'm' =>    1048576,
                'g' => 1073741824,
        );

        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
                $unit = lc($unit);
                # unknown unit is treated as 1
                my $factor = exists $multiplier{$unit} ? $multiplier{$unit} : 1;
                return $num * $factor;
        }
        return $val;
}
2554
# Convert config value to array reference, if needed: a reference is
# returned as it is, defined non-reference value is wrapped in a new
# one-element array, and undef gives reference to a new empty array.
sub config_to_multi {
        my $val = shift;

        return $val     if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2561
# Get value of 'gitweb.<key>' configuration variable of current repository.
#
# $key is name of the variable, with or without 'gitweb.' prefix;
# optional $type is 'bool' or 'int' (leading '--' is accepted), any other
# type is ignored.
#
# Returns nothing if $git_dir is not defined, if $key is false or contains
# non-word characters after the prefix is removed, or if the variable is
# not present.  Otherwise returns the stored value as it is (array
# reference for multi-valued variable), 'true' / 'false' for type 'bool',
# or result of config_to_int() for type 'int'.
#
# Parsed configuration is kept in %config, and is read anew whenever
# $config_file does not name the config file of current $git_dir.
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        # only subsection, if exists, is case sensitive,
        # and not lowercased by 'git config -z -l'
        if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
                $key = join(".", lc($1), $2, lc($3));
        } else {
                $key = lc($key);
        }
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                if ($type ne 'bool' && $type ne 'int') {
                        $type = undef;
                }
        }

        # get config
        my $wanted_file = "$git_dir/config";
        if (!defined $config_file ||
            $config_file ne $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $name = "gitweb.$key";
        return unless exists $config{$name};

        # ensure given type
        my $value = $config{$name};
        if (defined $type && $type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return config_to_bool($value) ? 'true' : 'false';
        }
        if (defined $type && $type eq 'int') {
                return config_to_int($value);
        }
        return $value;
}
2607
# Get hash of given path at given ref.
#
# $base is the tree-ish, $path the path inside it (trailing slashes are
# ignored), and optional $type the expected object type, e.g. 'blob'.
#
# Returns undef if $path is false, if there is nothing at $path in $base,
# if closing the pipe reports failure, if ls-tree output does not have
# the expected form, or if the object is not of requested $type.
# Calls die_error() if 'git ls-tree' could not be started.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Capture variables keep values of the last *successful* match,
        # so they must not be used unless this very match succeeded.
        my ($obj_type, $obj_hash);
        if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                ($obj_type, $obj_hash) = ($2, $3);
        } else {
                # unexpected output
                return undef;
        }

        if (defined $type && $type ne $obj_type) {
                # type doesn't match
                return undef;
        }
        return $obj_hash;
}
2634
# Get path of entry with given hash at given tree-ish (ref);
# used to get 'from' filename for combined diff (merge commit) for renames.
#
# Walks output of 'git ls-tree -r -t -z <base>' and returns path of the
# first entry whose object name is $hash.  Returns nothing if $base or
# $hash is false, and undef if the command could not be started or if
# there is no such entry.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # with '-z' entries are terminated with NUL character
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # $hash is matched literally (\Q..\E) and only in the object
                # name column (pattern is anchored), so that a path which
                # happens to contain the hash is not taken for an entry;
                # /s lets the path contain newlines, as '-z' output may
                if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
                        my $path = $1;
                        close $fd;
                        return $path;
                }
        }
        close $fd;
        return undef;
}
2658
2659## ......................................................................
2660## git utility functions, directly accessing git repository
2661
# Get the value of config variable either from file named as the variable
# itself in the repository ($GIT_DIR/$name file), or from gitweb.$name
# configuration variable in the repository config file.
#
# $path is project path relative to $projectroot; note that global
# $git_dir is set to that project and left this way.  If the file can be
# opened its first line is returned, without line terminator (undef for
# empty file); repository config is consulted only if it cannot be opened.
sub git_get_file_or_project_config {
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/$name") {
                return git_get_project_config($name);
        }
        my $conf = <$fd>;
        close $fd;

        chomp $conf if (defined $conf);
        return $conf;
}
2678
# Get description of project at $path (relative to $projectroot): the
# 'description' value as found by git_get_file_or_project_config().
sub git_get_project_description {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'description');
}
2683
# Get category of project at $path (relative to $projectroot): the
# 'category' value as found by git_get_file_or_project_config().
sub git_get_project_category {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'category');
}
2688
2689
# Get content tags of given project, as reference to hash with tag names
# as keys and tag weights as values.  Sets global $git_dir to the project.
#
# supported formats (the first one that is found is used):
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        # only the first line matters; it is undefined
                        # if the file is empty
                        my $val = <$ct>;
                        chomp $val if defined $val;
                        close $ct;

                        # tag name is the basename of the file
                        (my $ctag = $tagfile) =~ s#.*/##;
                        # empty file means weight 1 as well, and must not
                        # end up in a pattern match as undefined value
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2736
# Return reference to hash, where keys are content tags ('ctags'), and
# values are sum of weights of given tag in every project.
# $projects is reference to array of project hashes; weights are taken
# from the hash found under 'ctags' key of each of them.
sub git_gather_all_ctags {
        my $projects = shift;
        my %total;

        for my $pr (@$projects) {
                for my $tag (keys %{$pr->{'ctags'}}) {
                        $total{$tag} += $pr->{'ctags'}{$tag};
                }
        }

        return \%total;
}
2751
# Build a tag cloud out of content tags.
#
# $ctags is reference to hash of tag weights keyed by tag name.  Tags that
# differ only in letter case are merged (weights are summed up), and the
# most heavily weighted spelling is the one displayed.  Tag equal to
# 'by_tag' CGI parameter is marked with <span class="match">.
#
# Returns HTML::TagCloud object if that module can be loaded; otherwise
# reference to hash keyed by lowercased tag, with 'count' (summed weight)
# and 'ctag' (link to the tag, as HTML) for each of them.
sub git_populate_project_tagcloud {
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $name (keys %$ctags) {
                my $weight = $ctags->{$name};
                my $merged = ($ctags_lc{lc($name)} ||= {});

                $merged->{count} += $weight;
                if (!$merged->{topcount} || $merged->{topcount} < $weight) {
                        $merged->{topcount} = $weight;
                        $merged->{topname}  = $name;
                }
        }

        my $cloud;
        my $matched = $cgi->param('by_tag');
        if (eval { require HTML::TagCloud; 1; }) {
                $cloud = HTML::TagCloud->new;
                foreach my $ctag (sort keys %ctags_lc) {
                        my $info = $ctags_lc{$ctag};
                        # Pad the title with spaces so that the cloud looks
                        # less crammed.
                        my $title = esc_html($info->{topname});
                        $title =~ s/ /&nbsp;/g;
                        $title =~ s/^/&nbsp;/g;
                        $title =~ s/$/&nbsp;/g;
                        $title = qq(<span class="match">$title</span>)
                                if (defined $matched && $matched eq $ctag);
                        $cloud->add($title, href(project=>undef, ctag=>$ctag),
                                    $info->{count});
                }
        } else {
                # no HTML::TagCloud: fall back to plain data structure
                $cloud = {};
                foreach my $ctag (keys %ctags_lc) {
                        my $info = $ctags_lc{$ctag};
                        my $title = esc_html($info->{topname}, -nbsp=>1);
                        $title = qq(<span class="match">$title</span>)
                                if (defined $matched && $matched eq $ctag);
                        $cloud->{$ctag}{count} = $info->{count};
                        $cloud->{$ctag}{ctag} =
                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                }
        }
        return $cloud;
}
2797
# Return HTML of tag cloud made by git_populate_project_tagcloud(),
# limited to $count tags.
#
# For HTML::TagCloud object the work is left to its html_and_css() method.
# Otherwise $cloud is reference to hash with 'count' and 'ctag' for each
# tag, and the result is a <div> with comma separated tag links; the <div>
# is centered when there is no current $project.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;

        return $cloud->html_and_css($count)
                if (ref $cloud eq 'HTML::TagCloud');

        # NOTE(review): tags are sorted by ascending count, so the $count
        # tags shown are those with the lowest counts - confirm that this
        # is what is wanted
        my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
        my $align = ($project ? '' : ' align="center"');
        my @links = map { $cloud->{$_}->{'ctag'} } splice(@tags, 0, $count);

        return '<div id="htmltagcloud"' . $align . '>' .
               join(', ', @links) .
               '</div>';
}
2812
# Get list of URLs of project at $path (relative to $projectroot).
# Sets global $git_dir to that project.
#
# URLs are lines of 'cloneurl' file in the repository; if that file
# cannot be opened, values of gitweb.url config variable are used instead.
# Returns list in list context, reference to array otherwise.
sub git_get_project_url_list {
        my $path = shift;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/cloneurl") {
                # no 'cloneurl' file, fall back to repository config
                my $from_config = config_to_multi(git_get_project_config('url'));
                return wantarray ? @$from_config : $from_config;
        }
        my @git_project_url_list = <$fd>;
        chomp @git_project_url_list;
        close $fd;

        return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2826
# Return list of projects, each of them a reference to hash with 'path'
# key (project path relative to projects root) and, if the list comes from
# a file, 'owner' key.  Only projects accepted by check_export_ok() are
# included.
#
# What is done depends on $projects_list:
# * directory: it is searched for repositories, not deeper than
#   $project_maxdepth levels below it
# * file: it is read as projects index, one url-encoded
#   '<path> <owner>' entry per line
#
# Optional $filter ('.git' suffix is ignored) limits the result to
# projects in given subdirectory.  Returns nothing if the index file
# cannot be opened.
sub git_get_projects_list {
        my $filter = shift || '';
        my @list;

        $filter =~ s/\.git$//;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                # Prefix is measured on $dir, i.e. after trailing slashes
                # were removed, because this is what names generated by
                # File::Find begin with.  Measured on $projects_list it
                # would, for a value ending with "/", cut first character
                # off every project path and shift the depth limit by one.
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                # path relative to the searched root:
                                # skip the prefix and the slash following it
                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        # do not look for repositories inside repository
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
2905
# Remove forks from list of projects.
#
# $projects is reference to array of project hashes (with 'path' key).
# A project is considered a fork if its path lies inside directory named
# after another project with '.git' suffix removed, e.g. 'repo/fork.git'
# is a fork of 'repo.git' (given that 'repo' directory exists in
# $projectroot).  Returns list of projects that are not forks.
#
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
# as side effects it sets 'forks' field to list of forks for forked projects
sub filter_forks_from_projects_list {
        my $projects = shift;

        my %trie; # prefix tree of directories (path components)
        # generate trie out of those directories that might contain forks
        foreach my $pr (@$projects) {
                my $path = $pr->{'path'};
                $path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
                next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
                next unless ($path);      # skip '.git' repository: tests, git-instaweb
                next unless (-d "$projectroot/$path"); # containing directory exists
                $pr->{'forks'} = [];      # there can be 0 or more forks of project

                # add to trie
                my @dirs = split('/', $path);
                # walk the trie, until either runs out of components or out of trie
                my $ref = \%trie;
                while (scalar @dirs &&
                       exists($ref->{$dirs[0]})) {
                        $ref = $ref->{shift @dirs};
                }
                # create rest of trie structure from rest of components
                foreach my $dir (@dirs) {
                        $ref = $ref->{$dir} = {};
                }
                # create end marker, store $pr as a data;
                # empty string is used as a key because it cannot
                # be a path component
                $ref->{''} = $pr if (!exists $ref->{''});
        }

        # filter out forks, by finding shortest prefix match for paths
        my @filtered;
 PROJECT:
        foreach my $pr (@$projects) {
                # trie lookup
                my $ref = \%trie;
        DIR:
                foreach my $dir (split('/', $pr->{'path'})) {
                        # end marker is checked before descending, so it is
                        # found only for a proper prefix of the path
                        if (exists $ref->{''}) {
                                # found [shortest] prefix, is a fork - skip it
                                push @{$ref->{''}{'forks'}}, $pr;
                                next PROJECT;
                        }
                        if (!exists $ref->{$dir}) {
                                # not in trie, cannot have prefix, not a fork
                                push @filtered, $pr;
                                next PROJECT;
                        }
                        # If the dir is there, we just walk one step down the trie.
                        $ref = $ref->{$dir};
                }
                # we ran out of trie
                # (shouldn't happen: it's either no match, or end marker)
                push @filtered, $pr;
        }

        return @filtered;
}
2965
# Return those projects from @$projlist that match given criteria, passed
# as named options after the list:
#  * 'tagfilter'  - project has to have this content tag among keys of
#                   its 'ctags' hash (letter case is ignored)
#  * 'searchtext' - project 'path' or 'descr_long' has to match this
#                   text, used as a regular expression
# If both are given, both have to be satisfied; if neither is given,
# the whole list is returned.
#
# note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my ($tagfilter, $searchtext) = @opts{'tagfilter', 'searchtext'};

        # nothing to filter on
        if (!$tagfilter && !$searchtext) {
                return @$projlist;
        }

        my @found;
        foreach my $pr (@$projlist) {

                if ($tagfilter) {
                        # project without tags cannot match
                        next if (ref($pr->{'ctags'}) ne 'HASH');
                        next unless
                                grep { lc($_) eq lc($tagfilter) } keys %{$pr->{'ctags'}};
                }

                if ($searchtext) {
                        # description is examined only if path does not match
                        next if ($pr->{'path'} !~ /$searchtext/ &&
                                 $pr->{'descr_long'} !~ /$searchtext/);
                }

                push @found, $pr;
        }

        return @found;
}
2997
# project path => owner mapping taken from projects index file,
# undefined until git_get_project_list_from_file() is run
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from $projects_list, if that is a file.
# Does nothing if the mapping is defined already.  The mapping is left
# empty if $projects_list is not a file or cannot be opened, so that
# reading is not attempted again.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # file may be unreadable even though it exists;
                # do not try to read from handle that was not opened
                open(my $fd, '<', $projects_list)
                        or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # blank line has no project path in it
                        next unless defined $pr;
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
        return;
}
3020
# Get owner of given project; returns undef if $project is false.
# Sets global $git_dir to that project.
#
# Sources of the information, in order of preference:
#  * projects index file (see git_get_project_list_from_file())
#  * gitweb.owner configuration variable of the repository
#  * whatever get_file_owner() returns for repository directory
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # projects index is read only once
        git_get_project_list_from_file()
                unless (defined $gitweb_project_owner);

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if (exists $gitweb_project_owner->{$project});
        $owner = git_get_project_config('owner')
                unless (defined $owner);
        $owner = get_file_owner("$git_dir")
                unless (defined $owner);

        return $owner;
}
3044
# Get time of last activity in project at $path (relative to
# $projectroot).  Sets global $git_dir to that project.
#
# Asks 'git for-each-ref' for committer info of the entry of refs/heads
# that sorts first by descending committer date, and takes timestamp out
# of it.  Returns ($age, age_string($age)), where $age is number of
# seconds since that timestamp; (undef, undef) if there is no timestamp
# in the output; nothing if the command could not be started or if
# closing the pipe reports failure.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the line is expected to end with '<timestamp> <timezone>'
        unless (defined $most_recent &&
                $most_recent =~ / (\d+) [-+][01]\d\d\d$/) {
                return (undef, undef);
        }
        my $timestamp = $1;
        my $age = time - $timestamp;
        return ($age, age_string($age));
}
3065
# Get remotes of current repository, from output of 'git remote -v'.
#
# Returns hash (reference to hash in scalar context) keyed by remote name;
# each value is a hash where URL is stored under the word that follows it
# in parentheses in 'git remote -v' output, plus 'heads', initially
# an empty list (see fill_remote_heads()).  If $wanted is given, only
# remote of that name is included.  Returns nothing if the command could
# not be started, or if closing the pipe reports failure.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always work (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and stop if
# and when we find what we want.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # check result of open itself: the handle variable
        # is not a reliable indicator of failure
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # cut off everything after remote name; a line of different
                # form is skipped, as $1 and $2 would not belong to it
                next unless $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
                my ($url, $key) = ($1, $2);
                next if $wanted and $remote ne $wanted;

                # 'heads' has to be a reference: empty list in its place
                # would leave hash constructor with odd number of elements
                $remotes{$remote} ||= { 'heads' => [] };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3090
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
# The heads come from git_get_heads_list(undef, "remotes/<name>", ...);
# each head whose name starts with "<remote>/" is stored, with that prefix
# removed from its 'name', in $remotes->{<remote>}{'heads'} (an array ref).
sub fill_remote_heads {
	my $remotes = shift;
	my @heads = map { "remotes/$_" } keys %$remotes;
	my @remoteheads = git_get_heads_list(undef, @heads);
	foreach my $remote (keys %$remotes) {
		# \Q...\E: the remote name is literal text, not a pattern;
		# without quoting, remote "a.b" would also claim "axb/..."
		$remotes->{$remote}{'heads'} = [ grep {
			$_->{'name'} =~ s!^\Q$remote\E/!!
			} @remoteheads ];
	}
}
3103
# Collect refs with 'git show-ref --dereference'.  With a non-empty $type
# only refs matching the pattern "refs/$type" are requested.
# Returns a reference to a hash
#   <40-hex object id> => [ <ref names with the leading "refs/" removed> ]
# or nothing if git cannot be started or close() reports failure.
sub git_get_references {
	my $type = shift || "";
	my %refs;
	# use -- <pattern> if $type
	my @pattern = $type ? ("--", "refs/$type") : ();

	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
		or return;

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
		# the array is autovivified the first time an id is seen
		push @{$refs{$1}}, $2;
	}
	close $fd or return;
	return \%refs;
}
3126
# Run 'git name-rev --tags $hash' and return the part after "tags/" of its
# first output line when that line has the form "$hash tags/<name>".
# Returns undef if $hash is false, if git printed nothing, or if the line
# has any other form; returns nothing if git cannot be started.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# git produced no output at all: nothing to match against
	return undef unless defined $name_rev;

	# \Q...\E: $hash must be matched as literal text
	if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
		return $1;
	} else {
		# catches also '$hash undefined' output
		return undef;
	}
}
3142
3143## ----------------------------------------------------------------------
3144## parse to hash functions
3145
# Break an epoch timestamp into display fields.
#   $epoch - seconds since the epoch
#   $tz    - timezone as "+hhmm" / "-hhmm" (default "-0000")
# Returns a hash with the UTC fields 'hour', 'minute', 'mday', 'day',
# 'month', 'rfc2822', 'mday-time' and 'iso-8601', plus the fields
# 'hour_local', 'minute_local', 'tz_local' and 'iso-tz' computed for the
# given timezone.  A $tz that is not of the form +-hhmm is treated as a
# zero offset (but is still reported verbatim in 'tz_local' and 'iso-tz').
sub parse_date {
	my $epoch = shift;
	my $tz = shift || "-0000";

	my %date;
	my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
	my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
	$date{'hour'} = $hour;
	$date{'minute'} = $min;
	$date{'mday'} = $mday;
	$date{'day'} = $days[$wday];
	$date{'month'} = $months[$mon];
	$date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
	                     $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
	$date{'mday-time'} = sprintf "%d %s %02d:%02d",
	                     $mday, $months[$mon], $hour ,$min;
	$date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
	                     1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

	# offset of the given timezone in seconds; only computed when $tz
	# parses, so a malformed value cannot feed undef into the arithmetic
	my $tz_offset = 0;
	if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
		my $tz_sign = ($1 eq '-' ? -1 : +1);
		$tz_offset = $tz_sign*((($2*60) + $3)*60);
	}
	my $local = $epoch + $tz_offset;
	($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
	$date{'hour_local'} = $hour;
	$date{'minute_local'} = $min;
	$date{'tz_local'} = $tz;
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$year, $mon+1, $mday,
	                          $hour, $min, $sec, $tz);
	return %date;
}
3179
# Read tag object $tag_id with 'git cat-file tag' and return a hash with
# the keys 'id', 'object', 'type', 'name', 'author', 'author_epoch',
# 'author_tz', 'author_name', 'author_email' (as far as the corresponding
# header lines are present) and 'comment' (array ref of the lines that
# follow the header).  Returns nothing if git cannot be started, close()
# reports failure, or the object has no "tag <name>" header line.
sub parse_tag {
	my $tag_id = shift;
	my %tag;
	my @comment;

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
	$tag{'id'} = $tag_id;
	while (my $line = <$fd>) {
		chomp $line;
		# an empty line separates the header from the message
		last if $line eq "";

		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
		} elsif ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
		} elsif ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
		} elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@tag{'author_name', 'author_email'} = ($1, $2);
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
		} elsif ($line =~ m/--BEGIN/) {
			# a line containing "--BEGIN" already belongs to the message
			push @comment, $line;
			last;
		}
	}
	# everything left on the pipe is the message
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag
}
3220
# Parse one NUL-terminated record of 'git rev-list --header' output.
#   $commit_text - the record: "<id> [<parent ids>]" header line, commit
#                  header lines, an empty line, the message indented by
#                  four spaces, and a final "\0" line
#   $withparents - if defined, parents are taken only from the first line
#                  (as printed with --parents); otherwise "parent" header
#                  lines are collected as well
# Returns a hash with 'id', 'tree', 'parents' (array ref), 'parent',
# author_* / committer_* fields, 'title', 'title_short', 'comment' (array
# ref of message lines with the four-space indent removed) and the age_*
# fields derived from 'committer_epoch'.  Returns nothing if the record is
# empty, does not start with a 40-hex id, or has no "tree" line.
sub parse_commit_text {
	my ($commit_text, $withparents) = @_;
	my @commit_lines = split '\n', $commit_text;
	my %co;

	pop @commit_lines; # Remove '\0'

	if (! @commit_lines) {
		return;
	}

	my $header = shift @commit_lines;
	if ($header !~ m/^[0-9a-fA-F]{40}/) {
		return;
	}
	($co{'id'}, my @parents) = split ' ', $header;
	# the loop also ends at the first false line, i.e. the empty line
	# that separates the commit header from the message
	while (my $line = shift @commit_lines) {
		last if $line eq "\n";
		if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
			$co{'tree'} = $1;
		} elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
			push @parents, $1;
		} elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
			$co{'author'} = to_utf8($1);
			$co{'author_epoch'} = $2;
			$co{'author_tz'} = $3;
			if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'author_name'}  = $1;
				$co{'author_email'} = $2;
			} else {
				$co{'author_name'} = $co{'author'};
			}
		} elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
			$co{'committer'} = to_utf8($1);
			$co{'committer_epoch'} = $2;
			$co{'committer_tz'} = $3;
			if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'committer_name'}  = $1;
				$co{'committer_email'} = $2;
			} else {
				$co{'committer_name'} = $co{'committer'};
			}
		}
	}
	if (!defined $co{'tree'}) {
		return;
	};
	$co{'parents'} = \@parents;
	$co{'parent'} = $parents[0];

	foreach my $line (@commit_lines) {
		# work on a copy: the loop variable aliases the array element,
		# so editing it directly would leak the shortened title (and a
		# second indent strip) into the stored comment
		(my $title = $line) =~ s/^    //;
		next if $title eq "";

		$co{'title'} = chop_str($title, 80, 5);
		# remove leading stuff of merges to make the interesting part visible
		if (length($title) > 50) {
			$title =~ s/^Automatic //;
			$title =~ s/^merge (of|with) /Merge ... /i;
			if (length($title) > 50) {
				$title =~ s/(http|rsync):\/\///;
			}
			if (length($title) > 50) {
				$title =~ s/(master|www|rsync)\.//;
			}
			if (length($title) > 50) {
				$title =~ s/kernel.org:?//;
			}
			if (length($title) > 50) {
				$title =~ s/\/pub\/scm//;
			}
		}
		$co{'title_short'} = chop_str($title, 50, 5);
		last;
	}
	if (! defined $co{'title'} || $co{'title'} eq "") {
		$co{'title'} = $co{'title_short'} = '(no commit message)';
	}
	# remove added spaces
	foreach my $line (@commit_lines) {
		$line =~ s/^    //;
	}
	$co{'comment'} = \@commit_lines;

	my $age = time - $co{'committer_epoch'};
	$co{'age'} = $age;
	$co{'age_string'} = age_string($age);
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
	my $commit_date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
	# commits older than two weeks show the date first, recent ones the age
	if ($age > 60*60*24*7*2) {
		$co{'age_string_date'} = $commit_date;
		$co{'age_string_age'} = $co{'age_string'};
	} else {
		$co{'age_string_date'} = $co{'age_string'};
		$co{'age_string_age'} = $commit_date;
	}
	return %co;
}
3318
# Run 'git rev-list --parents --header --max-count=1 $commit_id --' and
# return the hash produced by parse_commit_text() for its first
# NUL-terminated record.  Returns an empty hash if git printed nothing.
# Calls die_error(500, ...) if git cannot be started.
sub parse_commit {
	my ($commit_id) = @_;
	my %co;

	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "rev-list",
		"--parents",
		"--header",
		"--max-count=1",
		$commit_id,
		"--",
		or die_error(500, "Open git-rev-list failed");
	# read in scalar context: a readline placed directly in the argument
	# list is evaluated in list context, so on empty output the literal 1
	# would shift into the commit-text position
	my $commit_text = <$fd>;
	%co = parse_commit_text($commit_text, 1)
		if defined $commit_text;
	close $fd;

	return %co;
}
3337
# Run 'git rev-list --header' starting at $commit_id and parse every
# NUL-terminated record with parse_commit_text().
#   $maxcount - value for --max-count (default 1)
#   $skip     - value for --skip (default 0)
#   $filename - optional path placed after "--"
#   @args     - additional options placed right after --header
# The global @extra_options are passed as well.  Returns the list of
# parsed commits as hash references (array reference in scalar context).
# Calls die_error(500, ...) if git cannot be started.
sub parse_commits {
	my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
	my @cos;

	$maxcount ||= 1;
	$skip ||= 0;

	local $/ = "\0";

	my @rev_list_args = (
		"--header",
		@args,
		"--max-count=$maxcount",
		"--skip=$skip",
		@extra_options,
		$commit_id,
		"--",
	);
	push @rev_list_args, $filename if $filename;

	open my $fd, "-|", git_cmd(), "rev-list", @rev_list_args
		or die_error(500, "Open git-rev-list failed");
	while (my $record = <$fd>) {
		my %co = parse_commit_text($record);
		push @cos, \%co;
	}
	close $fd;

	return wantarray ? @cos : \@cos;
}
3365
# parse line of git-diff-tree "raw" output
# Returns a hash (hash reference in scalar context); which keys are set
# depends on the kind of line:
#  * ordinary diff line: 'from_mode', 'to_mode', 'from_id', 'to_id',
#    'status', 'similarity', 'from_file', 'to_file' and, unless the status
#    is R or C, 'file'
#  * combined diff line: 'nparents', 'from_mode' / 'from_id' / 'status'
#    (array refs, one entry per parent), 'to_mode', 'to_id', 'to_file'
#  * bare 40-hex line: 'commit'
# Any other line gives an empty hash.
sub parse_difftree_raw_line {
	my $line = shift;
	my %res;

	# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
	# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
	if (my @plain = $line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
		my $paths = pop @plain;
		@res{qw(from_mode to_mode from_id to_id status similarity)} = @plain;
		if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
			($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
		} else {
			$res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
		}
	}
	# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
	# combined diff (for merge commit)
	elsif (my @combined = $line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
		my ($colons, $modes, $ids, $status, $path) = @combined;
		$res{'nparents'}  = length($colons);
		# the last mode / id belongs to the result, the others to the parents
		my @modes = split(' ', $modes);
		$res{'to_mode'}   = pop @modes;
		$res{'from_mode'} = \@modes;
		my @ids = split(' ', $ids);
		$res{'to_id'}   = pop @ids;
		$res{'from_id'} = \@ids;
		$res{'status'}  = [ split('', $status) ];
		$res{'to_file'} = unquote($path);
	}
	# 'c512b523472485aef4fff9e57b229d9d243c967f'
	elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
		$res{'commit'} = $1;
	}

	return wantarray ? %res : \%res;
}
3404
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
# A hash reference is handed back unchanged; anything else is passed
# through parse_difftree_raw_line().
sub parsed_difftree_line {
	my $line_or_ref = shift;

	# pre-parsed (or generated by hand)
	return $line_or_ref
		if ref($line_or_ref) eq "HASH";

	return parse_difftree_raw_line($line_or_ref);
}
3417
# parse line of git-ls-tree output
#   $line - one output line
#   %opts - '-l' => true if the line has a size column ('git ls-tree -l'),
#           '-z' => true if the name must be taken verbatim instead of
#                   being passed through unquote()
# Returns a hash (hash reference in scalar context) with the keys 'mode',
# 'type', 'hash', 'name' and, with -l, 'size'.  A line that does not have
# the expected layout gives an empty hash.
sub parse_ls_tree_line {
	my $line = shift;
	my %opts = @_;
	my %res;

	# Capture through the list returned by the match, never through
	# $1..$5: after a failed match those would still hold the values of
	# some earlier, unrelated match.
	my @fields = $opts{'-l'}
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
		? ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s)
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
		: ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);

	if (@fields) {
		my $name = pop @fields; # the name is always the last capture
		@res{qw(mode type hash)} = @fields[0..2];
		$res{'size'} = $fields[3] if $opts{'-l'};
		$res{'name'} = $opts{'-z'} ? $name : unquote($name);
	}

	return wantarray ? %res : \%res;
}
3453
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#   $diffinfo - parsed diff-tree line (hash reference)
#   $from     - filled with 'file' and 'href' of the preimage; for a
#               combined diff both are array refs with one entry per parent
#   $to       - filled with 'file' and 'href' of the postimage
#   @parents  - parent commit ids, used for combined diffs
# An 'href' is left undefined / deleted where there is no blob to link to
# (added file on the "from" side, is_deleted() file on the "to" side).
# Reads the globals $hash_parent and $hash for the ordinary-diff links.
sub parse_from_to_diffinfo {
	my ($diffinfo, $from, $to, @parents) = @_;

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$from->{'file'} = [];
		$from->{'href'} = [];
		fill_from_file_info($diffinfo, @parents)
			unless exists $diffinfo->{'from_file'};
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			# fall back to the result name when this parent has no
			# name of its own recorded
			my $from_file = $diffinfo->{'from_file'}[$i];
			$from_file = $diffinfo->{'to_file'}
				unless defined $from_file;
			$from->{'file'}[$i] = $from_file;

			if ($diffinfo->{'status'}[$i] eq "A") { # new (added) file
				$from->{'href'}[$i] = undef;
			} else {
				$from->{'href'}[$i] = href(action=>"blob",
				                           hash_base=>$parents[$i],
				                           hash=>$diffinfo->{'from_id'}[$i],
				                           file_name=>$from->{'file'}[$i]);
			}
		}
	} else {
		# ordinary (not combined) diff
		$from->{'file'} = $diffinfo->{'from_file'};
		if ($diffinfo->{'status'} eq "A") { # new (added) file
			delete $from->{'href'};
		} else {
			$from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
			                       hash=>$diffinfo->{'from_id'},
			                       file_name=>$from->{'file'});
		}
	}

	$to->{'file'} = $diffinfo->{'to_file'};
	if (is_deleted($diffinfo)) { # file does not exist in result
		delete $to->{'href'};
	} else {
		$to->{'href'} = href(action=>"blob", hash_base=>$hash,
		                     hash=>$diffinfo->{'to_id'},
		                     file_name=>$to->{'file'});
	}
}
3499
3500## ......................................................................
3501## parse to array of hashes functions
3502
# List refs with 'git for-each-ref --sort=-committerdate'.
#   $limit   - if true, at most $limit+1 refs are requested
#   @classes - ref classes, turned into patterns "refs/<class>"
#              (default: 'heads')
# Returns a list (array reference in scalar context) of hash references
# with the keys 'fullname', 'name' (without a leading "refs/heads/" or
# "refs/remotes/"), 'id', 'title', 'epoch' and 'age'.
# Returns nothing if git cannot be started.
sub git_get_heads_list {
	my ($limit, @classes) = @_;
	@classes = ('heads') unless @classes;
	my @patterns = map { "refs/$_" } @classes;
	my @headslist;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
		'--format=%(objectname) %(refname) %(subject)%00%(committer)',
		@patterns
		or return;
	while (my $line = <$fd>) {
		chomp $line;
		# "<id> <refname> <subject>" NUL "<committer> <epoch> <tz>"
		my ($refinfo, $committerinfo) = split(/\0/, $line);
		my ($hash, $name, $title) = split(' ', $refinfo, 3);
		my ($committer, $epoch, $tz) =
			($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

		my %ref_item = (
			'fullname' => $name,
			'id'       => $hash,
			'title'    => $title || '(no commit message)',
			'epoch'    => $epoch,
		);
		$name =~ s!^refs/(?:head|remote)s/!!;
		$ref_item{'name'} = $name;
		$ref_item{'age'}  = "unknown";
		$ref_item{'age'}  = age_string(time - $ref_item{'epoch'})
			if $epoch;

		push @headslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @headslist : \@headslist;
}
3541
# List refs/tags with 'git for-each-ref --sort=-creatordate'.
#   $limit - if true, at most $limit+1 tags are requested
# Returns a list (array reference in scalar context) of hash references
# with the keys 'fullname', 'name' (without "refs/tags/"), 'type', 'id',
# 'reftype', 'refid'; tag objects additionally get 'subject', and tag and
# commit objects get 'epoch' and 'age'.
# Returns nothing if git cannot be started.
sub git_get_tags_list {
	my $limit = shift;
	my @tagslist;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
		'--format=%(objectname) %(objecttype) %(refname) '.
		'%(*objectname) %(*objecttype) %(subject)%00%(creator)',
		'refs/tags'
		or return;
	while (my $line = <$fd>) {
		chomp $line;
		my ($refinfo, $creatorinfo) = split(/\0/, $line);
		my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
		my ($creator, $epoch, $tz) =
			($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

		my %ref_item = (
			'fullname' => $name,
			'type'     => $type,
			'id'       => $id,
		);
		$name =~ s!^refs/tags/!!;
		$ref_item{'name'} = $name;

		my $is_tag_object = ($type eq "tag");
		if ($is_tag_object) {
			# tag object: describe what it points to
			$ref_item{'subject'} = $title;
			$ref_item{'reftype'} = $reftype;
			$ref_item{'refid'}   = $refid;
		} else {
			# any other object: the ref points at it directly
			$ref_item{'reftype'} = $type;
			$ref_item{'refid'}   = $id;
		}

		if ($is_tag_object || $type eq "commit") {
			$ref_item{'epoch'} = $epoch;
			$ref_item{'age'}   = "unknown";
			$ref_item{'age'}   = age_string(time - $ref_item{'epoch'})
				if $epoch;
		}

		push @tagslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @tagslist : \@tagslist;
}
3590
3591## ----------------------------------------------------------------------
3592## filesystem-related functions
3593
# Return the GECOS field of the user owning $path, cut at the first ','
# or ';' and passed through to_utf8().  Returns undef if $path cannot be
# stat()ed or its owner has no passwd entry / GECOS field.
sub get_file_owner {
	my $path = shift;

	# a failed stat() must end here: an undefined uid would be looked up
	# as uid 0 and the owner of that account reported instead
	my $st_uid = (stat($path))[4];
	return undef unless defined $st_uid;

	my $gcos = (getpwuid($st_uid))[6];
	if (!defined $gcos) {
		return undef;
	}
	my $owner = $gcos;
	$owner =~ s/[,;].*$//;
	return to_utf8($owner);
}
3606
# Print the contents of $filename to the currently selected output handle,
# each line passed through to_utf8().  The caller is expected to pass an
# existing file; if it cannot be opened anyway, nothing is printed.
sub insert_file {
	my $filename = shift;

	# do not go on to read from and close a handle that was never opened
	open my $fd, '<', $filename
		or return;
	print map { to_utf8($_) } <$fd>;
	close $fd;
}
3615
3616## ......................................................................
3617## mimetype related functions
3618
# Look up the MIME type for $filename in the mime.types-style file
# $mimemap (lines of "<mimetype> <ext> <ext> ...", '#' starts a comment
# line).  The extension is the text after the last '.' of $filename.
# Returns the MIME type, or undef if $mimemap is not readable, $filename
# has no '.', or the extension is not listed.
sub mimetype_guess_file {
	my $filename = shift;
	my $mimemap = shift;
	-r $mimemap or return undef;

	# take the extension from this very match; $1 of an unchecked match
	# could still hold the capture of some earlier, unrelated match
	my ($ext) = $filename =~ /\.([^.]*)$/
		or return undef;

	my %mimemap;
	open(my $mh, '<', $mimemap) or return undef;
	# lexical loop variable, so the caller's $_ is left alone
	while (my $line = <$mh>) {
		next if $line =~ m/^#/; # skip comments
		my ($mimetype, @exts) = split(/\s+/, $line);
		foreach my $listed (@exts) {
			$mimemap{$listed} = $mimetype;
		}
	}
	close($mh);

	return $mimemap{$ext};
}
3638
# Guess the MIME type of $filename from its extension.  The file named by
# the global $mimetypes_file is consulted first (a relative name is taken
# relative to "$projectroot/$project"), then '/etc/mime.types'.
# Returns undef if $filename contains no '.' or no mapping is found.
sub mimetype_guess {
	my $filename = shift;
	$filename =~ /\./ or return undef;

	my $mime;
	if ($mimetypes_file) {
		# a relative path is relative to project
		my $file = ($mimetypes_file =~ m!^/!)
			? $mimetypes_file
			: "$projectroot/$project/$mimetypes_file";
		$mime = mimetype_guess_file($filename, $file);
	}
	$mime ||= mimetype_guess_file($filename, '/etc/mime.types');
	return $mime;
}
3655
# Determine the MIME type of a blob.
#   $fd       - filehandle of the blob contents (may be false)
#   $filename - name of the blob (may be false)
# A type found by mimetype_guess($filename) wins.  Without a filehandle
# the global $default_blob_plain_mimetype is returned.  Otherwise content
# passing the -T test is 'text/plain', and the rest is classified by a
# few image extensions, falling back to 'application/octet-stream'.
sub blob_mimetype {
	my $fd = shift;
	my $filename = shift;

	if ($filename) {
		my $mime = mimetype_guess($filename);
		$mime and return $mime;
	}

	# just in case
	return $default_blob_plain_mimetype unless $fd;

	return 'text/plain'               if -T $fd;
	return 'application/octet-stream' unless $filename;
	return 'image/png'                if $filename =~ m/\.png$/i;
	return 'image/gif'                if $filename =~ m/\.gif$/i;
	return 'image/jpeg'               if $filename =~ m/\.jpe?g$/i;
	return 'application/octet-stream';
}
3682
# Return the Content-Type value for a blob: $type if given, otherwise the
# result of blob_mimetype($fd, $file_name).  For 'text/plain' the charset
# from the global $default_text_plain_charset is appended when defined.
sub blob_contenttype {
	my ($fd, $file_name, $type) = @_;

	$type ||= blob_mimetype($fd, $file_name);

	my $wants_charset =
		$type eq 'text/plain' && defined $default_text_plain_charset;
	return $type unless $wants_charset;

	return "$type; charset=$default_text_plain_charset";
}
3693
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#   $highlight - false disables guessing altogether
#   $mimetype  - not used by this implementation
#   $file_name - name of the file; a trailing '.in' is ignored
# The basename is looked up in %highlight_basename first, then the text
# after its last '.' in %highlight_ext.
sub guess_file_syntax {
	my ($highlight, $mimetype, $file_name) = @_;
	return undef unless ($highlight && defined $file_name);
	my $basename = basename($file_name, '.in');
	return $highlight_basename{$basename}
		if exists $highlight_basename{$basename};

	# take the extension from this very match; $1 of an unchecked match
	# could still hold the capture of some earlier, unrelated match
	my ($ext) = $basename =~ /\.([^.]*)$/;
	return undef unless $ext;
	return $highlight_ext{$ext}
		if exists $highlight_ext{$ext};

	return undef;
}
3710
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#   $fd        - filehandle of the blob; closed and reopened when
#                highlighting is done
#   $highlight - false disables highlighting
#   $syntax    - syntax name given to the highlighter; undef disables
#                highlighting
# The blob named by the global $hash is piped from 'git cat-file blob'
# into $highlight_bin.  Calls die_error(500, ...) if the pipeline cannot
# be opened.
sub run_highlighter {
	my ($fd, $highlight, $syntax) = @_;
	return $fd unless ($highlight && defined $syntax);

	close $fd;
	my $blob_cmd      = quote_command(git_cmd(), "cat-file", "blob", $hash);
	my $highlight_cmd = quote_command($highlight_bin);
	# the trailing "|" makes open() read from the pipeline's output
	my $pipeline = $blob_cmd." | ".
	               $highlight_cmd.
	               " --replace-tabs=8 --fragment --syntax $syntax |";
	open $fd, $pipeline
		or die_error(500, "Couldn't open file or run syntax highlighter");
	return $fd;
}
3724
3725## ======================================================================
3726## functions printing HTML: header, footer, error page
3727
# Build the page title from the globals $site_name, $project, $action and
# $file_name: "<site>[ - <project>[/<action>[ - <file>]]]".  Each part is
# added only if all parts before it are defined; for the "tree" action a
# trailing "/" is appended to a file name that lacks one.
sub get_page_title {
	my $title = to_utf8($site_name);

	if (defined $project) {
		$title .= " - " . to_utf8($project);

		if (defined $action) {
			$title .= "/$action"; # $action is US-ASCII (7bit ASCII)

			if (defined $file_name) {
				$title .= " - " . esc_path($file_name);
				$title .= "/"
					if ($action eq "tree" && $file_name !~ m|/$|);
			}
		}
	}

	return $title;
}
3745
# Choose the content type for HTML pages: 'application/xhtml+xml' only if
# the Accept header names it explicitly and $cgi->Accept() rates it
# non-zero, otherwise 'text/html'.
sub get_content_type_html {
	# require explicit support from the UA if we are to send the page as
	# 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
	# we have to do this because MSIE sometimes globs '*/*', pretending to
	# support xhtml+xml but choking when it gets what it asked for.
	my $accept = $cgi->http('HTTP_ACCEPT');

	return 'text/html'
		unless defined $accept;
	return 'text/html'
		unless $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/;
	return 'text/html'
		if $cgi->Accept('application/xhtml+xml') == 0;

	return 'application/xhtml+xml';
}
3759
# Print the <link rel="alternate"> elements for the page head.
# With a project selected: for each of RSS and Atom, one link built from
# the parameters returned by get_feed_info() and one more with
# extra_options set to '--no-merges'.  Without a project: links to the
# "project_index" and "opml" actions.
sub print_feed_meta {
	if (defined $project) {
		my %href_params = get_feed_info();
		if (!exists $href_params{'-title'}) {
			$href_params{'-title'} = 'log';
		}

		foreach my $format (qw(RSS Atom)) {
			my $type = lc($format);
			my %link_attr = (
				'-rel' => 'alternate',
				'-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
				'-type' => "application/$type+xml"
			);

			# per-format copy of the parameters: the '--no-merges'
			# option added below must not carry over into the plain
			# link of the next format
			my %params = (%href_params, 'action' => $type);
			$link_attr{'-href'} = href(%params);
			print "<link ".
			      "rel=\"$link_attr{'-rel'}\" ".
			      "title=\"$link_attr{'-title'}\" ".
			      "href=\"$link_attr{'-href'}\" ".
			      "type=\"$link_attr{'-type'}\" ".
			      "/>\n";

			$params{'extra_options'} = '--no-merges';
			$link_attr{'-href'} = href(%params);
			$link_attr{'-title'} .= ' (no merges)';
			print "<link ".
			      "rel=\"$link_attr{'-rel'}\" ".
			      "title=\"$link_attr{'-title'}\" ".
			      "href=\"$link_attr{'-href'}\" ".
			      "type=\"$link_attr{'-type'}\" ".
			      "/>\n";
		}

	} else {
		printf('<link rel="alternate" title="%s projects list" '.
		       'href="%s" type="text/plain; charset=utf-8" />'."\n",
		       esc_attr($site_name), href(project=>undef, action=>"project_index"));
		printf('<link rel="alternate" title="%s projects feeds" '.
		       'href="%s" type="text/x-opml" />'."\n",
		       esc_attr($site_name), href(project=>undef, action=>"opml"));
	}
}
3804
# Print the <link> elements of the page head: stylesheets, the feed links
# of print_feed_meta() (only when $status is '200 OK'), and the favicon
# if $favicon is defined.
sub print_header_links {
	my $status = shift;

	# print out each stylesheet that exist, providing backwards capability
	# for those people who defined $stylesheet in a config file
	my @sheets = defined $stylesheet
		? ($stylesheet)
		: grep { $_ } @stylesheets;
	foreach my $sheet (@sheets) {
		print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
	}

	print_feed_meta()
		if ($status eq '200 OK');
	if (defined $favicon) {
		print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
	}
}
3824
# Print the breadcrumb trail: the home link, then (if a project is
# selected) a link to the project summary, the current action and the
# optional -action_extra text.  When -action_extra is given, the action
# itself is printed as a link.
#   %opts - recognizes -action_extra
sub print_nav_breadcrumbs {
	my %opts = @_;

	print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
	if (defined $project) {
		my $extra = $opts{-action_extra};

		print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
		if (defined $action) {
			my $action_print = defined $extra
				? $cgi->a({-href => href(action=>$action)},
					$action)
				: $action;
			print " / $action_print";
		}
		print " / $extra"
			if defined $extra;
		print "\n";
	}
}
3845
# Print the search form: hidden fields carrying the project and the
# revision to search from, the search type selector, the query text
# field and the "re" (extended regular expression) checkbox.
sub print_search_form {
	# NOTE: the global $searchtext is normalized in place
	$searchtext = "" unless defined $searchtext;

	# prefer $hash_base, then $hash, and fall back to HEAD
	my $search_hash =
		defined $hash_base ? $hash_base :
		defined $hash      ? $hash      :
		                     "HEAD";

	my $action = $my_uri;
	my $use_pathinfo = gitweb_check_feature('pathinfo');
	$action .= "/" . esc_url($project) if $use_pathinfo;

	my $form = $cgi->startform(-method => "get", -action => $action);
	$form .= "<div class=\"search\">\n";
	# with path_info the project is part of the form's action URL;
	# otherwise it has to be sent as the hidden 'p' parameter
	unless ($use_pathinfo) {
		$form .= $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n";
	}
	$form .= $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n";
	$form .= $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n";
	$form .= $cgi->popup_menu(-name => 'st', -default => 'commit',
	                          -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']);
	$form .= $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?"));
	$form .= " search:\n";
	$form .= $cgi->textfield(-name => "s", -value => $searchtext) . "\n";
	$form .= "<span title=\"Extended regular expression\">";
	$form .= $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
	                        -checked => $search_use_regexp);
	$form .= "</span>";
	$form .= "</div>";
	$form .= $cgi->end_form() . "\n";

	print $form;
}
3881
# Print the HTTP header and the opening part of an HTML page: XML/DOCTYPE
# prologue, <head> with its links, optional site header file, the page
# header with logo and breadcrumbs, and (inside a project, when the
# 'search' feature is on) the search form.
#
# Parameters:
#   $status  - HTTP status line; defaults to "200 OK"
#   $expires - value for the -expires argument of $cgi->header()
#   %opts    - '-no_http_header' suppresses the HTTP header; all options
#              are also passed on to print_nav_breadcrumbs()
sub git_header_html {
	my ($status, $expires, %opts) = @_;
	$status ||= "200 OK";

	my $title = get_page_title();
	my $content_type = get_content_type_html();
	if (!$opts{'-no_http_header'}) {
		print $cgi->header(-type=>$content_type, -charset => 'utf-8',
		                   -status=> $status, -expires => $expires);
	}

	my $mod_perl_version = '';
	if ($ENV{'MOD_PERL'}) {
		$mod_perl_version = " $ENV{'MOD_PERL'}";
	}
	print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF

	# relative URLs (stylesheet, favicon, ...) do not resolve correctly
	# under path_info unless an explicit base URL is given
	print "<base href=\"" . esc_url($base_url) . "\" />\n"
		if $ENV{'PATH_INFO'};
	print_header_links($status);

	print to_utf8($site_html_head_string)
		if defined $site_html_head_string;

	print "</head>\n<body>\n";

	insert_file($site_header)
		if (defined $site_header && -f $site_header);

	print "<div class=\"page_header\">\n";
	if (defined $logo) {
		print $cgi->a({-href => esc_url($logo_url),
		               -title => $logo_label},
		              $cgi->img({-src => esc_url($logo),
		                         -width => 72, -height => 27,
		                         -alt => "git",
		                         -class => "logo"}));
	}
	print_nav_breadcrumbs(%opts);
	print "</div>\n";

	my $have_search = gitweb_check_feature('search');
	print_search_form()
		if (defined $project && $have_search);
}
3940
# Print the closing part of an HTML page: the footer (project description
# and RSS/Atom links inside a project, OPML/TXT links otherwise), the
# optional timing information, the optional site footer file, the
# JavaScript includes and the closing </body></html>.
sub git_footer_html {
	my $feed_class = 'rss_logo';

	print "<div class=\"page_footer\">\n";
	if (!defined $project) {
		# no project selected: links to the site-wide lists
		print $cgi->a({-href => href(project=>undef, action=>"opml"),
		              -class => $feed_class}, "OPML") . " ";
		print $cgi->a({-href => href(project=>undef, action=>"project_index"),
		              -class => $feed_class}, "TXT") . "\n";
	} else {
		my $descr = git_get_project_description($project);
		print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
			if defined $descr;

		my %href_params = get_feed_info();
		# no feed information for this view: mark the links as generic
		$feed_class .= ' generic' unless %href_params;
		$href_params{'-title'} ||= 'log';

		foreach my $format ('RSS', 'Atom') {
			$href_params{'action'} = lc($format);
			print $cgi->a({-href => href(%href_params),
			              -title => "$href_params{'-title'} $format feed",
			              -class => $feed_class}, $format)."\n";
		}
	}
	print "</div>\n"; # class="page_footer"

	if (defined $t0 && gitweb_check_feature('timed')) {
		print "<div id=\"generating_info\">\n";
		print 'This page took <span id="generating_time" class="time_span">' .
		      tv_interval($t0, [ gettimeofday() ]) .
		      ' seconds </span> and <span id="generating_cmd">' .
		      $number_of_git_cmds .
		      "</span> git commands  to generate.\n";
		print "</div>\n"; # id="generating_info"
	}

	insert_file($site_footer)
		if (defined $site_footer && -f $site_footer);

	print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
	if (defined $action && $action eq 'blame_incremental') {
		print qq!<script type="text/javascript">\n!.
		      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
		      qq!           "!. href() .qq!");\n!.
		      qq!</script>\n!;
	} else {
		my ($jstimezone, $tz_cookie, $datetime_class) =
			gitweb_get_feature('javascript-timezone');

		# statements making up the body of the window.onload handler
		my @onload;
		if (gitweb_check_feature('javascript-actions')) {
			push @onload, qq!       fixLinks();\n!;
		}
		if ($jstimezone && $tz_cookie && $datetime_class) {
			push @onload,
				qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!, # in days
				qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
		}

		print qq!<script type="text/javascript">\n!.
		      qq!window.onload = function () {\n!.
		      join('', @onload).
		      qq!};\n!.
		      qq!</script>\n!;
	}

	print "</body>\n" .
	      "</html>";
}
4017
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# The error message is HTML-escaped here; the detailed description is
# printed as-is, so it must already be valid HTML.  Any further arguments
# are options: they are passed on to git_header_html(), and a true
# '-error_handler' makes the sub return to its caller instead of jumping
# to DONE_GITWEB.
#
# A status code that is not listed above is sent with the
# '500 Internal Server Error' status line (the page body still shows the
# code that was passed in).
sub die_error {
	my $status = shift || 500;
	my $error = esc_html(shift) || "Internal Server Error";
	my $extra = shift;
	my %opts = @_;

	my %http_responses = (
		400 => '400 Bad Request',
		403 => '403 Forbidden',
		404 => '404 Not Found',
		500 => '500 Internal Server Error',
		503 => '503 Service Unavailable',
	);
	# git_header_html() replaces a missing status with "200 OK", so an
	# unknown code must never reach it as undef: that would turn the
	# error page into a successful response.
	my $http_status = $http_responses{$status} || $http_responses{500};
	git_header_html($http_status, undef, %opts);
	print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
	if (defined $extra) {
		print "<hr />\n" .
		      "$extra\n";
	}
	print "</div>\n";

	git_footer_html();
	goto DONE_GITWEB
		unless ($opts{'-error_handler'});
}
4061
4062## ----------------------------------------------------------------------
4063## functions printing or outputting HTML: navigation
4064
# Print the "page_nav" navigation bar: the standard views plus any custom
# actions configured through the 'actions' feature, separated by " | ".
#
# Parameters:
#   $current  - name of the current view; shown as plain text, not a link
#   $suppress - name of a standard view to leave out (optional)
#   $head     - hash used for the commit/commitdiff links (and for the
#               shortlog/log links in revision-related views)
#   $treehead, $treebase - 'hash' and 'hash_base' of the tree link
#   $extra    - HTML printed on the second line (pager or formats)
sub git_print_page_nav {
	my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
	$extra = '' unless defined $extra; # pager or formats

	my @navs = grep { !$suppress || $_ ne $suppress }
		qw(summary shortlog log commit commitdiff tree);

	# href() parameters for each navigation entry
	my %arg;
	$arg{$_} = {action=>$_} foreach @navs;
	if (defined $head) {
		$arg{$_}{'hash'} = $head foreach qw(commit commitdiff);
		if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
			$arg{$_}{'hash'} = $head foreach qw(shortlog log);
		}
	}

	$arg{'tree'}{'hash'} = $treehead if defined $treehead;
	$arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

	# custom actions come as a flat list of (label, link, position) triples
	my @actions = gitweb_get_feature('actions');
	my %repl = (
		'%' => '%',
		'n' => $project,         # project name
		'f' => $git_dir,         # project path within filesystem
		'h' => $treehead || '',  # current hash ('h' parameter)
		'b' => $treebase || '',  # hash base ('hb' parameter)
	);
	while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
		# place the new label right after the entry named $pos
		my @placed;
		foreach my $nav (@navs) {
			push @placed, $nav;
			push @placed, $label if $nav eq $pos;
		}
		@navs = @placed;
		# expand the %-placeholders in the link
		$link =~ s/%([%nfhb])/$repl{$1}/g;
		$arg{$label}{'_href'} = $link;
	}

	my @entries;
	foreach my $nav (@navs) {
		if ($nav eq $current) {
			push @entries, $nav;
		} elsif ($arg{$nav}{_href}) {
			push @entries, $cgi->a({-href => $arg{$nav}{_href}}, "$nav");
		} else {
			push @entries, $cgi->a({-href => href(%{$arg{$nav}})}, "$nav");
		}
	}

	print "<div class=\"page_nav\">\n" . join(" | ", @entries);
	print "<br/>\n$extra<br/>\n" .
	      "</div>\n";
}
4114
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes): the current view is shown as plain text, the others as links;
# the remotes view is listed only if the 'remote_heads' feature is enabled
sub format_ref_views {
	my ($current) = @_;

	my @ref_views = ('tags', 'heads');
	if (gitweb_check_feature('remote_heads')) {
		push @ref_views, 'remotes';
	}

	my @entries;
	foreach my $view (@ref_views) {
		push @entries, $view eq $current
			? $view
			: $cgi->a({-href => href(action=>$view)}, $view);
	}
	return join(" | ", @entries);
}
4127
# Return the "first . prev . next" pager as an HTML fragment.
#
# Parameters:
#   $action        - accepted for the callers' sake, not used here
#   $page          - current page number; "first" and "prev" are links
#                    only when it is greater than 0
#   $has_next_link - true if "next" should be a link
sub format_paging_nav {
	my ($action, $page, $has_next_link) = @_;

	my @entries;
	if ($page > 0) {
		push @entries,
			$cgi->a({-href => href(-replay=>1, page=>undef)}, "first"),
			$cgi->a({-href => href(-replay=>1, page=>$page-1),
			         -accesskey => "p", -title => "Alt-p"}, "prev");
	} else {
		push @entries, "first", "prev";
	}

	push @entries, $has_next_link
		? $cgi->a({-href => href(-replay=>1, page=>$page+1),
		           -accesskey => "n", -title => "Alt-n"}, "next")
		: "next";

	return join(" &sdot; ", @entries);
}
4153
4154## ......................................................................
4155## functions printing or outputting HTML: div
4156
# Print a <div class="header"> holding a single link to the given action.
#
# Parameters:
#   $action    - action the link points to; also the link text when no
#                title is given
#   $title     - link text, printed as-is (optional)
#   $hash, $hash_base - added to the link parameters when true
sub git_print_header_div {
	my ($action, $title, $hash, $hash_base) = @_;

	my %args = ('action' => $action);
	if ($hash) {
		$args{'hash'} = $hash;
	}
	if ($hash_base) {
		$args{'hash_base'} = $hash_base;
	}

	my $label = $title ? $title : $action;
	print "<div class=\"header\">\n" .
	      $cgi->a({-href => href(%args), -class => "title"}, $label) .
	      "\n</div>\n";
}
4170
# Return one "metadata_url" table row with $name in the first cell and
# $url in the second; both are inserted as-is, without escaping.
sub format_repo_url {
	my ($name, $url) = @_;

	return join('',
		"<tr class=\"metadata_url\"><td>", $name,
		"</td><td>", $url,
		"</td></tr>\n");
}
4175
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, a file handle passed as *handle, \*handle,
# *handle{IO} or as a handle object, or a function reference. In the latter
# case all following parameters will be taken as argument to the content
# function call.
sub git_print_section {
	my ($div_args, $header_args, $content);
	my $arg = shift;
	if (ref($arg) eq 'HASH') {
		$div_args = $arg;
		$arg = shift;
	}
	if (ref($arg) eq 'ARRAY') {
		$header_args = $arg;
		$arg = shift;
	}
	$content = $arg;

	print $cgi->start_div($div_args);
	git_print_header_div(@{ $header_args || [] });

	# ref() alone cannot recognize file handles reliably: a bare *handle
	# is not a reference at all, and *handle{IO} is blessed into a class
	# whose name depends on the perl version ('IO::Handle' on old perls,
	# 'IO::File' since 5.12).  Look at the underlying type instead.
	require Scalar::Util;
	my $reftype = Scalar::Util::reftype($content) || '';
	my $is_handle = $reftype eq 'GLOB' || $reftype eq 'IO' ||
	                (defined($content) && !ref($content) &&
	                 ref(\$content) eq 'GLOB');

	if (ref($content) eq 'CODE') {
		$content->(@_);
	} elsif (ref($content) eq 'SCALAR') {
		print esc_html($$content);
	} elsif ($is_handle) {
		print <$content>;
	} elsif (!ref($content) && defined($content)) {
		print $content;
	}

	print $cgi->end_div;
}
4213
# Return an HTML fragment for a date: the RFC 2822 time string followed by
# the local time of day in parentheses.
#
# $date is a hashref; the keys read here are 'rfc2822', 'hour_local',
# 'minute_local' and 'tz_local'.
sub format_timestamp_html {
	my ($date) = @_;

	my (undef, undef, $datetime_class) =
		gitweb_get_feature('javascript-timezone');

	# wrap the date in a span with the class configured by the
	# 'javascript-timezone' feature, if there is one
	my $strtime = $date->{'rfc2822'};
	if ($datetime_class) {
		$strtime = qq!<span class="$datetime_class">$strtime</span>!;
	}

	my ($hour, $minute, $tz) =
		@{$date}{'hour_local', 'minute_local', 'tz_local'};
	my $clock = sprintf('%02d:%02d', $hour, $minute);
	# local times before 6:00 get the "atnight" class
	if ($hour < 6) {
		$clock = qq!<span class="atnight">$clock</span>!;
	}

	return "$strtime ($clock $tz)";
}
4234
# Outputs the author name and date in long form, followed by the avatar.
#
# Parameters:
#   $co   - commit hashref; 'author_name', 'author_email', 'author_epoch'
#           and 'author_tz' are read
#   %opts - '-tag' names the enclosing HTML element (default: 'div')
sub git_print_authorship {
	my ($co, %opts) = @_;
	my $tag = $opts{-tag} || 'div';
	my $author = $co->{'author_name'};

	my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
	my $author_link = format_search_author($author, "author", esc_html($author));
	my $timestamp   = format_timestamp_html(\%ad);
	my $avatar      = git_get_avatar($co->{'author_email'}, -pad_before => 1);

	print "<$tag class=\"author_date\">$author_link [$timestamp]$avatar</$tag>\n";
}
4249
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
# Two rows are printed per person: name, email and avatar (spanning both
# rows) in the first one, the timestamp in the second one.
sub git_print_authorship_rows {
	my ($co, @people) = @_;
	@people = ('author', 'committer') unless @people;

	foreach my $who (@people) {
		my $name  = $co->{"${who}_name"};
		my $email = $co->{"${who}_email"};
		my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

		my $name_link  = format_search_author($name, $who, esc_html($name));
		my $email_link = format_search_author($email, $who,
		                                      esc_html("<" . $email . ">"));
		my $avatar     = git_get_avatar($email, -size => 'double');
		my $timestamp  = format_timestamp_html(\%wd);

		print "<tr><td>$who</td><td>$name_link $email_link</td>" .
		      "<td rowspan=\"2\">$avatar</td></tr>\n" .
		      "<tr><td></td><td>$timestamp</td></tr>\n";
	}
}
4277
# Print the "page_path" line: a link to the tree root labelled with the
# project name, followed by the components of a path, each leading
# directory linking to its 'tree' view.
#
# Parameters:
#   $name - path within the repository (optional)
#   $type - 'blob' or 'tree' turns the last component into a link to the
#           'blob_plain' or 'tree' view; anything else prints it as text
#   $hb   - hash_base used for all generated links
sub git_print_page_path {
	my ($name, $type, $hb) = @_;

	print "<div class=\"page_path\">";
	# the project name is escaped like in the breadcrumbs: it is
	# inserted into the page as element content
	print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
	              -title => 'tree root'}, esc_html("[$project]"));
	print " / ";
	if (defined $name) {
		my @dirname = split '/', $name;
		my $basename = pop @dirname;
		my $fullname = '';

		foreach my $dir (@dirname) {
			# test the length, not the truth value: a directory
			# called "0" must still be followed by a separator
			$fullname .= (length($fullname) ? '/' : '') . $dir;
			print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
			                             hash_base=>$hb),
			              -title => $fullname}, esc_path($dir));
			print " / ";
		}
		# the links below point at $name, the path being printed,
		# and not at whatever the global $file_name happens to hold
		if (defined $type && $type eq 'blob') {
			print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
			                             hash_base=>$hb),
			              -title => $name}, esc_path($basename));
		} elsif (defined $type && $type eq 'tree') {
			print $cgi->a({-href => href(action=>"tree", file_name=>$name,
			                             hash_base=>$hb),
			              -title => $name}, esc_path($basename));
			print " / ";
		} else {
			print esc_path($basename);
		}
	}
	print "<br/></div>\n";
}
4315
# Print the lines of a commit message as HTML, one line per <br/>.
#
# Parameters:
#   $log  - arrayref of message lines; NOTE that the title line (on
#           request) and leading empty lines are removed from the
#           caller's array
#   %opts - '-remove_title'     drop the first line of the log
#           '-remove_signoff'   do not print Signed-off-by/Acked-by/Cc lines
#           '-final_empty_line' end the output with a single empty line
#
# Runs of empty lines are collapsed into one, and empty lines following
# a signoff line are not printed.
sub git_print_log {
	my $log = shift;
	my %opts = @_;

	if ($opts{'-remove_title'}) {
		# remove title, i.e. first line of log
		shift @$log;
	}
	# remove leading empty lines
	while (defined $log->[0] && $log->[0] eq "") {
		shift @$log;
	}

	# print log
	my $after_signoff = 0; # only signoff/empty lines seen since a signoff
	my $empty = 0;         # last printed line was empty
	foreach my $line (@$log) {
		if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
			$after_signoff = 1;
			$empty = 0;
			print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n"
				unless $opts{'-remove_signoff'};
			next;
		}

		# print only one empty line
		# do not print empty line after signoff
		if ($line eq "") {
			next if ($empty || $after_signoff);
			$empty = 1;
		} else {
			$empty = 0;
		}
		# the flag is cleared only here, after it has been checked,
		# so that it is still set for the line following a signoff
		$after_signoff = 0;

		print format_log_line_html($line) . "<br/>\n";
	}

	if ($opts{'-final_empty_line'}) {
		# end with single empty line
		print "<br/>\n" unless $empty;
	}
}
4364
# return link target (what link points to): the whole output of
# "git cat-file blob <hash>"; returns nothing if the command cannot be
# started or close() on its pipe reports a failure
sub git_get_link_target {
	my ($hash) = @_;

	open(my $fd, "-|", git_cmd(), "cat-file", "blob", $hash)
		or return;
	# read everything in one go
	my $link_target = do { local $/; <$fd> };
	close($fd)
		or return;

	return $link_target;
}
4382
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# An undefined or empty basedir means the top (root) tree. Path
# components are compared as strings, so a file or directory that is
# named "0" is kept like any other name.
sub normalize_link_target {
	my ($link_target, $basedir) = @_;

	# absolute symlinks (beginning with '/') cannot be normalized
	return if (substr($link_target, 0, 1) eq '/');

	# normalize link target to path from top (root) tree (dir)
	my $path = (defined $basedir && $basedir ne '')
		? $basedir . '/' . $link_target
		: $link_target; # we are in top (root) tree (dir)

	# remove //, /./, and /../
	my @path_parts;
	foreach my $part (split('/', $path)) {
		# discard '.' and ''
		next if ($part eq '' || $part eq '.');
		if ($part eq '..') {
			# link leads outside repository (outside top dir)
			return unless @path_parts;
			pop @path_parts;
		} else {
			push @path_parts, $part;
		}
	}

	return join('/', @path_parts);
}
4422
# print tree entry (row of git_tree), but without encompassing <tr> element
#
# Parameters:
#   $t          - hashref describing the entry; 'mode', 'type', 'hash',
#                 'name' and (optionally) 'size' are read
#   $basedir    - prefix put directly in front of the entry name to build
#                 the file_name of the generated links
#   $hash_base  - hash_base for the links (may be undefined)
#   $have_blame - true if a "blame" link should be shown for blobs
sub git_print_tree_entry {
	my ($t, $basedir, $hash_base, $have_blame) = @_;

	my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
	my $path = "$basedir$t->{'name'}";

	# The format of a table row is: mode list link.  Where mode is
	# the mode of the entry, list is the name of the entry, an href,
	# and link is the action links of the entry.

	print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
	if (exists $t->{'size'}) {
		print "<td class=\"size\">$t->{'size'}</td>\n";
	}

	# action links of the entry, collected per type and printed at the end
	my @links;

	if ($t->{'type'} eq "blob") {
		print "<td class=\"list\">" .
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>$path, %base_key),
			        -class => "list"}, esc_path($t->{'name'}));
		if (S_ISLNK(oct $t->{'mode'})) {
			# NOTE: a target that is false in Perl (empty, or "0")
			# is treated like a target that could not be read
			my $link_target = git_get_link_target($t->{'hash'});
			if ($link_target) {
				my $norm_target = normalize_link_target($link_target, $basedir);
				print " -> " .
				      (defined $norm_target
				       ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
				                                file_name=>$norm_target),
				                  -title => $norm_target}, esc_path($link_target))
				       : esc_path($link_target));
			}
		}
		print "</td>\n";

		push @links,
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>$path, %base_key)},
			        "blob");
		if ($have_blame) {
			push @links,
				$cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
				                       file_name=>$path, %base_key)},
				        "blame");
		}
		if (defined $hash_base) {
			push @links,
				$cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
				                       hash=>$t->{'hash'}, file_name=>$path)},
				        "history");
		}
		push @links,
			$cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
			                       file_name=>$path)},
			        "raw");

	} elsif ($t->{'type'} eq "tree") {
		print "<td class=\"list\">" .
		      $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>$path,
		                             %base_key)},
		              esc_path($t->{'name'})) .
		      "</td>\n";

		push @links,
			$cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
			                       file_name=>$path,
			                       %base_key)},
			        "tree");
		if (defined $hash_base) {
			push @links,
				$cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
				                       file_name=>$path)},
				        "history");
		}

	} else {
		# unknown object: we can only present history for it
		# (this includes 'commit' object, i.e. submodule support)
		print "<td class=\"list\">" .
		      esc_path($t->{'name'}) .
		      "</td>\n";

		if (defined $hash_base) {
			push @links,
				$cgi->a({-href => href(action=>"history",
				                       hash_base=>$hash_base,
				                       file_name=>$path)},
				        "history");
		}
	}

	print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";
}
4515
4516## ......................................................................
4517## functions printing large fragments of HTML
4518
# get pre-image filenames for merge (combined) diff
#
# Sets $diff->{'from_file'} to an array with one slot per parent. A slot
# is filled (via git_get_path_by_hash) only where the status for that
# parent is 'R' or 'C'; all other slots stay undefined.
# Returns the same $diff hashref.
sub fill_from_file_info {
	my ($diff, @parents) = @_;

	my $last = $diff->{'nparents'} - 1;

	# start from an array that already has its final length
	$diff->{'from_file'} = [ ];
	$diff->{'from_file'}[$last] = undef;

	foreach my $i (0 .. $last) {
		my $status = $diff->{'status'}[$i];
		next unless ($status eq 'R' || $status eq 'C');
		$diff->{'from_file'}[$i] =
			git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
	}

	return $diff;
}
4535
# is current raw difftree line of file deletion
#
# A deletion is recognized by an all-zero 'to_id'. Both lengths of the
# null object id are accepted: 40 hex digits (SHA-1) and 64 hex digits
# (SHA-256).
sub is_deleted {
	my $diffinfo = shift;

	my $to_id = $diffinfo->{'to_id'};
	return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4542
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# True when both are defined and name the same 'to_file'.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	my $both_defined = defined $diffinfo && defined $patchinfo;
	return $both_defined
		&& $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4553
4554
# Print the difftree ("files changed") part of a commit-like view as an
# HTML table, one row per raw difftree line.
#
# $difftree - arrayref of raw difftree lines; each one is run through
#             parsed_difftree_line() before use
# $hash     - id of the commit being shown; used as hash_base for links
#             to the post-image (result) side of a change
# @parents  - ids of the parent commits; with more than one parent the
#             combined diff layout is used, otherwise $parents[0] is the
#             hash_base for links to the pre-image side of a change
#
# Reads the file-level $cgi and $action; in the 'commitdiff' action each
# row additionally gets a "patch" link to the anchor "patchN", where N
# counts the rows printed so far.
# Everything is printed; the return value is not meaningful.
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');

        print "<div class=\"list_head\">\n";
        # the number of files is only announced for longer lists
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1; # toggles between "dark" and "light" rows
        my $patchno = 0;   # number of the patch the current row links to
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent, plus flags deciding which
                        # links the trailing cell of the row gets
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # mode details are only computed for a side that exists,
                # i.e. whose mode is not all zeros
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file only exists in the parent, so all links
                        # use $parent as hash_base
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # 'to_id' / 'to_file' name the post-image, which lives
                        # in $hash (not in $parent), same as the link in the
                        # first column and the blame / history links below
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4862
# Print one diff chunk in side-by-side layout.
#
# @_ - list of [ $class, $line ] pairs, where $line is the already
#      formatted HTML of one diff line and $class is one of
#      'chunk_header', 'ctx', 'rem', 'add' or 'incomplete'
#
# Chunk headers are printed as they are.  Runs of context lines are
# printed in both the "old" and the "new" column; runs of removed and/or
# added lines are printed as one "rem", "add" or "chg" block.
# Nothing is printed for an empty list.
sub print_sidebyside_diff_chunk {
        my @chunk = @_;

        return unless @chunk;

        # an incomplete last line might be among removed or added lines,
        # or both, or among context lines: it takes the class of the line
        # right before it
        foreach my $idx (1 .. $#chunk) {
                $chunk[$idx][0] = $chunk[$idx-1][0]
                        if $chunk[$idx][0] eq 'incomplete';
        }

        # wraps the given lines in one column ("old" or "new") of a block
        my $column = sub {
                my ($side, @lines) = @_;
                return join '', "<div class=\"$side\">", @lines, '</div>';
        };

        # accumulators for the run of lines currently being collected
        my (@context, @removed, @added);

        # the trailing empty entry is a guardian: it flushes what is left
        foreach my $entry (@chunk, ["", ""]) {
                my ($class, $line) = @$entry;

                # chunk headers go out right away
                if ($class && $class eq 'chunk_header') {
                        print $line;
                        next;
                }

                my $at_end         = !$class;
                my $starts_change  = $at_end || $class eq 'rem' || $class eq 'add';
                my $starts_context = $at_end || $class eq 'ctx';

                # flush context lines when a rem/add run starts, or at the end
                if (@context && $starts_change) {
                        print '<div class="chunk_block ctx">' .
                              $column->('old', @context) .
                              $column->('new', @context) .
                              '</div>';
                        @context = ();
                }

                # flush rem/add lines when a context run starts, or at the end
                if ((@removed || @added) && $starts_context) {
                        my $kind = 'chg';                # both sides present
                        $kind = 'rem' unless @added;     # pure removal
                        $kind = 'add' unless @removed;   # pure addition

                        my $columns = '';
                        $columns .= $column->('old', @removed) if @removed;
                        $columns .= $column->('new', @added)   if @added;

                        print "<div class=\"chunk_block $kind\">" . $columns . '</div>';
                        @removed = ();
                        @added   = ();
                }

                # guardian reached: everything has been flushed
                last unless $line;

                # collect the line in the accumulator matching its class
                if ($class eq 'rem') {
                        push @removed, $line;
                } elsif ($class eq 'add') {
                        push @added, $line;
                } elsif ($class eq 'ctx') {
                        push @context, $line;
                }
        }
}
4951
# Print a patchset read from a filehandle as HTML, inside one
# <div class="patchset">.
#
# $fd           - filehandle the patch text is read from, line by line
# $diff_style   - 'sidebyside' selects side-by-side output (only for
#                 non-combined diffs); any other value gives inline output
# $difftree     - arrayref of raw difftree lines belonging to the patches;
#                 used to find out which raw line a patch corresponds to
# $hash         - accepted for the caller's convenience, not used here
# @hash_parents - parent commit ids; more than one means combined diff
#
# Each raw difftree line gets a <div class="patch" id="patchN"> (N counted
# from 1), so that "patch" links from the difftree table have a target;
# further patches for the same file are printed as "patch cont".
# If nothing at all was printed, a "Trivial merge" / "No differences
# found" note is printed instead.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;    # index into @$difftree of the current raw line
        my $patch_number = 0; # number of patch <div>s printed so far
        my $patch_line;
        my $diffinfo;
        my $to_name;
        my (%from, %to);
        my @chunk; # for side-by-side diff

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # 'last' skips the 'continue' block, so close here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                if (!defined $patch_line) {
                        # input ended right after the "--- " line, so there
                        # is no "+++ " line to pair it with; close the patch
                        # instead of formatting an undefined line
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
                        my $diff_classes = "diff";
                        $diff_classes .= " $class" if ($class);
                        $line = "<div class=\"$diff_classes\">$line</div>\n";

                        if ($diff_style eq 'sidebyside' && !$is_combined) {
                                # lines are collected per chunk and printed
                                # when the next chunk header shows up
                                if ($class eq 'chunk_header') {
                                        print_sidebyside_diff_chunk(@chunk);
                                        @chunk = ( [ $class, $line ] );
                                } else {
                                        push @chunk, [ $class, $line ];
                                }
                        } else {
                                # default 'inline' style and unknown styles
                                print $line;
                        }
                }

        } continue {
                # runs on 'next PATCH' and when the loop body falls through:
                # print what is left of the last side-by-side chunk
                if (@chunk) {
                        print_sidebyside_diff_chunk(@chunk);
                        @chunk = ();
                }
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
5122
5123# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5124
# Fill in project list info (age, description, owner, ctags, category)
# for each project in the list.
#
# $projlist - arrayref of project hashrefs; each needs a 'path' entry
#
# Projects for which git_get_last_activity() returns nothing are left
# out of the result.  Description, owner and category are only looked up
# when not already defined; ctags only if the 'ctags' feature is enabled,
# category only if grouping by category is turned on.
#
# NOTE: modifies the hashes in $projlist in place, but does not remove
# entries from $projlist itself.
# Returns the list of filled-in project hashrefs.
sub fill_project_list_info {
        my $projlist = shift;

        my $show_ctags = gitweb_check_feature('ctags');
        my @filled;

        foreach my $proj (@$projlist) {
                # no activity info: leave the project out of the result
                my @activity = git_get_last_activity($proj->{'path'})
                        or next;
                @{$proj}{'age', 'age_string'} = @activity;

                unless (defined $proj->{'descr'}) {
                        my $long_descr = git_get_project_description($proj->{'path'}) || "";
                        $long_descr = to_utf8($long_descr);
                        $proj->{'descr_long'} = $long_descr;
                        $proj->{'descr'} = chop_str($long_descr, $projects_list_description_width, 5);
                }

                unless (defined $proj->{'owner'}) {
                        $proj->{'owner'} = git_get_project_owner("$proj->{'path'}") || "";
                }

                $proj->{'ctags'} = git_get_project_ctags($proj->{'path'})
                        if $show_ctags;

                if ($projects_list_group_categories && !defined $proj->{'category'}) {
                        my $category = git_get_project_category($proj->{'path'}) ||
                                       $project_list_default_category;
                        $proj->{'category'} = to_utf8($category);
                }

                push @filled, $proj;
        }

        return @filled;
}
5164
# Returns the projects of the list referenced by $projlist sorted by
# $order, which is one of 'project', 'descr', 'owner' (compared as
# strings) or 'age' (compared as numbers).  For any other $order the
# projects are returned in their original order.
sub sort_projects_list {
        my ($projlist, $order) = @_;

        # maps order name to the project field to compare and how to compare it
        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );

        my $oi = $order_info{$order};
        return @$projlist unless defined $oi;

        my $field = $oi->{'key'};
        my $compare = $oi->{'type'} eq 'str'
                ? sub { $a->{$field} cmp $b->{$field} }
                : sub { $a->{$field} <=> $b->{$field} };

        my @sorted = sort $compare @$projlist;
        return @sorted;
}
5185
# Groups the projects in the $from..$to window of the list referenced by
# $projlist by their 'category' field.  $from defaults to 0; $to defaults
# to, and is capped at, the last index of the list.
# Returns a hash mapping each category to an array reference holding the
# projects belonging to it (in list context), or a reference to that
# hash (in scalar context).
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my %categories;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                push @{ $categories{ $pr->{'category'} } }, $pr;
        }

        return %categories if wantarray;
        return \%categories;
}
5202
# Prints the 'sort by' <th> element built by format_sort_th() for column
# $name: a 'sort by $name' replay link, unless $name is the currently
# selected $order.  $header is the optional column title.
sub print_sort_th {
        my ($name, $order, $header) = @_;
        print format_sort_th($name, $order, $header);
}
5208
# Returns the HTML of a 'sort by' <th> element for column $name.
# $header is the column title and defaults to ucfirst($name).  When $name
# is the currently selected $order the title is plain text; otherwise it
# is a replay link which selects ordering by $name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # already sorted by this column: nothing to link to
        return "<th>$header</th>\n" if $order eq $name;

        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
5225
# Prints one table row per project in the $from..$to window of the list
# referenced by $projlist, alternating the "dark" and "light" row classes
# (starting with "dark").  $from defaults to 0; $to defaults to, and is
# capped at, the last index of the list.
# When $check_forks is true each row starts with an extra cell, which
# holds a "+" marker for projects that have a 'forks' entry.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my @row_class = ('dark', 'light');
        my $row = 0;

        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                my $path = $pr->{'path'};
                # URL of the given action for this project
                my $url_for = sub { href(project=>$path, action=>$_[0]) };

                print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";

                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                my $nforks = scalar @{$pr->{'forks'}};
                                if ($nforks > 0) {
                                        print $cgi->a({-href => $url_for->("forks"),
                                                       -title => "$nforks forks"}, "+");
                                } else {
                                        # nothing to link to, only show the marker
                                        print $cgi->span({-title => "$nforks forks"}, "+");
                                }
                        }
                        print "</td>\n";
                }

                my $name_link = $cgi->a({-href => $url_for->("summary"),
                                         -class => "list"}, esc_html($path));
                my $descr_link = $cgi->a({-href => $url_for->("summary"),
                                          -class => "list", -title => $pr->{'descr_long'}},
                                         esc_html($pr->{'descr'}));
                my $owner = chop_and_escape_str($pr->{'owner'}, 15);
                print "<td>" . $name_link . "</td>\n" .
                      "<td>" . $descr_link . "</td>\n" .
                      "<td><i>" . $owner . "</i></td>\n";

                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                print "<td class=\"". age_class($pr->{'age'}) . "\">" . $age_text . "</td>\n";

                # the "forks" link is only offered for projects with a 'forks' entry
                my @actions = qw(summary shortlog log tree);
                push @actions, "forks" if $pr->{'forks'};
                my @links;
                foreach my $action (@actions) {
                        push @links, scalar($cgi->a({-href => $url_for->($action)}, $action));
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
                      "</tr>\n";
        }
}
5274
# Prints the table of projects (preceded by the tag cloud when the 'ctags'
# feature is enabled) for the list referenced by $projlist.
#   $order     - name of the sort order; falls back to $default_projects_order
#   $from, $to - window of the filtered projects to show; $from defaults
#                to 0, $to defaults to (and is capped at) the last index
#   $extra     - if defined, HTML put in an additional last row of the table
#   $no_header - if true, the row with column headers is not printed
# Forks are only filtered out and marked when the 'forks' feature is
# enabled and neither a tag filter nor a search text is in effect.
# Prints a "No such projects found" note instead of the table when the
# window is empty.
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $cgi->param('by_tag') : undef;
        $check_forks = undef
                if ($tagfilter || $searchtext);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        @projects = fill_project_list_info(\@projects);
        # searching projects require filling to be run before it
        @projects = search_projects_list(\@projects,
                                         'searchtext' => $searchtext,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $searchtext);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds just the window, re-indexed from 0, so
                # group all of it; reusing $from/$to here would skip the first
                # $from projects of the window
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects with empty category get no category header row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5361
# Prints the "log" view entries for the commits in the $from..$to window
# of the list referenced by $commitlist: for each commit a header div
# (age, title, ref markers), links to the commit, commitdiff and tree
# views, the authorship and the commit message.
#   $from, $to - window to show; $from defaults to 0, $to defaults to
#                (and is capped at) the last index of the list
#   $refs      - passed to format_ref_marker() to mark commits with refs
#   $extra     - if true, HTML printed in a "page_nav" div after the entries
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from (not at 0), so that the requested window is honoured
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                # skip empty entries
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5400
# Prints the "shortlog" table: one row per commit in the $from..$to window
# of the list referenced by $commitlist, with date, author, subject (with
# ref markers) and links to the commit, commitdiff, tree and snapshot
# views.  Rows alternate between the "dark" and "light" classes.
#   $from, $to - window to show; $from defaults to 0, $to defaults to
#                (and is capped at) the last index of the list
#   $refs      - passed to format_ref_marker() to mark commits with refs
#   $extra     - if defined, HTML put in an additional last row
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        my @row_class = ('dark', 'light');
        my $row = 0;

        print "<table class=\"shortlog\">\n";
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                my $author_cell = format_author_html('td', \%co, 10);
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      $author_cell . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", $commit_link, $diff_link, $tree_link);

                # snapshot links are appended only when there are any
                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links
                        if defined $snapshot_links;

                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5444
# Prints the "history" table of the path $file_name: one row per commit
# in the $from..$to window of the list referenced by $commitlist, with
# date, author, subject and links to the $ftype view of the path at that
# commit and to the commitdiff.  For blobs, a "diff to current" link is
# added when the blob at that commit differs from $file_hash.
#   $from, $to - window to show; $from defaults to 0, $to defaults to
#                (and is capped at) the last index of the list
#   $refs      - passed to format_ref_marker() to mark commits with refs
#   $extra     - if defined, HTML put in an additional last row
# Uses global variable $hash_base for the "diff to current" link.
# Warning: assumes constant type (blob or tree) during history
sub git_history_body {
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $to > $#{$commitlist});

        my @row_class = ('dark', 'light');
        my $row = 0;

        print "<table class=\"history\">\n";
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                # empty entries produce no row (and do not flip the row class)
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";

                # shortlog:   format_author_html('td', \%co, 10)
                my $author_cell = format_author_html('td', \%co, 15, 3);
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      $author_cell . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $view_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $view_link . " | " . $diff_link;

                if ($ftype eq 'blob') {
                        my $blob_parent = git_get_hash_by_path($commit, $file_name);
                        # only offer a diff when both blobs are known and differ
                        if (defined $file_hash && defined $blob_parent &&
                            $file_hash ne $blob_parent) {
                                my $to_current = $cgi->a({-href => href(action=>"blobdiff",
                                                                        hash=>$file_hash, hash_parent=>$blob_parent,
                                                                        hash_base=>$hash_base, hash_parent_base=>$commit,
                                                                        file_name=>$file_name)},
                                                         "diff to current");
                                print " | " . $to_current;
                        }
                }

                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5504
# Prints the "tags" table: one row per entry in the $from..$to window of
# the list referenced by $taglist, with age, tag name (linked to the
# tagged object), subject, a "tag" self link for tag objects, and links
# depending on the type of the tagged object.  Rows alternate between the
# "dark" and "light" classes.
#   $from, $to - window to show; $from defaults to 0, $to defaults to
#                (and is capped at) the last index of the list
#   $extra     - if defined, HTML put in an additional last row
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$taglist} if (!defined $to || $#{$taglist} < $to);

        my @row_class = ('dark', 'light');
        my $row = 0;

        print "<table class=\"tags\">\n";
        foreach my $idx ($from .. $to) {
                my %tag = %{$taglist->[$idx]};
                my $comment = $tag{'subject'};
                my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

                print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";

                # the age cell stays empty when the entry has no 'age'
                print(defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n" : "<td></td>\n");

                my $name_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                                         -class => "list name"}, esc_html($tag{'name'}));
                print "<td>" . $name_link . "</td>\n" .
                      "<td>";
                if (defined $comment) {
                        print format_subject_html($comment, $comment_short,
                                                  href(action=>"tag", hash=>$tag{'id'}));
                }
                print "</td>\n" .
                      "<td class=\"selflink\">";

                # only tag objects have a "tag" view of their own
                if ($tag{'type'} eq "tag") {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                } else {
                        print "&nbsp;";
                }

                my $target_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
                print "</td>\n" .
                      "<td class=\"link\">" . " | " .
                      $target_link;

                if ($tag{'reftype'} eq "commit") {
                        my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
                        my $log_link = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                        print " | " . $shortlog_link .
                              " | " . $log_link;
                } elsif ($tag{'reftype'} eq "blob") {
                        my $raw_link = $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                        print " | " . $raw_link;
                }

                print "</td>\n" .
                      "</tr>";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5567
# Prints the "heads" table: one row per entry in the $from..$to window of
# the list referenced by $headlist, with age, head name and links to the
# shortlog, log and tree views.  Rows alternate between the "dark" and
# "light" classes.
#   $head      - id of the current head; the name cell of the entry whose
#                'id' equals it gets the "current_head" class.  May be
#                undefined, in which case no entry is marked.
#   $from, $to - window to show; $from defaults to 0, $to defaults to
#                (and is capped at) the last index of the list
#   $extra     - if defined, HTML put in an additional last row
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

        print "<table class=\"heads\">\n";
        my $alternate = 1;
        for (my $i = $from; $i <= $to; $i++) {
                my $entry = $headlist->[$i];
                my %ref = %$entry;
                # $head may be undefined; do not compare against undef
                my $curr = defined $head && $ref{'id'} eq $head;
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td><i>$ref{'age'}</i></td>\n" .
                      ($curr ? "<td class=\"current_head\">" : "<td>") .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                               -class => "list name"},esc_html($ref{'name'})) .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
                      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5605
# Display a single remote block: a table with the URL(s) of the remote,
# followed by the list of its heads.
#   $remote - name of the remote (used for the "..." link)
#   $rdata  - hash reference with the 'heads', 'fetch' and 'push' entries
#             of the remote; 'fetch' and 'push' may be undefined
#   $limit  - if defined, maximum index of heads to show; when there are
#             more heads than that, a "..." link to the remote is added
#   $head   - passed on to git_heads_body() to mark the current head
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # a single "URL" row is enough when both URLs are the same;
                # $push may be undefined, so check it before comparing
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5639
# Display a list of remote names with the respective fetch and push URLs
#   $remotedata - hash reference mapping remote name to a hash reference
#                 with the (possibly undefined) 'fetch' and 'push' URLs
#   $limit      - if true and smaller than the number of remotes, only
#                 the first $limit remotes (sorted by name) are shown,
#                 followed by a "..." link to the full list
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        # truncate the list to the first $limit remotes
        $#remotes = $limit - 1 if $limited;

        # iterate over the names themselves: testing the truth of a shifted
        # name would end the loop early at a remote named e.g. "0"
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # URLs that are not known are shown as plain text instead of links
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
5683
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#   $remotedata - hash reference mapping remote name to its data
#   $limit      - if true and smaller than the number of remotes, only
#                 the list of remote names is shown; otherwise it is
#                 passed on to git_remote_block() for each remote
#   $head       - passed on to git_remote_block()
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # go through the remotes sorted by name, like git_remotes_list()
                # does, so that sections come out in a stable order (hash order
                # is unspecified) and no 'each' iterator is kept open on
                # %$remotedata while the section callbacks run
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
5700
# Prints the page with results of searching commits by commit message,
# author or committer (selected by global $searchtype) for global
# $searchtext, starting from global $hash.  Results are shown 100 per
# page; global $page selects the page.
# Takes the parsed commit (as a hash) the search was started from; its
# 'tree' and 'title' are used for the page navigation and header.
sub git_search_message {
        my %co = @_;

        # option of the git command which selects what is matched
        my %grep_option = (
                'commit'    => "--grep=",
                'author'    => "--author=",
                'committer' => "--committer=",
        );
        my $greptype = $grep_option{$searchtype};
        $greptype .= $searchtext;

        # ask for one commit more than fits on a page, to know whether
        # there is a next page
        my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $match_mode);

        my $paging_nav = "first &sdot; prev";
        if ($page > 0) {
                my $first_link = $cgi->a({-href => href(-replay=>1, page=>undef)},
                                         "first");
                my $prev_link = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                $paging_nav = $first_link . " &sdot; " . $prev_link;
        }

        my $next_link = '';
        if (@commitlist > 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
                $paging_nav .= " &sdot; $next_link";
        } else {
                $paging_nav .= " &sdot; next";
        }

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        my $nothing_found = ($page == 0 && !@commitlist);
        if ($nothing_found) {
                print "<p>No match.</p>\n";
        } else {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        }

        git_footer_html();
}
5750
# Prints the page with results of the "pickaxe" search: commits found by
# running git log with -S for global $searchtext (treated as a regexp
# when global $search_use_regexp is set), each with the list of files
# reported for it.
# Takes the parsed commit (as a hash) the search was started from; its
# 'tree' and 'title' are used for the page navigation and header.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        my @pickaxe_opts = ("-S$searchtext");
        push @pickaxe_opts, '--pickaxe-regex' if $search_use_regexp;
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', @pickaxe_opts
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";

        # from here on %co holds the commit whose row is currently open
        undef %co;

        # closes the file list cell of the currently open commit row, if
        # there is one, and adds the cell with links for that commit
        my $finish_commit_row = sub {
                return unless %co;
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        my @row_class = ('dark', 'light');
        my $row = 0;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # a new commit starts: finish previous one, open a new row
                        $finish_commit_row->();

                        print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";

                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        my $subject_link =
                                $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                        -class => "list subject"},
                                        chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $subject_link;
                } elsif (defined $set{'to_id'}) {
                        # an all-zero id means there is no resulting blob to link to
                        next if ($set{'to_id'} =~ m/^0{40}$/);

                        my $file_link =
                                $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                       hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                        -class => "list"},
                                        "<span class=\"match\">" . esc_path($set{'file'}) . "</span>");
                        print $file_link .
                              "<br/>\n";
                }
        }
        close $fd;

        # finish last commit
        $finish_commit_row->();

        print "</table>\n";

        git_footer_html();
}
5833
# Show the results of a "grep" search: run git-grep over the tree of the
# given commit and list the matching lines, grouped by file.
#
# Parameters:
#   %co - commit data as a flat key/value list; the 'id', 'tree' and 'title'
#         entries are used here.
#
# Reads the file-level $searchtext, $search_use_regexp, $search_regexp, $hash
# and $cgi.  At most 1001 lines of git-grep output are rendered; if more are
# available a "listing trimmed" note is printed.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $trimmed = 0;
        my $lastfile = '';
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                if ($matches++ > 1000) {
                        # only flag trimming when a line is really being dropped
                        $trimmed = 1;
                        last;
                }
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        # the name is reported as "<tree>:<path>"; drop the tree
                        # prefix so binary hits use the same path as text hits
                        $file =~ s/^\Q$co{'tree'}\E://;
                        $binary = 1;
                } else {
                        # "<tree>:<path>:<line number>:<text>"
                        (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
                }
                if ($file ne $lastfile) {
                        # compare with '' explicitly: a file named "0" is false
                        print "</td></tr>\n" if ($lastfile ne '');
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        # link to the file as it is in the searched commit
                        print "<td class=\"list\">".
                                $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                       file_name=>$file),
                                        -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # non-greedy lead, so the first match on the line is the
                        # one that gets highlighted
                        if ($ltext =~ m/^(.*?)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                       file_name=>$file).'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno))
                                . ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile ne '') {
                print "</td></tr>\n";
                if ($trimmed) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
5910
# Print the "commit_search" table: one row per commit with its age, author,
# linked title and every comment line that matches $search_regexp.
#
# Parameters:
#   $commitlist - reference to an array of commit hash references
#   $from       - first index to show (defaults to 0)
#   $to         - last index to show (clamped to the end of the list)
#   $extra      - optional HTML printed in a final full-width row
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        my $last_index = $#{$commitlist};
        $to = $last_index if (!defined $to || $last_index < $to);

        print "<table class=\"commit_search\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row ^= 1;
                print "<tr class=\"$row_class\">\n";

                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                # show each matching comment line with the match highlighted
                foreach my $line (@{ $co{'comment'} }) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        # shorten the match, then split what is left of an
                        # 80-column budget (capped at 30) between both sides
                        $match = chop_str($match, 70, 5, 'center');
                        my $contextlen = int((80 - length($match))/2);
                        if ($contextlen > 30) {
                                $contextlen = 30;
                        }
                        $lead  = esc_html(chop_str($lead,  $contextlen, 10, 'left'));
                        $trail = esc_html(chop_str($trail, $contextlen, 10, 'right'));
                        $match = esc_html($match);

                        print "$lead<span class=\"match\">$match</span>$trail<br />";
                }

                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit");
                my $diff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $commit_link . " | " . $diff_link . " | " . $tree_link .
                      "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5970
5971## ======================================================================
5972## ======================================================================
5973## actions
5974
# Action: print the list of projects, preceded by the optional $home_text
# include file and a project search form.
#
# Reads the 'order' input parameter; only the exact values none, project,
# descr, owner and age are accepted, anything else gets a 400 error.
sub git_project_list {
        my $order = $input_params{'order'};
        # anchored, so that e.g. "page" is not accepted because it contains "age"
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        # start_form, not the deprecated startform alias that newer CGI.pm
        # releases no longer provide
        print $cgi->start_form(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6000
# Action: print the list of forks of the current $project.
#
# Reads the 'order' input parameter; only the exact values none, project,
# descr, owner and age are accepted, anything else gets a 400 error.
sub git_forks {
        my $order = $input_params{'order'};
        # anchored, so that e.g. "page" is not accepted because it contains "age"
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6018
# Action: emit a plain-text project index, one "<path> <owner>" line per
# project, with both fields percent-encoded.
sub git_project_index {
        my @projects = git_get_projects_list();
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                # look the owner up only when the project entry lacks one
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                my @fields = ($pr->{'path'}, $pr->{'owner'});
                foreach my $field (@fields) {
                        # quote as in CGI::Util::encode, but keep the slash,
                        # and use '+' for ' '
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$fields[0] $fields[1]\n";
        }
}
6045
# Action: print the project summary page -- a metadata table (description,
# owner, last change, URLs, optional tag cloud), the optional README.html,
# and shortened shortlog / tags / heads / remotes / forks sections.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata = $remote_heads ? git_get_remotes_list() : ();

        my @forklist;
        if (gitweb_check_feature('forks')) {
                # find forks of a project
                @forklist = git_get_projects_list($project);
                # filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        # Returns a "..." link to the given action when a list has entries
        # past index 15, and undef otherwise.
        my $more_link = sub {
                my ($last_index, $target_action) = @_;
                return $last_index <= 15 ? undef :
                       $cgi->a({-href => href(action=>$target_action)}, "...");
        };

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        if (!@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        # only the first printed URL row carries the "URL" label
        my $url_tag = "URL";
        foreach my $git_url (grep { $_ } @url_list) {
                print format_repo_url($url_tag, $git_url);
                $url_tag = "";
        }

        # Tag cloud
        if (gitweb_check_feature('ctags')) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme) {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file($readme);
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist = $head ? parse_commits($head, 17) : ();
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $more_link->($#commitlist, "shortlog"));
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $more_link->($#taglist, "tags"));
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $more_link->($#headlist, "heads"));
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $more_link->($#forklist, "forks"),
                                      'no_header');
        }

        git_footer_html();
}
6159
# Action: print the page for the tag object named by $hash -- the tagged
# object with links, the authorship rows when the tag records an author, and
# the tag message.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both links go to the tagged object; they differ in label and class
        my $object_link =
                $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                        $tag{'object'});
        my $type_link =
                $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                        $tag{'type'});
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $object_link . "</td>\n" .
              "<td class=\"link\">" . $type_link . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if (defined($tag{'author'}));
        print "</table>\n\n" .
              "</div>\n";

        print "<div class=\"page_body\">";
        foreach my $line (@{ $tag{'comment'} }) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6194
# Shared implementation of the blame views.
#
# Parameter: the output format (optional, defaults to 'porcelain'):
#   'porcelain'   - ordinary blame page built from "git blame -p"
#   'incremental' - page listing the file contents; the noscript message
#                   states it needs JavaScript
#   'data'        - plain-text "git blame --incremental" output, terminated
#                   by an "END" line
# A 'porcelain' request with a true 'js' CGI parameter is handled as
# 'incremental'.
#
# Reads the file-level $file_name, $hash_base, $hash, $project and $action,
# and may assign $hash_base, $hash and $action.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }
        my $incremental = ($format eq 'incremental');
        my $data_only   = ($format eq 'data');

        # permissions
        die_error(403, "Blame view not allowed")
                unless gitweb_check_feature('blame');

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (defined $hash) {
                $ftype = git_get_type($hash);
                die_error(400, "Object is not a blob")
                        if ($ftype !~ "blob");
        } else {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        }

        # pick the git command for this format:
        #   incremental - file contents (as base)
        #   data        - git-blame --incremental
        #   otherwise   - git-blame --porcelain
        my ($tool, @git_args) =
                $incremental ? ('git-cat-file',
                                'cat-file', 'blob', $hash) :
                $data_only   ? ('git-blame --incremental',
                                "blame", "--incremental", $hash_base, "--", $file_name) :
                               ('git-blame --porcelain',
                                "blame", '-p', $hash_base, '--', $file_name);
        open my $fd, "-|", git_cmd(), @git_args
                or die_error(500, "Open $tool failed");

        # incremental blame data returns early
        if ($data_only) {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $chunk = <$fd>) {
                        print $chunk;
                }
                close $fd
                        or print "ERROR $!\n";

                my $trailer = 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        $trailer .= ' '.
                                    tv_interval($t0, [ gettimeofday() ]).
                                    ' '.$number_of_git_cmds;
                }
                print $trailer;
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $blob_link =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob");
        my $blame_link = $incremental
                ? $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                          "blame") . " (non-incremental)"
                : $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                          "blame") . " (incremental)";
        my $history_link =
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history");
        my $head_link =
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        my $formats_nav =
                join(" | ", $blob_link, $blame_link, $history_link, $head_link);
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($incremental) {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        if ($incremental) {
                print qq!<div id="progress_info">... / ...</div>\n!;
        }
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($incremental) {
                # contents of a file: every row gets the first color and
                # empty commit / line-number links
                my $color_class = $rev_color[$current_color];
                my $linenr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        print join('',
                                qq!<tr id="l$linenr" class="$color_class">!,
                                qq!<td class="sha1"><a href=""> </a></td>!,
                                qq!<td class="linenr">!,
                                qq!<a class="linenr" href="">$linenr</a></td>!);
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        my $meta = ($metainfo{$full_rev} ||= { 'nprevious' => 0 });

                        # read "<key> [<value>]" lines up to the tab-prefixed
                        # line, which holds the contents of the blamed line
                        my $data;
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        my ($key, $value) = ($1, $2);
                                        # keep the first value seen for a key
                                        $meta->{$key} = $value
                                                unless exists $meta->{$key};
                                }
                                $meta->{'nprevious'}++
                                        if ($data =~ /^previous /);
                        }

                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};

                        # a header with a group size starts a new group of
                        # lines: move on to the next color
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my @tr_classes = ($rev_color[$current_color]);
                        push @tr_classes, 'boundary'
                                if (exists $meta->{'boundary'});
                        push @tr_classes, 'no-previous'
                                if ($meta->{'nprevious'} == 0);
                        push @tr_classes, 'multiple-previous'
                                if ($meta->{'nprevious'} > 1);
                        my $tr_class = join(' ', @tr_classes);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";

                        if ($group_size) {
                                # commit cell, printed once per group
                                my $cell_attrs = " title=\"". esc_html($author) . ", $date\"";
                                $cell_attrs .= " rowspan=\"$group_size\""
                                        if ($group_size > 1);
                                print "<td class=\"sha1\"" . $cell_attrs . ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }

                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to blame at the parent commit
                        # and parent file name when known, else at this commit
                        my $linenr_commit = $full_rev;
                        if (exists($meta->{'parent'})) {
                                $linenr_commit = $meta->{'parent'};
                        }
                        my $linenr_filename;
                        if (exists($meta->{'file_parent'})) {
                                $linenr_filename = $meta->{'file_parent'};
                        } else {
                                $linenr_filename = unquote($meta->{'filename'});
                        }
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="blame_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6424
# Action: blame view in the default format of git_blame_common().
sub git_blame {
        return git_blame_common();
}
6428
# Action: blame view in the 'incremental' format of git_blame_common().
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6432
# Action: blame output in the 'data' format of git_blame_common().
sub git_blame_data {
        return git_blame_common('data');
}
6436
# Action: print the page listing the tags of the current $project.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
        git_print_header_div('summary', $project);

        # the table is printed only when there is at least one tag
        my @tagslist = git_get_tags_list();
        git_tags_body(\@tagslist) if @tagslist;

        git_footer_html();
}
6449
# Action: print the page listing the heads of the current $project.
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
        git_print_header_div('summary', $project);

        # the table is printed only when there is at least one head
        my @headslist = git_get_heads_list();
        git_heads_body(\@headslist, $head) if @headslist;

        git_footer_html();
}
6462
# Action used both for the single remote view and for the list of all the
# remotes; the remote to show, if any, comes from the 'hash' input parameter.
sub git_remotes {
        die_error(403, "Remote heads view is disabled")
                unless gitweb_check_feature('remote_heads');

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        defined $remotedata
                or die_error(500, "Unable to get remote information");

        if (!%$remotedata) {
                my $reason = defined $remote ?
                        "Remote $remote not found" :
                        "No remotes found";
                die_error(404, $reason);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        my $ref_view = $remote ? '' : 'remotes';
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($ref_view));

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        } else {
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }

        git_footer_html();
}
6495
# Action: send the raw contents of a blob.
#
# Parameter: $type - content type to suggest (optional); the type actually
#                    sent is whatever blob_contenttype() returns for it.
#
# The blob is $hash or, when that is undefined, the one found for $file_name
# in $hash_base (falling back to the project's head).  An Expires header of
# one day is sent only when $hash was given as a 40-digit hex id.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # the name goes inside a quoted header parameter: backslash-escape
        # the two characters that would otherwise end or corrupt the quoting
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain; textual <type>/<subtype>+xml likewise
        # (the subtype needs the "+" quantifier, otherwise only one-letter
        # subtypes could ever match)
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                # $1 is whatever followed the type, e.g. a charset parameter
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and write it out without the :utf8 output layer
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6557
# Show a blob as an HTML page ('blob' action).
#
# Works on the request globals $hash, $hash_base and $file_name.  When no
# $hash was given it is looked up from $file_name in $hash_base (or, without
# a $hash_base, in the project's head).  A request that names the blob by a
# full 40-digit hex id gets an expiry of one day passed to git_header_html().
#
# Content whose mimetype is neither text/* nor gif/png/jpeg and which tests
# as binary (-B) is handed over to git_blob_plain().  Images are shown
# through an <img> tag that points at the blob_plain view; everything else
# is printed line by line with numbered anchors, run through the highlighter
# when guess_file_syntax() yields a syntax.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        # $file_name is undefined when the blob is addressed by hash only;
        # keep the message text but do not interpolate undef into it
        my $shown_name = defined $file_name ? $file_name : '';
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $shown_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable commit: print an empty navigation bar and the bare hash
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                print qq! src="! .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        } else {
                # the link back to this page is the same for every line,
                # so build and escape it once instead of once per line
                my $self_href = esc_attr(href(-replay => 1));
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, $self_href, $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
6650
# Show a tree as an HTML table of its entries ('tree' action).
#
# Works on the request globals $hash, $hash_base and $file_name.
# $hash_base defaults to "HEAD"; a missing $hash is looked up from
# $file_name in $hash_base, or is $hash_base itself when no file name was
# given.  Dies with 404 when no tree hash can be determined or when
# reading the output of git-ls-tree fails.
#
# When $file_name names a subdirectory, the first table row is a '..' link
# to the parent directory.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # ls-tree -z terminates every entry with NUL
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # $hash_base is not a usable commit: forget it, so that no
                # links relative to it are generated below
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        # rows alternate between the "dark" and "light" classes, dark first
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                # An empty result means the parent is the top-level tree, which
                # is addressed without a file name.  Compare against '' rather
                # than testing truth, so that a parent directory literally
                # named "0" is kept.
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
6760
# Build the "<project>-<version>" name used for a snapshot of $hash.
#
# The project part is the last path component of $project with a trailing
# ".git" (or "/.git") removed and control characters replaced by '?'.
# The version part depends on the form of $hash:
#   - all hex digits:   the short hash, if $hash is longer than 7 characters
#                       and is a prefix of the full hash; else $hash itself
#   - refs/tags/NAME:   NAME
#   - anything else:    the name (without refs/heads/ or refs/remotes/)
#                       followed by '-' and the short hash
# Slashes in the version part are turned into dots.
#
# Returns the name twice in list context, once in scalar context.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $base = to_utf8($project);
        $base =~ s,([^/])/*\.git$,$1,;
        $base = basename($base);
        # control characters have no place in a file name
        $base =~ s/[[:cntrl:]]/?/g;

        my $version = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # looks like an object id: abbreviate it when it really is one
                my $full_hash = git_get_full_hash($project, $hash);
                $version = git_get_short_hash($project, $hash)
                        if ($full_hash =~ /^$hash/ && length($hash) > 7);
        } elsif (my ($tag) = $hash =~ m!^refs/tags/(.*)$!) {
                # a tag name is descriptive enough on its own
                $version = $tag;
        } else {
                # branches and everything else get the short hash appended
                if (my ($branch) = $hash =~ m!^refs/(?:heads|remotes)/(.*)$!) {
                        $version = $branch;
                }
                $version = $version . '-' . git_get_short_hash($project, $hash);
        }
        # hierarchical branch names: foo/bar -> foo.bar
        $version =~ tr!/!.!;

        # name = project-version_string
        my $snapshot = join '-', $base, $version;

        return ($snapshot, $snapshot) if wantarray;
        return $snapshot;
}
6797
# Send a snapshot archive of $hash to the client ('snapshot' action).
#
# The format comes from the 'snapshot_format' input parameter and defaults
# to the first entry of @snapshot_fmts.  Dies with
#   403 when snapshots are off, or the format is disabled or not offered,
#   400 when the format is malformed or unknown, or $hash names a blob,
#   404 when the object does not exist,
#   500 when the archive command cannot be started.
#
# The archive is produced by "git archive", piped through the format's
# compressor when it defines one, and copied to STDOUT in raw mode.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the archiver before anything is sent: if this fails, the
        # error page must not follow an already printed "200 OK" header.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # quote '"' and '\' for use inside the quoted filename parameter
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # Copy in fixed-size chunks; the archive is binary data, so reading
        # it "line by line" into one list would hold all of it in memory.
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6845
# Common page skeleton for log-like views.
#
# Parameters:
#   $fmt_name   - name of the view; passed to format_paging_nav() and
#                 git_print_page_nav()
#   $body_subr  - code reference that prints the list of commits; called as
#                 $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                              $file_name, $file_hash, $ftype)
#   $base       - revision to list; defaults to the project's head
#   $parent     - optional; when given, "$parent..$base" is listed
#   $file_name  - optional path; limits the listing to that path
#                 (with --full-history)
#   $file_hash  - optional object id of $file_name; when missing it is
#                 taken from the first listed commit that has the path
#
# Requests 101 entries from parse_commits() at offset 100 * $page; more
# than 100 results produce a "next" link.  Dies with 500 when a file name
# was given but the type of its object cannot be determined, and with 404
# when $base cannot be parsed as a commit in that case.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # List context, as in git_commitdiff: take the first value of the
        # feature.  NOTE(review): a scalar-context call may not yield the
        # configured limit if the feature value is returned as a list.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                # the title is emitted as HTML, so the project name is escaped
                # like every other title passed to git_print_header_div()
                git_print_header_div('summary', esc_html($project));
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6919
# 'log' action: the generic log page with git_log_body() printing the
# commits, listing $hash (limited to "$hash_parent..$hash" when a parent
# was given).
sub git_log {
        my @revision_range = ($hash, $hash_parent);
        git_log_generic('log', \&git_log_body, @revision_range);
}
6924
# 'commit' action: show one commit with its header fields, its log
# message and the list of files it changed.
#
# The commit is $hash, falling back to $hash_base and then "HEAD".  Dies
# with 404 when it cannot be parsed or when reading the git-diff-tree
# output fails, and with 500 when git-diff-tree cannot be started.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash);
        %co or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # link to a commit, labelled with the first 7 characters of its id
        my $short_commit_link = sub {
                my ($id) = @_;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav = '(parent: ' . $short_commit_link->($parent) . ')';
        } else {
                # merge commit
                my @links = map { $short_commit_link->($_) } @$parents;
                $formats_nav = '(merge: ' . join(' ', @links) . ')';
        }
        $formats_nav .= " | " .
                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                        "patch")
                if (gitweb_check_feature('patches') && @$parents <= 1);

        $parent = "--root" unless defined $parent;

        # raw list of changes: against the only parent (or --root) for an
        # ordinary commit, in combined (-c) form for a merge
        my @diff_tree_cmd = (
                git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--");
        open my $fd, "-|", @diff_tree_cmd
                or die_error(500, "Open git-diff-tree failed");
        chomp(my @difftree = <$fd>);
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }
        print "<div class=\"title_text\">\n<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

        # "tree" row; the cell with the links is closed only after the
        # optional snapshot links have been added to it
        my $tree_href = href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
        print "<tr><td>tree</td><td class=\"sha1\">" .
              $cgi->a({-href => $tree_href, class => "list"}, $co{'tree'}) .
              "</td><td class=\"link\">" .
              $cgi->a({-href => $tree_href}, "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td></tr>\n";

        # one "parent" row per parent commit
        foreach my $par (@$parents) {
                my $commit_href = href(action=>"commit", hash=>$par);
                my $diff_href =
                        href(action=>"commitdiff", hash=>$hash, hash_parent=>$par);
                print "<tr><td>parent</td><td class=\"sha1\">" .
                      $cgi->a({-href => $commit_href, class => "list"}, $par) .
                      "</td><td class=\"link\">" .
                      $cgi->a({-href => $commit_href}, "commit") .
                      " | " .
                      $cgi->a({-href => $diff_href}, "diff") .
                      "</td></tr>\n";
        }
        print "</table></div>\n";

        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7038
# 'object' action: find out what kind of object is being asked for and
# redirect (302) to the view named after its type.
#
# The object is defined by:
# - hash or hash_base alone
# - hash_base and file_name
#
# Dies with 404 when the object, the base object or the path does not
# exist, with 500 when git-ls-tree cannot be started, and with 400 when
# neither of the two forms above applies.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the command printed no type
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");
                # never redirect to an undefined action
                defined $type
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7085
# 'blobdiff' action: show the difference between two versions of a blob.
#
# Parameter:
#   $format - 'html' (default) for a page, 'plain' for a text/plain patch;
#             anything else dies with 400
#
# Only "new style" requests, which carry both $hash_base and
# $hash_parent_base, are served.  The blob is identified either by
# $file_name (optionally with $file_parent) or by a full 40-digit $hash
# that is looked up among the "to" ids of the raw diff.  Missing
# parameters die with 400, an ambiguous specification dies with 400, an
# empty diff dies with 404, and a request without both bases dies with 404.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ m/^[0-9a-fA-F]{40}$/) {
                        # try to find filename from $hash; the whole value has
                        # to be an object id, since it is matched against the
                        # "to" id column of the raw diff below

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status code, as in every other die_error() call
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # quote '"' and '\' for use inside the quoted filename
                # parameter, the same way git_snapshot does
                (my $save_as = "$file_name.patch") =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $save_as . '"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # Up to and including the "+++" line, replace object ids that
                # stand in for path names by the real (escaped) file names;
                # the ids are matched literally, hence \Q...\E.
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is copied through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7220
# 'blobdiff_plain' action: the blob diff in its 'plain' format.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
7224
# Navigation fragment for switching between the diff styles.
#
# It is meant to be appended to navigation that already exists, which is
# why every entry, including the first, is preceded by " | ": the result
# reads "| foo | bar" rather than "foo | bar".
#
# $diff_style is the style in use (default 'inline'); it is shown as plain
# text, the other style as a link that replays the current request with
# diff_style changed.  For a combined diff ($is_combined true) there is
# nothing to choose and the empty string is returned.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # styles in display order, and the label shown for each of them
        my @order = ('inline', 'sidebyside');
        my %label_for = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my $nav = '';
        foreach my $style (@order) {
                my $entry;
                if ($style eq $diff_style) {
                        $entry = $label_for{$style};
                } else {
                        $entry = $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                         $label_for{$style});
                }
                $nav .= " | " . $entry;
        }
        return $nav;
}
7245
# Show the changes introduced by a commit (or between two commits) in one
# of three formats, selected by the -format parameter:
#   'html'  - (default) navigable page built from git-diff-tree output
#   'plain' - text/plain diff preceded by mail-like headers
#   'patch' - text/plain git-format-patch output; refused with a 403 error
#             unless the 'patches' feature yields a true value
# With -format => 'patch', a true -single parameter limits the output to
# one patch when no explicit parent was requested.
#
# Works on the global request state ($hash, $hash_base, $hash_parent,
# $project, %input_params); $hash and $hash_parent may be given defaults.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        # the value of the 'patches' feature is also used below as the
        # maximum number of patches to emit
        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                # the "patch" link is offered only for non-merge commits
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of them
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit: offer a link to the other combined format
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                #
                # '-c' and '--cc' select a combined diff format; they are not
                # revisions and must never end up in a "parent..commit" range,
                # so they count as "no explicit parent" here.
                my $range_parent = $hash_parent;
                if (defined $range_parent &&
                    ($range_parent eq '-c' || $range_parent eq '--cc')) {
                        $range_parent = undef;
                }

                my @commit_spec = ();
                if ($range_parent) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$range_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                # print the log only if there is more than one comment line
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                # mail-like header block in front of the diff
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit parent (or with a combined diff
                # selector) the diff is shown against all parents
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # slurp the rest of the command output in one go
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7473
# 'commitdiff_plain' action: the commitdiff rendered in the 'plain' format.
sub git_commitdiff_plain {
        return git_commitdiff('-format', 'plain');
}
7477
7478# format-patch-style patches
# 'patch' action: commitdiff in the 'patch' format with -single set.
sub git_patch {
        my %options = (
                -format => 'patch',
                -single => 1,
        );
        return git_commitdiff(%options);
}
7482
# 'patches' action: commitdiff in the 'patch' format, without -single.
sub git_patches {
        return git_commitdiff('-format', 'patch');
}
7486
# 'history' action: delegates to the generic log view, using
# git_history_body as the body printer and passing the base commit,
# the parent base, the file name and the object hash from the request.
sub git_history {
        my $body_printer = \&git_history_body;

        return git_log_generic(
                'history', $body_printer,
                $hash_base, $hash_parent_base,
                $file_name, $hash
        );
}
7492
# 'search' action: verifies that the requested kind of search is enabled,
# fills in defaults for the global request parameters ($searchtype, $hash,
# $page) and hands the starting commit to the matching search routine.
# Errors are reported through die_error.
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        die_error(403, "Search is disabled")
                unless gitweb_check_feature('search');
        # pickaxe may take all resources of your box and run for several minutes
        # with every query - so decide by yourself how public you make this feature
        if ($searchtype eq 'pickaxe' && !gitweb_check_feature('pickaxe')) {
                die_error(403, "Pickaxe search is disabled");
        }
        # grep search might be potentially CPU-intensive, too
        if ($searchtype eq 'grep' && !gitweb_check_feature('grep')) {
                die_error(403, "Grep search is disabled");
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        # search from the project's head unless a starting point was given
        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => routine performing that search
        my %search_sub_for = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );

        my $search_sub = $search_sub_for{$searchtype};
        if (defined $search_sub) {
                $search_sub->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
7537
# 'search_help' action: prints a page describing the available search
# types.  The 'grep' and 'pickaxe' entries are included only when the
# corresponding feature is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general introduction and the always-available 'commit' search
        print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        if (gitweb_check_feature('grep')) {
                print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        if (gitweb_check_feature('pickaxe')) {
                print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7581
# 'shortlog' action: delegates to the generic log view, using
# git_shortlog_body as the body printer for the range given by
# $hash and $hash_parent.
sub git_shortlog {
        my $body_printer = \&git_shortlog_body;

        return git_log_generic('shortlog', $body_printer, $hash, $hash_parent);
}
7586
7587## ......................................................................
7588## feeds (RSS, Atom; OPML)
7589
# Generate a web feed of recent commits.  The only argument is the feed
# format, 'rss' or 'atom' (the default); anything else is rejected with
# a 400 error.
#
# The feed follows the history of $hash (HEAD when unset), optionally
# limited to $file_name.  A conditional request (If-Modified-Since) is
# answered with "304 Not Modified" when the newest commit is not newer and
# a date parsing module could be loaded; for HEAD requests only the HTTP
# header is sent.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                %latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # use whichever date parsing module is installed;
                        # with neither, $since stays undefined and the
                        # full response is sent
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title contains request parameters and is written into XML
        # element content below, so it has to be escaped
        $title = esc_html($title);

        my $descr = git_get_project_description($project);
        if (!defined $descr) {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        $descr = esc_html($descr);
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for (my $i = 0; $i <= $#commitlist; $i++) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files; a commit whose diff-tree
                # cannot be read is left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                # the entry body is the same for both formats: the commit
                # message followed by a list of changed files
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        $line = esc_html($line);
                        print "$line\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
7845
# 'rss' action: the commit feed in RSS format.
sub git_rss {
        my $feed_format = 'rss';
        return git_feed($feed_format);
}
7849
# 'atom' action: the commit feed in Atom format.
sub git_atom {
        my $feed_format = 'atom';
        return git_feed($feed_format);
}
7853
# 'opml' action: export the list of projects as an OPML document with one
# RSS feed outline per project.  Fails with a 404 error when there are no
# projects; projects without a resolvable head commit are left out.
sub git_opml {
        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        # the site name goes into XML element content, so characters such
        # as '&' or '<' in it must be escaped to keep the document valid
        my $title = esc_html($site_name);
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;
                my $head = git_get_head_hash($proj{'path'});
                if (!defined $head) {
                        next;
                }
                # point the global $git_dir at this project before
                # looking up its head commit
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                if (!%co) {
                        next;
                }

                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}