gitweb / gitweb.perlon commit bash: simple reimplementation of _get_comp_words_by_ref (dbda3b1)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use strict;
  11use warnings;
  12use CGI qw(:standard :escapeHTML -nosticky);
  13use CGI::Util qw(unescape);
  14use CGI::Carp qw(fatalsToBrowser set_message);
  15use Encode;
  16use Fcntl ':mode';
  17use File::Find qw();
  18use File::Basename qw(basename);
  19binmode STDOUT, ':utf8';
  20
  21our $t0;
  22if (eval { require Time::HiRes; 1; }) {
  23        $t0 = [Time::HiRes::gettimeofday()];
  24}
  25our $number_of_git_cmds = 0;
  26
  27BEGIN {
  28        CGI->compile() if $ENV{'MOD_PERL'};
  29}
  30
  31our $version = "++GIT_VERSION++";
  32
  33our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  34sub evaluate_uri {
  35        our $cgi;
  36
  37        our $my_url = $cgi->url();
  38        our $my_uri = $cgi->url(-absolute => 1);
  39
  40        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  41        # needed and used only for URLs with nonempty PATH_INFO
  42        our $base_url = $my_url;
  43
  44        # When the script is used as DirectoryIndex, the URL does not contain the name
  45        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  46        # have to do it ourselves. We make $path_info global because it's also used
  47        # later on.
  48        #
  49        # Another issue with the script being the DirectoryIndex is that the resulting
  50        # $my_url data is not the full script URL: this is good, because we want
  51        # generated links to keep implying the script name if it wasn't explicitly
  52        # indicated in the URL we're handling, but it means that $my_url cannot be used
  53        # as base URL.
  54        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  55        # to build the base URL ourselves:
  56        our $path_info = $ENV{"PATH_INFO"};
  57        if ($path_info) {
  58                if ($my_url =~ s,\Q$path_info\E$,, &&
  59                    $my_uri =~ s,\Q$path_info\E$,, &&
  60                    defined $ENV{'SCRIPT_NAME'}) {
  61                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  62                }
  63        }
  64
  65        # target of the home link on top of all pages
  66        our $home_link = $my_uri || "/";
  67}
  68
  69# core git executable to use
  70# this can just be "git" if your webserver has a sensible PATH
  71our $GIT = "++GIT_BINDIR++/git";
  72
  73# absolute fs-path which will be prepended to the project path
  74#our $projectroot = "/pub/scm";
  75our $projectroot = "++GITWEB_PROJECTROOT++";
  76
  77# fs traversing limit for getting project list
  78# the number is relative to the projectroot
  79our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
  80
  81# string of the home link on top of all pages
  82our $home_link_str = "++GITWEB_HOME_LINK_STR++";
  83
  84# name of your site or organization to appear in page titles
  85# replace this with something more descriptive for clearer bookmarks
  86our $site_name = "++GITWEB_SITENAME++"
  87                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
  88
  89# filename of html text to include at top of each page
  90our $site_header = "++GITWEB_SITE_HEADER++";
  91# html text to include at home page
  92our $home_text = "++GITWEB_HOMETEXT++";
  93# filename of html text to include at bottom of each page
  94our $site_footer = "++GITWEB_SITE_FOOTER++";
  95
  96# URI of stylesheets
  97our @stylesheets = ("++GITWEB_CSS++");
  98# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
  99our $stylesheet = undef;
 100# URI of GIT logo (72x27 size)
 101our $logo = "++GITWEB_LOGO++";
 102# URI of GIT favicon, assumed to be image/png type
 103our $favicon = "++GITWEB_FAVICON++";
 104# URI of gitweb.js (JavaScript code for gitweb)
 105our $javascript = "++GITWEB_JS++";
 106
 107# URI and label (title) of GIT logo link
 108#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
 109#our $logo_label = "git documentation";
 110our $logo_url = "http://git-scm.com/";
 111our $logo_label = "git homepage";
 112
 113# source of projects list
 114our $projects_list = "++GITWEB_LIST++";
 115
 116# the width (in characters) of the projects list "Description" column
 117our $projects_list_description_width = 25;
 118
 119# default order of projects list
 120# valid values are none, project, descr, owner, and age
 121our $default_projects_order = "project";
 122
 123# show repository only if this file exists
 124# (only effective if this variable evaluates to true)
 125our $export_ok = "++GITWEB_EXPORT_OK++";
 126
 127# show repository only if this subroutine returns true
 128# when given the path to the project, for example:
 129#    sub { return -e "$_[0]/git-daemon-export-ok"; }
 130our $export_auth_hook = undef;
 131
 132# only allow viewing of repositories also shown on the overview page
 133our $strict_export = "++GITWEB_STRICT_EXPORT++";
 134
 135# list of git base URLs used for URL to where fetch project from,
 136# i.e. full URL is "$git_base_url/$project"
 137our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
 138
 139# default blob_plain mimetype and default charset for text/plain blob
 140our $default_blob_plain_mimetype = 'text/plain';
 141our $default_text_plain_charset  = undef;
 142
 143# file to use for guessing MIME types before trying /etc/mime.types
 144# (relative to the current git repository)
 145our $mimetypes_file = undef;
 146
 147# assume this charset if line contains non-UTF-8 characters;
 148# it should be valid encoding (see Encoding::Supported(3pm) for list),
 149# for which encoding all byte sequences are valid, for example
 150# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
 151# could be even 'utf-8' for the old behavior)
 152our $fallback_encoding = 'latin1';
 153
 154# rename detection options for git-diff and git-diff-tree
 155# - default is '-M', with the cost proportional to
 156#   (number of removed files) * (number of new files).
 157# - more costly is '-C' (which implies '-M'), with the cost proportional to
 158#   (number of changed files + number of removed files) * (number of new files)
 159# - even more costly is '-C', '--find-copies-harder' with cost
 160#   (number of files in the original tree) * (number of new files)
 161# - one might want to include '-B' option, e.g. '-B', '-M'
 162our @diff_opts = ('-M'); # taken from git_commit
 163
 164# Disables features that would allow repository owners to inject script into
 165# the gitweb domain.
 166our $prevent_xss = 0;
 167
 168# information about snapshot formats that gitweb is capable of serving
 169our %known_snapshot_formats = (
 170        # name => {
 171        #       'display' => display name,
 172        #       'type' => mime type,
 173        #       'suffix' => filename suffix,
 174        #       'format' => --format for git-archive,
 175        #       'compressor' => [compressor command and arguments]
 176        #                       (array reference, optional)
 177        #       'disabled' => boolean (optional)}
 178        #
 179        'tgz' => {
 180                'display' => 'tar.gz',
 181                'type' => 'application/x-gzip',
 182                'suffix' => '.tar.gz',
 183                'format' => 'tar',
 184                'compressor' => ['gzip']},
 185
 186        'tbz2' => {
 187                'display' => 'tar.bz2',
 188                'type' => 'application/x-bzip2',
 189                'suffix' => '.tar.bz2',
 190                'format' => 'tar',
 191                'compressor' => ['bzip2']},
 192
 193        'txz' => {
 194                'display' => 'tar.xz',
 195                'type' => 'application/x-xz',
 196                'suffix' => '.tar.xz',
 197                'format' => 'tar',
 198                'compressor' => ['xz'],
 199                'disabled' => 1},
 200
 201        'zip' => {
 202                'display' => 'zip',
 203                'type' => 'application/x-zip',
 204                'suffix' => '.zip',
 205                'format' => 'zip'},
 206);
 207
 208# Aliases so we understand old gitweb.snapshot values in repository
 209# configuration.
 210our %known_snapshot_format_aliases = (
 211        'gzip'  => 'tgz',
 212        'bzip2' => 'tbz2',
 213        'xz'    => 'txz',
 214
 215        # backward compatibility: legacy gitweb config support
 216        'x-gzip' => undef, 'gz' => undef,
 217        'x-bzip2' => undef, 'bz2' => undef,
 218        'x-zip' => undef, '' => undef,
 219);
 220
 221# Pixel sizes for icons and avatars. If the default font sizes or lineheights
 222# are changed, it may be appropriate to change these values too via
 223# $GITWEB_CONFIG.
 224our %avatar_size = (
 225        'default' => 16,
 226        'double'  => 32
 227);
 228
 229# Used to set the maximum load that we will still respond to gitweb queries.
 230# If server load exceed this value then return "503 server busy" error.
 231# If gitweb cannot determined server load, it is taken to be 0.
 232# Leave it undefined (or set to 'undef') to turn off load checking.
 233our $maxload = 300;
 234
 235# You define site-wide feature defaults here; override them with
 236# $GITWEB_CONFIG as necessary.
 237our %feature = (
 238        # feature => {
 239        #       'sub' => feature-sub (subroutine),
 240        #       'override' => allow-override (boolean),
 241        #       'default' => [ default options...] (array reference)}
 242        #
 243        # if feature is overridable (it means that allow-override has true value),
 244        # then feature-sub will be called with default options as parameters;
 245        # return value of feature-sub indicates if to enable specified feature
 246        #
 247        # if there is no 'sub' key (no feature-sub), then feature cannot be
 248        # overridden
 249        #
 250        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
 251        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
 252        # is enabled
 253
 254        # Enable the 'blame' blob view, showing the last commit that modified
 255        # each line in the file. This can be very CPU-intensive.
 256
 257        # To enable system wide have in $GITWEB_CONFIG
 258        # $feature{'blame'}{'default'} = [1];
 259        # To have project specific config enable override in $GITWEB_CONFIG
 260        # $feature{'blame'}{'override'} = 1;
 261        # and in project config gitweb.blame = 0|1;
 262        'blame' => {
 263                'sub' => sub { feature_bool('blame', @_) },
 264                'override' => 0,
 265                'default' => [0]},
 266
 267        # Enable the 'snapshot' link, providing a compressed archive of any
 268        # tree. This can potentially generate high traffic if you have large
 269        # project.
 270
 271        # Value is a list of formats defined in %known_snapshot_formats that
 272        # you wish to offer.
 273        # To disable system wide have in $GITWEB_CONFIG
 274        # $feature{'snapshot'}{'default'} = [];
 275        # To have project specific config enable override in $GITWEB_CONFIG
 276        # $feature{'snapshot'}{'override'} = 1;
 277        # and in project config, a comma-separated list of formats or "none"
 278        # to disable.  Example: gitweb.snapshot = tbz2,zip;
 279        'snapshot' => {
 280                'sub' => \&feature_snapshot,
 281                'override' => 0,
 282                'default' => ['tgz']},
 283
 284        # Enable text search, which will list the commits which match author,
 285        # committer or commit text to a given string.  Enabled by default.
 286        # Project specific override is not supported.
 287        'search' => {
 288                'override' => 0,
 289                'default' => [1]},
 290
 291        # Enable grep search, which will list the files in currently selected
 292        # tree containing the given string. Enabled by default. This can be
 293        # potentially CPU-intensive, of course.
 294
 295        # To enable system wide have in $GITWEB_CONFIG
 296        # $feature{'grep'}{'default'} = [1];
 297        # To have project specific config enable override in $GITWEB_CONFIG
 298        # $feature{'grep'}{'override'} = 1;
 299        # and in project config gitweb.grep = 0|1;
 300        'grep' => {
 301                'sub' => sub { feature_bool('grep', @_) },
 302                'override' => 0,
 303                'default' => [1]},
 304
 305        # Enable the pickaxe search, which will list the commits that modified
 306        # a given string in a file. This can be practical and quite faster
 307        # alternative to 'blame', but still potentially CPU-intensive.
 308
 309        # To enable system wide have in $GITWEB_CONFIG
 310        # $feature{'pickaxe'}{'default'} = [1];
 311        # To have project specific config enable override in $GITWEB_CONFIG
 312        # $feature{'pickaxe'}{'override'} = 1;
 313        # and in project config gitweb.pickaxe = 0|1;
 314        'pickaxe' => {
 315                'sub' => sub { feature_bool('pickaxe', @_) },
 316                'override' => 0,
 317                'default' => [1]},
 318
 319        # Enable showing size of blobs in a 'tree' view, in a separate
 320        # column, similar to what 'ls -l' does.  This cost a bit of IO.
 321
 322        # To disable system wide have in $GITWEB_CONFIG
 323        # $feature{'show-sizes'}{'default'} = [0];
 324        # To have project specific config enable override in $GITWEB_CONFIG
 325        # $feature{'show-sizes'}{'override'} = 1;
 326        # and in project config gitweb.showsizes = 0|1;
 327        'show-sizes' => {
 328                'sub' => sub { feature_bool('showsizes', @_) },
 329                'override' => 0,
 330                'default' => [1]},
 331
 332        # Make gitweb use an alternative format of the URLs which can be
 333        # more readable and natural-looking: project name is embedded
 334        # directly in the path and the query string contains other
 335        # auxiliary information. All gitweb installations recognize
 336        # URL in either format; this configures in which formats gitweb
 337        # generates links.
 338
 339        # To enable system wide have in $GITWEB_CONFIG
 340        # $feature{'pathinfo'}{'default'} = [1];
 341        # Project specific override is not supported.
 342
 343        # Note that you will need to change the default location of CSS,
 344        # favicon, logo and possibly other files to an absolute URL. Also,
 345        # if gitweb.cgi serves as your indexfile, you will need to force
 346        # $my_uri to contain the script name in your $GITWEB_CONFIG.
 347        'pathinfo' => {
 348                'override' => 0,
 349                'default' => [0]},
 350
 351        # Make gitweb consider projects in project root subdirectories
 352        # to be forks of existing projects. Given project $projname.git,
 353        # projects matching $projname/*.git will not be shown in the main
 354        # projects list, instead a '+' mark will be added to $projname
 355        # there and a 'forks' view will be enabled for the project, listing
 356        # all the forks. If project list is taken from a file, forks have
 357        # to be listed after the main project.
 358
 359        # To enable system wide have in $GITWEB_CONFIG
 360        # $feature{'forks'}{'default'} = [1];
 361        # Project specific override is not supported.
 362        'forks' => {
 363                'override' => 0,
 364                'default' => [0]},
 365
 366        # Insert custom links to the action bar of all project pages.
 367        # This enables you mainly to link to third-party scripts integrating
 368        # into gitweb; e.g. git-browser for graphical history representation
 369        # or custom web-based repository administration interface.
 370
 371        # The 'default' value consists of a list of triplets in the form
 372        # (label, link, position) where position is the label after which
 373        # to insert the link and link is a format string where %n expands
 374        # to the project name, %f to the project path within the filesystem,
 375        # %h to the current hash (h gitweb parameter) and %b to the current
 376        # hash base (hb gitweb parameter); %% expands to %.
 377
 378        # To enable system wide have in $GITWEB_CONFIG e.g.
 379        # $feature{'actions'}{'default'} = [('graphiclog',
 380        #       '/git-browser/by-commit.html?r=%n', 'summary')];
 381        # Project specific override is not supported.
 382        'actions' => {
 383                'override' => 0,
 384                'default' => []},
 385
 386        # Allow gitweb scan project content tags described in ctags/
 387        # of project repository, and display the popular Web 2.0-ish
 388        # "tag cloud" near the project list. Note that this is something
 389        # COMPLETELY different from the normal Git tags.
 390
 391        # gitweb by itself can show existing tags, but it does not handle
 392        # tagging itself; you need an external application for that.
 393        # For an example script, check Girocco's cgi/tagproj.cgi.
 394        # You may want to install the HTML::TagCloud Perl module to get
 395        # a pretty tag cloud instead of just a list of tags.
 396
 397        # To enable system wide have in $GITWEB_CONFIG
 398        # $feature{'ctags'}{'default'} = ['path_to_tag_script'];
 399        # Project specific override is not supported.
 400        'ctags' => {
 401                'override' => 0,
 402                'default' => [0]},
 403
 404        # The maximum number of patches in a patchset generated in patch
 405        # view. Set this to 0 or undef to disable patch view, or to a
 406        # negative number to remove any limit.
 407
 408        # To disable system wide have in $GITWEB_CONFIG
 409        # $feature{'patches'}{'default'} = [0];
 410        # To have project specific config enable override in $GITWEB_CONFIG
 411        # $feature{'patches'}{'override'} = 1;
 412        # and in project config gitweb.patches = 0|n;
 413        # where n is the maximum number of patches allowed in a patchset.
 414        'patches' => {
 415                'sub' => \&feature_patches,
 416                'override' => 0,
 417                'default' => [16]},
 418
 419        # Avatar support. When this feature is enabled, views such as
 420        # shortlog or commit will display an avatar associated with
 421        # the email of the committer(s) and/or author(s).
 422
 423        # Currently available providers are gravatar and picon.
 424        # If an unknown provider is specified, the feature is disabled.
 425
 426        # Gravatar depends on Digest::MD5.
 427        # Picon currently relies on the indiana.edu database.
 428
 429        # To enable system wide have in $GITWEB_CONFIG
 430        # $feature{'avatar'}{'default'} = ['<provider>'];
 431        # where <provider> is either gravatar or picon.
 432        # To have project specific config enable override in $GITWEB_CONFIG
 433        # $feature{'avatar'}{'override'} = 1;
 434        # and in project config gitweb.avatar = <provider>;
 435        'avatar' => {
 436                'sub' => \&feature_avatar,
 437                'override' => 0,
 438                'default' => ['']},
 439
 440        # Enable displaying how much time and how many git commands
 441        # it took to generate and display page.  Disabled by default.
 442        # Project specific override is not supported.
 443        'timed' => {
 444                'override' => 0,
 445                'default' => [0]},
 446
 447        # Enable turning some links into links to actions which require
 448        # JavaScript to run (like 'blame_incremental').  Not enabled by
 449        # default.  Project specific override is currently not supported.
 450        'javascript-actions' => {
 451                'override' => 0,
 452                'default' => [0]},
 453
 454        # Syntax highlighting support. This is based on Daniel Svensson's
 455        # and Sham Chukoury's work in gitweb-xmms2.git.
 456        # It requires the 'highlight' program present in $PATH,
 457        # and therefore is disabled by default.
 458
 459        # To enable system wide have in $GITWEB_CONFIG
 460        # $feature{'highlight'}{'default'} = [1];
 461
 462        'highlight' => {
 463                'sub' => sub { feature_bool('highlight', @_) },
 464                'override' => 0,
 465                'default' => [0]},
 466);
 467
 468sub gitweb_get_feature {
 469        my ($name) = @_;
 470        return unless exists $feature{$name};
 471        my ($sub, $override, @defaults) = (
 472                $feature{$name}{'sub'},
 473                $feature{$name}{'override'},
 474                @{$feature{$name}{'default'}});
 475        # project specific override is possible only if we have project
 476        our $git_dir; # global variable, declared later
 477        if (!$override || !defined $git_dir) {
 478                return @defaults;
 479        }
 480        if (!defined $sub) {
 481                warn "feature $name is not overridable";
 482                return @defaults;
 483        }
 484        return $sub->(@defaults);
 485}
 486
 487# A wrapper to check if a given feature is enabled.
 488# With this, you can say
 489#
 490#   my $bool_feat = gitweb_check_feature('bool_feat');
 491#   gitweb_check_feature('bool_feat') or somecode;
 492#
 493# instead of
 494#
 495#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 496#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 497#
 498sub gitweb_check_feature {
 499        return (gitweb_get_feature(@_))[0];
 500}
 501
 502
 503sub feature_bool {
 504        my $key = shift;
 505        my ($val) = git_get_project_config($key, '--bool');
 506
 507        if (!defined $val) {
 508                return ($_[0]);
 509        } elsif ($val eq 'true') {
 510                return (1);
 511        } elsif ($val eq 'false') {
 512                return (0);
 513        }
 514}
 515
 516sub feature_snapshot {
 517        my (@fmts) = @_;
 518
 519        my ($val) = git_get_project_config('snapshot');
 520
 521        if ($val) {
 522                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 523        }
 524
 525        return @fmts;
 526}
 527
 528sub feature_patches {
 529        my @val = (git_get_project_config('patches', '--int'));
 530
 531        if (@val) {
 532                return @val;
 533        }
 534
 535        return ($_[0]);
 536}
 537
 538sub feature_avatar {
 539        my @val = (git_get_project_config('avatar'));
 540
 541        return @val ? @val : @_;
 542}
 543
 544# checking HEAD file with -e is fragile if the repository was
 545# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 546# and then pruned.
 547sub check_head_link {
 548        my ($dir) = @_;
 549        my $headfile = "$dir/HEAD";
 550        return ((-e $headfile) ||
 551                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 552}
 553
 554sub check_export_ok {
 555        my ($dir) = @_;
 556        return (check_head_link($dir) &&
 557                (!$export_ok || -e "$dir/$export_ok") &&
 558                (!$export_auth_hook || $export_auth_hook->($dir)));
 559}
 560
 561# process alternate names for backward compatibility
 562# filter out unsupported (unknown) snapshot formats
 563sub filter_snapshot_fmts {
 564        my @fmts = @_;
 565
 566        @fmts = map {
 567                exists $known_snapshot_format_aliases{$_} ?
 568                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 569        @fmts = grep {
 570                exists $known_snapshot_formats{$_} &&
 571                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 572}
 573
 574our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);
 575sub evaluate_gitweb_config {
 576        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 577        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 578        # die if there are errors parsing config file
 579        if (-e $GITWEB_CONFIG) {
 580                do $GITWEB_CONFIG;
 581                die $@ if $@;
 582        } elsif (-e $GITWEB_CONFIG_SYSTEM) {
 583                do $GITWEB_CONFIG_SYSTEM;
 584                die $@ if $@;
 585        }
 586}
 587
 588# Get loadavg of system, to compare against $maxload.
 589# Currently it requires '/proc/loadavg' present to get loadavg;
 590# if it is not present it returns 0, which means no load checking.
 591sub get_loadavg {
 592        if( -e '/proc/loadavg' ){
 593                open my $fd, '<', '/proc/loadavg'
 594                        or return 0;
 595                my @load = split(/\s+/, scalar <$fd>);
 596                close $fd;
 597
 598                # The first three columns measure CPU and IO utilization of the last one,
 599                # five, and 10 minute periods.  The fourth column shows the number of
 600                # currently running processes and the total number of processes in the m/n
 601                # format.  The last column displays the last process ID used.
 602                return $load[0] || 0;
 603        }
 604        # additional checks for load average should go here for things that don't export
 605        # /proc/loadavg
 606
 607        return 0;
 608}
 609
 610# version of the core git binary
 611our $git_version;
 612sub evaluate_git_version {
 613        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 614        $number_of_git_cmds++;
 615}
 616
 617sub check_loadavg {
 618        if (defined $maxload && get_loadavg() > $maxload) {
 619                die_error(503, "The load average on the server is too high");
 620        }
 621}
 622
 623# ======================================================================
 624# input validation and dispatch
 625
 626# input parameters can be collected from a variety of sources (presently, CGI
 627# and PATH_INFO), so we define an %input_params hash that collects them all
 628# together during validation: this allows subsequent uses (e.g. href()) to be
 629# agnostic of the parameter origin
 630
 631our %input_params = ();
 632
 633# input parameters are stored with the long parameter name as key. This will
 634# also be used in the href subroutine to convert parameters to their CGI
 635# equivalent, and since the href() usage is the most frequent one, we store
 636# the name -> CGI key mapping here, instead of the reverse.
 637#
 638# XXX: Warning: If you touch this, check the search form for updating,
 639# too.
 640
 641our @cgi_param_mapping = (
 642        project => "p",
 643        action => "a",
 644        file_name => "f",
 645        file_parent => "fp",
 646        hash => "h",
 647        hash_parent => "hp",
 648        hash_base => "hb",
 649        hash_parent_base => "hpb",
 650        page => "pg",
 651        order => "o",
 652        searchtext => "s",
 653        searchtype => "st",
 654        snapshot_format => "sf",
 655        extra_options => "opt",
 656        search_use_regexp => "sr",
 657        # this must be last entry (for manipulation from JavaScript)
 658        javascript => "js"
 659);
 660our %cgi_param_mapping = @cgi_param_mapping;
 661
 662# we will also need to know the possible actions, for validation
 663our %actions = (
 664        "blame" => \&git_blame,
 665        "blame_incremental" => \&git_blame_incremental,
 666        "blame_data" => \&git_blame_data,
 667        "blobdiff" => \&git_blobdiff,
 668        "blobdiff_plain" => \&git_blobdiff_plain,
 669        "blob" => \&git_blob,
 670        "blob_plain" => \&git_blob_plain,
 671        "commitdiff" => \&git_commitdiff,
 672        "commitdiff_plain" => \&git_commitdiff_plain,
 673        "commit" => \&git_commit,
 674        "forks" => \&git_forks,
 675        "heads" => \&git_heads,
 676        "history" => \&git_history,
 677        "log" => \&git_log,
 678        "patch" => \&git_patch,
 679        "patches" => \&git_patches,
 680        "rss" => \&git_rss,
 681        "atom" => \&git_atom,
 682        "search" => \&git_search,
 683        "search_help" => \&git_search_help,
 684        "shortlog" => \&git_shortlog,
 685        "summary" => \&git_summary,
 686        "tag" => \&git_tag,
 687        "tags" => \&git_tags,
 688        "tree" => \&git_tree,
 689        "snapshot" => \&git_snapshot,
 690        "object" => \&git_object,
 691        # those below don't need $project
 692        "opml" => \&git_opml,
 693        "project_list" => \&git_project_list,
 694        "project_index" => \&git_project_index,
 695);
 696
 697# finally, we have the hash of allowed extra_options for the commands that
 698# allow them
 699our %allowed_options = (
 700        "--no-merges" => [ qw(rss atom log shortlog history) ],
 701);
 702
 703# fill %input_params with the CGI parameters. All values except for 'opt'
 704# should be single values, but opt can be an array. We should probably
 705# build an array of parameters that can be multi-valued, but since for the time
 706# being it's only this one, we just single it out
 707sub evaluate_query_params {
 708        our $cgi;
 709
 710        while (my ($name, $symbol) = each %cgi_param_mapping) {
 711                if ($symbol eq 'opt') {
 712                        $input_params{$name} = [ $cgi->param($symbol) ];
 713                } else {
 714                        $input_params{$name} = $cgi->param($symbol);
 715                }
 716        }
 717}
 718
 719# now read PATH_INFO and update the parameter list for missing parameters
 720sub evaluate_path_info {
 721        return if defined $input_params{'project'};
 722        return if !$path_info;
 723        $path_info =~ s,^/+,,;
 724        return if !$path_info;
 725
 726        # find which part of PATH_INFO is project
 727        my $project = $path_info;
 728        $project =~ s,/+$,,;
 729        while ($project && !check_head_link("$projectroot/$project")) {
 730                $project =~ s,/*[^/]*$,,;
 731        }
 732        return unless $project;
 733        $input_params{'project'} = $project;
 734
 735        # do not change any parameters if an action is given using the query string
 736        return if $input_params{'action'};
 737        $path_info =~ s,^\Q$project\E/*,,;
 738
 739        # next, check if we have an action
 740        my $action = $path_info;
 741        $action =~ s,/.*$,,;
 742        if (exists $actions{$action}) {
 743                $path_info =~ s,^$action/*,,;
 744                $input_params{'action'} = $action;
 745        }
 746
 747        # list of actions that want hash_base instead of hash, but can have no
 748        # pathname (f) parameter
 749        my @wants_base = (
 750                'tree',
 751                'history',
 752        );
 753
 754        # we want to catch
 755        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 756        my ($parentrefname, $parentpathname, $refname, $pathname) =
 757                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?(.+?)(?::(.+))?$/);
 758
 759        # first, analyze the 'current' part
 760        if (defined $pathname) {
 761                # we got "branch:filename" or "branch:dir/"
 762                # we could use git_get_type(branch:pathname), but:
 763                # - it needs $git_dir
 764                # - it does a git() call
 765                # - the convention of terminating directories with a slash
 766                #   makes it superfluous
 767                # - embedding the action in the PATH_INFO would make it even
 768                #   more superfluous
 769                $pathname =~ s,^/+,,;
 770                if (!$pathname || substr($pathname, -1) eq "/") {
 771                        $input_params{'action'} ||= "tree";
 772                        $pathname =~ s,/$,,;
 773                } else {
 774                        # the default action depends on whether we had parent info
 775                        # or not
 776                        if ($parentrefname) {
 777                                $input_params{'action'} ||= "blobdiff_plain";
 778                        } else {
 779                                $input_params{'action'} ||= "blob_plain";
 780                        }
 781                }
 782                $input_params{'hash_base'} ||= $refname;
 783                $input_params{'file_name'} ||= $pathname;
 784        } elsif (defined $refname) {
 785                # we got "branch". In this case we have to choose if we have to
 786                # set hash or hash_base.
 787                #
 788                # Most of the actions without a pathname only want hash to be
 789                # set, except for the ones specified in @wants_base that want
 790                # hash_base instead. It should also be noted that hand-crafted
 791                # links having 'history' as an action and no pathname or hash
 792                # set will fail, but that happens regardless of PATH_INFO.
 793                $input_params{'action'} ||= "shortlog";
 794                if (grep { $_ eq $input_params{'action'} } @wants_base) {
 795                        $input_params{'hash_base'} ||= $refname;
 796                } else {
 797                        $input_params{'hash'} ||= $refname;
 798                }
 799        }
 800
 801        # next, handle the 'parent' part, if present
 802        if (defined $parentrefname) {
 803                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 804                # someproject/blobdiff/oldrev..newrev:/filename
 805                if ($parentpathname) {
 806                        $parentpathname =~ s,^/+,,;
 807                        $parentpathname =~ s,/$,,;
 808                        $input_params{'file_parent'} ||= $parentpathname;
 809                } else {
 810                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 811                }
 812                # we assume that hash_parent_base is wanted if a path was specified,
 813                # or if the action wants hash_base instead of hash
 814                if (defined $input_params{'file_parent'} ||
 815                        grep { $_ eq $input_params{'action'} } @wants_base) {
 816                        $input_params{'hash_parent_base'} ||= $parentrefname;
 817                } else {
 818                        $input_params{'hash_parent'} ||= $parentrefname;
 819                }
 820        }
 821
 822        # for the snapshot action, we allow URLs in the form
 823        # $project/snapshot/$hash.ext
 824        # where .ext determines the snapshot and gets removed from the
 825        # passed $refname to provide the $hash.
 826        #
 827        # To be able to tell that $refname includes the format extension, we
 828        # require the following two conditions to be satisfied:
 829        # - the hash input parameter MUST have been set from the $refname part
 830        #   of the URL (i.e. they must be equal)
 831        # - the snapshot format MUST NOT have been defined already (e.g. from
 832        #   CGI parameter sf)
 833        # It's also useless to try any matching unless $refname has a dot,
 834        # so we check for that too
 835        if (defined $input_params{'action'} &&
 836                $input_params{'action'} eq 'snapshot' &&
 837                defined $refname && index($refname, '.') != -1 &&
 838                $refname eq $input_params{'hash'} &&
 839                !defined $input_params{'snapshot_format'}) {
 840                # We loop over the known snapshot formats, checking for
 841                # extensions. Allowed extensions are both the defined suffix
 842                # (which includes the initial dot already) and the snapshot
 843                # format key itself, with a prepended dot
 844                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 845                        my $hash = $refname;
 846                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 847                                next;
 848                        }
 849                        my $sfx = $1;
 850                        # a valid suffix was found, so set the snapshot format
 851                        # and reset the hash parameter
 852                        $input_params{'snapshot_format'} = $fmt;
 853                        $input_params{'hash'} = $hash;
 854                        # we also set the format suffix to the one requested
 855                        # in the URL: this way a request for e.g. .tgz returns
 856                        # a .tgz instead of a .tar.gz
 857                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 858                        last;
 859                }
 860        }
 861}
 862
 863our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 864     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 865     $searchtext, $search_regexp);
 866sub evaluate_and_validate_params {
 867        our $action = $input_params{'action'};
 868        if (defined $action) {
 869                if (!validate_action($action)) {
 870                        die_error(400, "Invalid action parameter");
 871                }
 872        }
 873
 874        # parameters which are pathnames
 875        our $project = $input_params{'project'};
 876        if (defined $project) {
 877                if (!validate_project($project)) {
 878                        undef $project;
 879                        die_error(404, "No such project");
 880                }
 881        }
 882
 883        our $file_name = $input_params{'file_name'};
 884        if (defined $file_name) {
 885                if (!validate_pathname($file_name)) {
 886                        die_error(400, "Invalid file parameter");
 887                }
 888        }
 889
 890        our $file_parent = $input_params{'file_parent'};
 891        if (defined $file_parent) {
 892                if (!validate_pathname($file_parent)) {
 893                        die_error(400, "Invalid file parent parameter");
 894                }
 895        }
 896
 897        # parameters which are refnames
 898        our $hash = $input_params{'hash'};
 899        if (defined $hash) {
 900                if (!validate_refname($hash)) {
 901                        die_error(400, "Invalid hash parameter");
 902                }
 903        }
 904
 905        our $hash_parent = $input_params{'hash_parent'};
 906        if (defined $hash_parent) {
 907                if (!validate_refname($hash_parent)) {
 908                        die_error(400, "Invalid hash parent parameter");
 909                }
 910        }
 911
 912        our $hash_base = $input_params{'hash_base'};
 913        if (defined $hash_base) {
 914                if (!validate_refname($hash_base)) {
 915                        die_error(400, "Invalid hash base parameter");
 916                }
 917        }
 918
 919        our @extra_options = @{$input_params{'extra_options'}};
 920        # @extra_options is always defined, since it can only be (currently) set from
 921        # CGI, and $cgi->param() returns the empty array in array context if the param
 922        # is not set
 923        foreach my $opt (@extra_options) {
 924                if (not exists $allowed_options{$opt}) {
 925                        die_error(400, "Invalid option parameter");
 926                }
 927                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
 928                        die_error(400, "Invalid option parameter for this action");
 929                }
 930        }
 931
 932        our $hash_parent_base = $input_params{'hash_parent_base'};
 933        if (defined $hash_parent_base) {
 934                if (!validate_refname($hash_parent_base)) {
 935                        die_error(400, "Invalid hash parent base parameter");
 936                }
 937        }
 938
 939        # other parameters
 940        our $page = $input_params{'page'};
 941        if (defined $page) {
 942                if ($page =~ m/[^0-9]/) {
 943                        die_error(400, "Invalid page parameter");
 944                }
 945        }
 946
 947        our $searchtype = $input_params{'searchtype'};
 948        if (defined $searchtype) {
 949                if ($searchtype =~ m/[^a-z]/) {
 950                        die_error(400, "Invalid searchtype parameter");
 951                }
 952        }
 953
 954        our $search_use_regexp = $input_params{'search_use_regexp'};
 955
 956        our $searchtext = $input_params{'searchtext'};
 957        our $search_regexp;
 958        if (defined $searchtext) {
 959                if (length($searchtext) < 2) {
 960                        die_error(403, "At least two characters are required for search parameter");
 961                }
 962                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
 963        }
 964}
 965
 966# path to the current git repository
 967our $git_dir;
 968sub evaluate_git_dir {
 969        our $git_dir = "$projectroot/$project" if $project;
 970}
 971
 972our (@snapshot_fmts, $git_avatar);
 973sub configure_gitweb_features {
 974        # list of supported snapshot formats
 975        our @snapshot_fmts = gitweb_get_feature('snapshot');
 976        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);
 977
 978        # check that the avatar feature is set to a known provider name,
 979        # and for each provider check if the dependencies are satisfied.
 980        # if the provider name is invalid or the dependencies are not met,
 981        # reset $git_avatar to the empty string.
 982        our ($git_avatar) = gitweb_get_feature('avatar');
 983        if ($git_avatar eq 'gravatar') {
 984                $git_avatar = '' unless (eval { require Digest::MD5; 1; });
 985        } elsif ($git_avatar eq 'picon') {
 986                # no dependencies
 987        } else {
 988                $git_avatar = '';
 989        }
 990}
 991
 992# custom error handler: 'die <message>' is Internal Server Error
 993sub handle_errors_html {
 994        my $msg = shift; # it is already HTML escaped
 995
 996        # to avoid infinite loop where error occurs in die_error,
 997        # change handler to default handler, disabling handle_errors_html
 998        set_message("Error occured when inside die_error:\n$msg");
 999
1000        # you cannot jump out of die_error when called as error handler;
1001        # the subroutine set via CGI::Carp::set_message is called _after_
1002        # HTTP headers are already written, so it cannot write them itself
1003        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
1004}
1005set_message(\&handle_errors_html);
1006
# Pick the action to run (deriving a default from the other request
# parameters when none was given) and invoke its handler from %actions.
sub dispatch {
        unless (defined $action) {
                # an object was named: use its type as the action; otherwise
                # fall back to the project summary or the project list
                $action =
                        defined $hash
                                ? git_get_type($hash)
                        : (defined $hash_base && defined $file_name)
                                ? git_get_type("$hash_base:$file_name")
                        : defined $project
                                ? 'summary'
                                : 'project_list';
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # only these three actions can run without a project
        die_error(400, "Project needed")
                if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
                    !$project);

        $actions{$action}->();
}
1029
# Restart the per-request statistics: take a fresh start timestamp (only
# when $t0 is already defined, i.e. timing is in use) and zero the counter
# of executed git commands.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [Time::HiRes::gettimeofday()];
        }
        $number_of_git_cmds = 0;
}
1035
# Serve a single request: run every preparation stage in order, then hand
# over to dispatch().
sub run_request {
        # the order matters; later stages rely on what earlier ones set up
        my @preparation = (
                \&reset_timer,

                \&evaluate_uri,
                \&check_loadavg,

                \&evaluate_query_params,
                \&evaluate_path_info,
                \&evaluate_and_validate_params,
                \&evaluate_git_dir,

                \&configure_gitweb_features,
        );
        foreach my $stage (@preparation) {
                $stage->();
        }

        dispatch();
}
1051
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: load CGI::Fast, make it the class used to
# create request objects, and replace $is_last_request with a counter.
sub configure_as_fcgi {
        require CGI::Fast;
        our ($CGI, $is_last_request);

        $CGI = 'CGI::Fast';

        # let each child service 100 requests
        my $served = 0;
        $is_last_request = sub { ++$served > 100 };
}
# Decide how the script is being run: a script name ending in ".fcgi"
# selects FastCGI mode, and command line options (if any) can select
# FastCGI mode and set up an FCGI::ProcManager process pool.
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        @ARGV or return;

        # handler for --nproc: install the process manager hooks, unless
        # FCGI::ProcManager cannot be loaded
        my $setup_proc_manager = sub {
                my ($arg, $val) = @_;
                return unless eval { require FCGI::ProcManager; 1; };
                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $val,
                });
                our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $setup_proc_manager,
        );
}
1086
# Main entry point: evaluate the command line and configuration once, then
# serve requests until $CGI->new() returns false or $is_last_request says
# the request just served was the last one. The optional hooks are called
# before listening and around each request.
sub run {
        evaluate_argv();
        evaluate_gitweb_config();
        evaluate_git_version();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        $pre_listen_hook->()
                if $pre_listen_hook;

 REQUEST:
        while ($cgi = $CGI->new()) {
                $pre_dispatch_hook->()
                        if $pre_dispatch_hook;

                run_request();

                # call the hook that was actually checked for: the post
                # dispatch one (previously the pre dispatch hook was run a
                # second time here and the post hook never ran)
                $post_dispatch_hook->()
                        if $post_dispatch_hook;

                last REQUEST if ($is_last_request->());
        }

        # NOTE(review): nothing in this sub jumps to this label; presumably
        # it is a goto target used elsewhere in the file - confirm before
        # removing it.
 DONE_GITWEB:
        1;
}
1114
run();

# wrapped in a subroutine processing requests,
# e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI
return if defined caller;

# pure CGI script, serving single request
exit;
1125
1126## ======================================================================
1127## action links
1128
# Build a gitweb URL from named parameters (the names used in
# @cgi_param_mapping, e.g. project, action, hash, file_name).
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
#
# 'project' defaults to the current $project unless the key is passed
# explicitly. Parameters that could not be placed in the path part are
# appended as a ';'-separated query string. Returns the URL as a string.
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # inherit every parameter of the current request that the
                # caller did not override
                foreach my $name (keys %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_url($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot;
                # the action may legitimately be missing, so test for that
                # before comparing
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_url($params{'action'}) unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_url($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing ".." would be ambiguous
                                                # in the path form, so it stays a query
                                                # parameter
                                                $href .= ":/".esc_url($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_url($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_url($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_url($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_url($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly, walking the mapping array
        # pairwise so the query string keeps its order
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                # multi-valued parameter: one key=value pair each
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        return $href;
}
1246
1247
1248## ======================================================================
1249## validation, quoting/unquoting and escaping
1250
# Return the given action name if it is a key of %actions, undef otherwise
# (also for a missing or false argument).
sub validate_action {
        my ($input) = @_;
        return undef unless $input;
        return exists $actions{$input} ? $input : undef;
}
1256
# Return the given project path if it may be served, undef otherwise.
# A project passes when its name is a valid pathname, it is a directory
# below $projectroot, check_export_ok() accepts it and, with $strict_export
# set, it also appears in the project list.
sub validate_project {
        my ($input) = @_;
        return undef unless $input;

        return undef unless validate_pathname($input);
        return undef unless -d "$projectroot/$input";
        return undef unless check_export_ok("$projectroot/$input");
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1268
# Return the given pathname if it is acceptable, undef otherwise (also for
# a missing or false argument).
sub validate_pathname {
        my ($input) = @_;
        return undef unless $input;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # also this catches doubled slashes (and a leading or trailing one)
        return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

        # no null characters
        return undef if $input =~ m!\0!;

        return $input;
}
1284
# Return the given ref name if it is acceptable, undef otherwise (also for
# a missing or false argument).
sub validate_refname {
        my ($input) = @_;
        return undef unless $input;

        # textual hashes are O.K.
        return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

        # it must be correct pathname
        my $checked = validate_pathname($input);
        return undef unless $checked;

        # restrictions on ref name according to git-check-ref-format
        return undef
                if $checked =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

        return $checked;
}
1301
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Returns undef for an undefined argument. A string that already carries
# the utf8 flag is returned unchanged, so calling this twice is harmless.
# Octets that are not valid UTF-8 are decoded with $fallback_encoding.
sub to_utf8 {
        my $str = shift;
        return undef unless defined $str;

        # utf8::decode() converts in place and returns false, leaving $str
        # untouched, when the octets are not well-formed UTF-8; that is the
        # only reliable validity test here (utf8::valid() checks the
        # internal consistency of the scalar, not its contents)
        if (utf8::is_utf8($str) || utf8::decode($str)) {
                return $str;
        } else {
                return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
        }
}
1315
# Escape a query parameter value for use in a URL. Unsafe characters are
# percent-encoded, but the slash is kept, even when it's not correct,
# because quoted slashes look too horrible in bookmarks. Spaces become '+'.
# Returns undef for an undefined argument.
sub esc_param {
        my ($str) = @_;
        defined $str or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1325
# Escape unsafe characters in a whole URL; since the URL syntax characters
# themselves must survive, some characters cannot be quoted here. Spaces
# become '+'. Returns undef for an undefined argument.
sub esc_url {
        my ($str) = @_;
        defined $str or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1334
# Escape a string for inclusion in HTML: decode it with to_utf8(),
# HTML-escape it, optionally (-nbsp => 1) turn spaces into &nbsp;, and
# make every control character except the tab visible via quot_cec().
# Returns undef for an undefined argument.
sub esc_html {
        my ($str, %opts) = @_;
        return undef unless defined $str;

        my $html = to_utf8($str);
        $html = $cgi->escapeHTML($html);
        $html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
        return $html;
}
1350
# Escape a filename for inclusion in HTML: decode it with to_utf8(),
# HTML-escape it, optionally (-nbsp => 1) turn spaces into &nbsp;, and
# make every control character (the tab included) visible via quot_cec().
# Returns undef for an undefined argument.
sub esc_path {
        my ($str, %opts) = @_;
        return undef unless defined $str;

        my $html = to_utf8($str);
        $html = $cgi->escapeHTML($html);
        $html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $html =~ s|([[:cntrl:]])|quot_cec($1)|eg;
        return $html;
}
1366
# Make control characters "printable", using character escape codes (CEC).
# Characters without a named escape are shown as a backslash followed by
# their hexadecimal code (space-padded to two columns). The result is
# wrapped in <span class="cntrl"> unless -nohtml => 1 is given.
sub quot_cec {
        my ($cntrl, %opts) = @_;

        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );

        my $chr;
        if (exists $es{$cntrl}) {
                $chr = $es{$cntrl};
        } else {
                $chr = sprintf('\%2x', ord($cntrl));
        }

        return $chr if $opts{-nohtml};
        return "<span class=\"cntrl\">$chr</span>";
}
1391
# Alternative to quot_cec: use the Unicode control pictures codepoints,
# the Unicode "printable representation" (PR), emitted as a decimal
# character reference for 0x2400 plus the character's code. The result is
# wrapped in <span class="cntrl"> unless -nohtml => 1 is given.
sub quot_upr {
        my ($cntrl, %opts) = @_;

        my $chr = sprintf('&#%04d;', 0x2400+ord($cntrl));

        return $chr if $opts{-nohtml};
        return "<span class=\"cntrl\">$chr</span>";
}
1405
# Helper for unquote(): translate the text that followed a backslash into
# the character it stands for. Up to three octal digits give a character
# code, a known letter gives its C escape, anything else stands for itself.
sub unq {
        my ($seq) = @_;
        my %es = ( # character escape codes, aka escape sequences
                't' => "\t",   # tab            (HT, TAB)
                'n' => "\n",   # newline        (NL)
                'r' => "\r",   # return         (CR)
                'f' => "\f",   # form feed      (FF)
                'b' => "\b",   # backspace      (BS)
                'a' => "\a",   # alarm (bell)   (BEL)
                'e' => "\e",   # escape         (ESC)
                'v' => "\013", # vertical tab   (VT)
        );

        # octal char sequence
        return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;
        # C escape sequence, aka character escape code
        return $es{$seq} if exists $es{$seq};
        # quoted ordinary character
        return $seq;
}

# git may return quoted and escaped filenames: a name wrapped in double
# quotes has the quotes removed and its backslash escapes expanded; any
# other string is returned unchanged.
sub unquote {
        my ($str) = @_;

        if ($str =~ m/^"(.*)"$/) {
                # needs unquoting
                $str = $1;
                $str =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        }
        return $str;
}
1441
# escape tabs (convert tabs to spaces): each tab is replaced, left to
# right, by as many spaces as are needed to reach the next multiple of 8
sub untabify {
        my ($line) = @_;

        my $pos;
        while (($pos = index($line, "\t")) != -1) {
                # always between 1 and 8 spaces
                my $width = 8 - ($pos % 8);
                substr($line, $pos, 1, ' ' x $width);
        }

        return $line;
}
1455
# Count the entries of git_get_projects_list() whose 'path' equals the
# given project; the result is false (0) when there is no such entry or
# the list is empty.
sub project_in_list {
        my ($project) = @_;

        my @list = git_get_projects_list();
        return 0 unless @list;

        my @matching = grep { $_->{'path'} eq $project } @list;
        return scalar(@matching);
}
1461
1462## ----------------------------------------------------------------------
1463## HTML aware string manipulation
1464
# Shorten a string to roughly $len characters, trying to chop on a word
# boundary between position $len and $len+$add_len. If there is no word
# boundary there, chop at $len+$add_len. Do not chop if chopped part plus
# ellipsis (marking chopped part) would be longer than given string.
#
# Arguments: string, $len, $add_len (default 10) and where to chop:
# 'left', 'center' or 'right' (the default).
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # return early if chopping wouldn't make string shorter;
        # the filler is 5 characters long in the middle, 4 at either end
        my $centered = ($where eq 'center');
        my $filler   = $centered ? 5 : 4;
        return $str if ($len + $filler >= length($str));

        # when chopping in the middle, distribute $len into left and right part
        $len = int($len/2) if $centered;

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                # keep the end of the string
                $str =~ m/^(.*?)($begre)$/;
                my ($lead, $body) = ($1, $2);
                $lead = " ..." if length($lead) > 4;
                return "$lead$body";
        }

        # both remaining modes keep the beginning of the string
        $str =~ m/^($endre)(.*)$/;
        my ($head, $rest) = ($1, $2);

        if ($centered) {
                # ... and 'center' keeps the end as well
                $rest =~ m/^(.*?)($begre)$/;
                my ($mid, $right) = ($1, $2);
                $mid = " ... " if length($mid) > 5;
                return "$head$mid$right";
        }

        $rest = "... " if length($rest) > 4;
        return "$head$rest";
}
1524
# Accepts exactly the arguments of chop_str and hands them through to it.
# The (possibly shortened) result is HTML-escaped; if chop_str changed the
# string, the escaped text is additionally wrapped in a <span> whose title
# attribute holds the complete string with control characters shown as '?'.
sub chop_and_escape_str {
        my ($full) = @_;

        my $short = chop_str(@_);

        # nothing was cut off, so no tooltip is needed
        return esc_html($short) if $short eq $full;

        (my $title = $full) =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$title}, esc_html($short));
}
1539
1540## ----------------------------------------------------------------------
1541## functions returning short strings
1542
# CSS class for given age value (in seconds):
#   "noage" - age is undefined
#   "age0"  - younger than two hours
#   "age1"  - younger than two days
#   "age2"  - anything older
sub age_class {
        my $age = shift;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1557
# convert age in seconds to "nn units ago" string
#
# The largest unit of which the age spans more than two is used, and the
# count is truncated to a whole number.  Ages of two seconds or less yield
# " right now" (the leading space is part of the returned string).
sub age_string {
        my $age = shift;

        # each row: [ exclusive lower bound in seconds,
        #             divisors applied to the age one after another,
        #             text appended to the truncated quotient ]
        my @scales = (
                [ 60*60*24*365*2,      [60, 60, 24, 365],    " years ago"  ],
                [ 60*60*24*(365/12)*2, [60, 60, 24, 365/12], " months ago" ],
                [ 60*60*24*7*2,        [60, 60, 24, 7],      " weeks ago"  ],
                [ 60*60*24*2,          [60, 60, 24],         " days ago"   ],
                [ 60*60*2,             [60, 60],             " hours ago"  ],
                [ 60*2,                [60],                 " min ago"    ],
                [ 2,                   [],                   " sec ago"    ],
        );

        foreach my $scale (@scales) {
                my ($bound, $divisors, $suffix) = @$scale;
                next unless $age > $bound;

                my $count = $age;
                foreach my $divisor (@$divisors) {
                        $count /= $divisor;
                }
                return int($count) . $suffix;
        }

        return " right now";
}
1589
# additional file type values (octal), used next to the S_IF* constants
# that come from Fcntl
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference:
# true if the file type bits of the numeric $mode equal S_IFGITLINK
sub S_ISGITLINK {
        my $mode = shift;

        my $type_bits = $mode & S_IFMT();
        return $type_bits == S_IFGITLINK;
}
1601
# convert file mode in octal to symbolic file mode string
#
# The argument is a string of octal digits.  Only the object type and, for
# regular files, the owner-executable bit influence the result; a mode of
# any other type gives '----------'.
sub mode_str {
        my $mode = oct shift;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1623
# convert file mode in octal to file type string
#
# An argument that does not consist solely of octal digits is returned
# unchanged; otherwise the result is one of "submodule", "directory",
# "symlink", "file" or "unknown".
sub file_type {
        my $mode = shift;

        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT);
        return "symlink"   if S_ISLNK($mode);
        return "file"      if S_ISREG($mode);
        return "unknown";
}
1646
# convert file mode in octal to file type description string
#
# Works like file_type, except that a regular file with the
# owner-executable bit set is reported as "executable".  An argument that
# is not a string of octal digits is returned unchanged.
sub file_type_long {
        my $mode = shift;

        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT);
        return "symlink"   if S_ISLNK($mode);
        return "unknown"   unless S_ISREG($mode);

        return ($mode & S_IXUSR) ? "executable" : "file";
}
1673
1674
1675## ----------------------------------------------------------------------
1676## functions returning short HTML fragments, or transforming HTML fragments
1677## which don't belong to other sections
1678
# format line of commit message: the line is HTML-escaped (-nbsp variant)
# and every free-standing run of 8 to 40 hex digits is turned into a link
# to the "object" action for that id
sub format_log_line_html {
        my $line = shift;

        my $html = esc_html($line, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                my $id = $1;
                $cgi->a({-href => href(action=>"object", hash=>$id),
                         -class => "text"}, $id);
        }eg;

        return $html;
}
1691
# format marker of refs pointing to given object
#
# Parameters:
#   $refs - hash reference; $refs->{$id} is a reference to the list of ref
#           names pointing to object $id, e.g. "tags/v2.6.11" or
#           "heads/next"; a trailing "^{}" marks an indirect ref
#   $id   - id of the object to produce markers for
# Returns an HTML fragment (one <span> per ref inside a
# <span class="refs">), or the empty string if there is nothing to show.
# The list in $refs is left untouched.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $entry (@{$refs->{$id}}) {
                        # work on a copy: the loop variable aliases the caller's
                        # list, and stripping "^{}" in place would make a later
                        # call for the same id miss that the ref is indirect
                        my $ref = $entry;

                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name);
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        # ref names may contain characters that are special in
                        # HTML, so the link text is escaped ...
                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, esc_html($name));

                        # ... and so are the values put into the attributes
                        $markers .= ' <span class="' .
                                $cgi->escapeHTML(to_utf8($class)) .
                                '" title="' .
                                $cgi->escapeHTML(to_utf8($ref)) . '">' .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1751
# format, perhaps shortened and with markers, title line
#
# Produces a link to $href with class "list subject", followed by $extra
# (if defined).  When $short is shorter than $long, the link shows $short
# and carries $long, with control characters replaced by '?', as its
# title; otherwise it shows $long.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my %attr = (-href => $href, -class => "list subject");
        my $text = $long;

        if (length($short) < length($long)) {
                $long =~ s/[[:cntrl:]]/?/g;
                $attr{-title} = to_utf8($long);
                $text = $short;
        }

        return $cgi->a(\%attr, esc_html($text)) . $extra;
}
1767
# Computing the url for an email is not repeated: the result is cached
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines, which are free to use it as
# preferred. Since only one avatar engine is used for any given page,
# there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lower-cased first; the complete url is what gets cached.
sub picon_url {
        my $email = lc shift;

        return $avatar_cache{$email} if $avatar_cache{$email};

        my ($user, $domain) = split('@', $email);
        my $url =
                "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                "$domain/$user/" .
                "users+domains+unknown/up/single";
        $avatar_cache{$email} = $url;

        return $avatar_cache{$email};
}
1789
# Compute the gravatar url for a given email, if it's not in the cache already.
# Only the part of the url up to and including "?s=" is cached, since the
# MD5 digest in it is the computationally expensive piece; the requested
# size is appended on every call, so one cache entry serves all sizes.
sub gravatar_url {
        my $email = lc shift;
        my $size = shift;

        unless ($avatar_cache{$email}) {
                my $digest = Digest::MD5::md5_hex($email);
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" . $digest . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1802
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
#
# Parameters:
#   $email - e-mail address to show an avatar for
#   %opts  - -size       => key into %avatar_size (falls back to 'default')
#            -pad_before => true to put "&nbsp;" before the image
#            -pad_after  => true to put "&nbsp;" after the image
# Returns the <img> element (with padding) as HTML, or the empty string if
# no avatar provider produced a url.
sub git_get_avatar {
        my ($email, %opts) = @_;
        my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
        my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};
        my $url = "";
        if ($git_avatar eq 'gravatar') {
                $url = gravatar_url($email, $size);
        } elsif ($git_avatar eq 'picon') {
                $url = picon_url($email);
        }
        # Other providers can be added by extending the if chain, defining $url
        # as needed. If no variant puts something in $url, we assume avatars
        # are completely disabled/unavailable.
        if ($url) {
                # a provider may build the url from parts of the e-mail address
                # (picon_url does), so it must not reach the attribute verbatim
                my $src = $cgi->escapeHTML($url);
                return $pre_white .
                       "<img width=\"$size\" " .
                            "class=\"avatar\" " .
                            "src=\"$src\" " .
                            "alt=\"\" " .
                       "/>" . $post_white;
        } else {
                return "";
        }
}
1831
# Wrap $displaytext (already HTML) in a link that searches for commits by
# $author.  $searchtype is passed on to the search action; 'author' and
# 'committer' also select the verb used in the link title.  If the
# 'search' feature is off, $displaytext is returned as it is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        return $displaytext unless gitweb_check_feature('search');

        my $performed =
                $searchtype eq 'author'    ? "authored"  :
                $searchtype eq 'committer' ? "committed" :
                                             "";

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                        searchtext=>$author,
                        searchtype=>$searchtype), class=>"list",
                        title=>"Search for commits $performed by $author"},
                        $displaytext);
}
1854
# format the author name of the given commit with the given tag
#
# $tag is the HTML element name to wrap the result in, $co the commit (a
# hash reference providing 'author_name' and 'author_email'); any further
# arguments are handed to chop_and_escape_str to shorten the name (see
# chop_str).  The avatar and the name together form an author search link.
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name   = $co->{'author_name'};
        my $author = chop_and_escape_str($name, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);

        return "<$tag class=\"author\">" .
               format_search_author($name, "author", $avatar . $author) .
               "</$tag>";
}
1868
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# The file names in $line are dropped and written anew from $from and $to
# (hash references with 'file' and, if a link is wanted, 'href').
# A true $diffinfo->{'nparents'} selects the combined diff layout.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff: only the resulting file is named
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                  esc_path($to->{'file'}))
                        : esc_path($to->{'file'}); # file was deleted (no href)

                return "<div class=\"diff header\">$line</div>\n";
        }

        # "ordinary" diff: "a/<from> b/<to>"
        $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
        $line .= $from->{'href'}
                ? $cgi->a({-href => $from->{'href'}, -class => "path"},
                          'a/' . esc_path($from->{'file'}))
                : 'a/' . esc_path($from->{'file'}); # file was added (no href)
        $line .= ' ';
        $line .= $to->{'href'}
                ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                          'b/' . esc_path($to->{'file'}))
                : 'b/' . esc_path($to->{'file'}); # file was deleted

        return "<div class=\"diff header\">$line</div>\n";
}
1904
# format extended diff header line, before patch itself
#
# Parameters:
#   $line     - one extended header line
#   $diffinfo - hash reference; 'nparents', 'from_id' and 'to_id' are read
#   $from,$to - hash references with 'file' and 'href'; in a combined diff
#               $from->{'href'} and $diffinfo->{'from_id'} are array
#               references with one entry per parent
# Returns the line with paths and object ids turned into links and a note
# on the file type after a trailing mode, followed by "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                       esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                my $last = $diffinfo->{'nparents'} - 1;
                $line = 'index ';
                foreach my $i (0 .. $last) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $last);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff
                # (the two dots are matched literally, not as wildcards)
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                # the ids are data, not patterns: quote them
                $line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
1970
# format from-file/to-file diff header
#
# $from_line and $to_line are the "--- ..." and "+++ ..." lines of a patch.
# An ordinary diff gives one from_file <div>; a combined diff (true
# $diffinfo->{'nparents'}) gives one per parent, each built from
# $from->{'href'}[$i], $from->{'file'}[$i] and $parents[$i] rather than
# from $from_line.  A single to_file <div> follows in both cases.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my $result = '';
        my $line;

        #assert($from_line =~ m/^---/) if DEBUG;
        if ($diffinfo->{'nparents'}) {
                # combined diff (merge commit)
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        if ($from->{'href'}[$i]) {
                                $line = '--- ' .
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1) .
                                        '/' .
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                        } else {
                                $line = '--- /dev/null';
                        }
                        $result .= qq!<div class="diff from_file">$line</div>\n!;
                }
        } else {
                # ordinary (single parent) diff
                $line = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($line =~ m!^--- "?a/!) {
                        $line = $from->{'href'}
                                ? '--- a/' .
                                  $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                          esc_path($from->{'file'}))
                                : '--- a/' .
                                  esc_path($from->{'file'});
                }
                $result .= qq!<div class="diff from_file">$line</div>\n!;
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        $line = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($line =~ m!^\+\+\+ "?b/!) {
                $line = $to->{'href'}
                        ? '+++ b/' .
                          $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                  esc_path($to->{'file'}))
                        : '+++ b/' .
                          esc_path($to->{'file'});
        }
        $result .= qq!<div class="diff to_file">$line</div>\n!;

        return $result;
}
2036
# create note for patch simplified by combined diff
#
# Gives a "diff --cc <file>" header <div> followed by a "Simple merge"
# <div>.  The file name links to its blob unless is_deleted($diffinfo) is
# true.  Arguments after $diffinfo are accepted but not used.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $result = "<div class=\"diff header\">" .
                     "diff --cc ";

        if (is_deleted($diffinfo)) {
                $result .= esc_path($diffinfo->{'to_file'});
        } else {
                $result .= $cgi->a({-href => href(action=>"blob",
                                                  hash_base=>$hash,
                                                  hash=>$diffinfo->{'to_id'},
                                                  file_name=>$diffinfo->{'to_file'}),
                                    -class => "path"},
                                   esc_path($diffinfo->{'to_file'}));
        }

        $result .= "</div>\n" . # class="diff header"
                   "<div class=\"diff nodifferences\">" .
                   "Simple merge" .
                   "</div>\n"; # class="diff nodifferences"

        return $result;
}
2061
# format patch (diff) line (not to be used for diff headers)
#
# Returns the line wrapped in a <div class="diff ...">; the extra class
# (add, rem, chunk_header, incomplete) comes from the leading character(s).
# $from and $to are optional: when both are given, the line ranges of a
# chunk header become links into the respective files.  An array reference
# in $from->{'href'} means the line belongs to a combined diff.
sub format_diff_line {
        my ($line, $from, $to) = @_;
        my $diff_class = "";

        chomp $line;

        if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
                # combined diff: there is one status column per parent
                my $prefix = substr($line, 0, scalar @{$from->{'href'}});
                $diff_class =
                        $line   =~ m/^\@{3}/ ? " chunk_header" :
                        $line   =~ m/^\\/    ? " incomplete"   :
                        $prefix =~ tr/+/+/   ? " add"          :
                        $prefix =~ tr/-/-/   ? " rem"          :
                                               "";
        } else {
                # assume ordinary diff
                my %class_for = (
                        '+'  => " add",
                        '-'  => " rem",
                        '@'  => " chunk_header",
                        "\\" => " incomplete",
                );
                my $char = substr($line, 0, 1);
                $diff_class = $class_for{$char} if exists $class_for{$char};
        }

        $line = untabify($line);

        if ($from && $to && $line =~ m/^\@{2} /) {
                # chunk header of an ordinary diff
                my ($from_text, $from_start, $from_lines, $to_text, $to_start, $to_lines, $section) =
                        $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

                $from_lines = 0 unless defined $from_lines;
                $to_lines   = 0 unless defined $to_lines;

                my $from_html = $from->{'href'}
                        ? $cgi->a({-href=>"$from->{'href'}#l$from_start",
                                   -class=>"list"}, $from_text)
                        : $from_text;
                my $to_html = $to->{'href'}
                        ? $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                   -class=>"list"}, $to_text)
                        : $to_text;

                $line = "<span class=\"chunk_info\">@@ $from_html $to_html @@</span>" .
                        "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
                return "<div class=\"diff$diff_class\">$line</div>\n";
        }

        if ($from && $to && $line =~ m/^\@{3}/) {
                # chunk header of a combined diff
                my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;
                my (@from_start, @from_nlines);

                # each range reads "<sign><start>[,<count>]"; count defaults to 0
                my @from_text = split(' ', $ranges);
                foreach my $i (0 .. $#from_text) {
                        ($from_start[$i], $from_nlines[$i]) =
                                (split(',', substr($from_text[$i], 1)), 0);
                }

                # the last range describes the result, the others the parents
                my $to_text   = pop @from_text;
                my $to_start  = pop @from_start;
                my $to_nlines = pop @from_nlines;

                $line = "<span class=\"chunk_info\">$prefix ";
                foreach my $i (0 .. $#from_text) {
                        $line .= $from->{'href'}[$i]
                                ? $cgi->a({-href=>"$from->{'href'}[$i]#l$from_start[$i]",
                                           -class=>"list"}, $from_text[$i])
                                : $from_text[$i];
                        $line .= " ";
                }
                $line .= $to->{'href'}
                        ? $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                   -class=>"list"}, $to_text)
                        : $to_text;
                $line .= " $prefix</span>" .
                         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
                return "<div class=\"diff$diff_class\">$line</div>\n";
        }

        return "<div class=\"diff$diff_class\">" . esc_html($line, -nbsp=>1) . "</div>\n";
}
2150
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# The formats offered are those listed in @snapshot_fmts.
sub format_snapshot_links {
        my ($hash) = @_;
        my $num_fmts = @snapshot_fmts;

        # $num_fmts == 0: an explicit undef is returned
        return undef unless $num_fmts;

        if ($num_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                # i.e. "_snapshot_"
                my ($fmt) = @snapshot_fmts;
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links;
        foreach my $fmt (@snapshot_fmts) {
                push @links,
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                )
                        }, $known_snapshot_formats{$fmt}{'display'});
        }
        return "snapshot (" . join(' ', @links) . ")";
}
2185
2186## ......................................................................
2187## functions returning values to be passed, perhaps after some
2188## transformation, to other functions; e.g. returning arguments to href()
2189
# returns hash to be passed to href to generate gitweb URL
# in -title key it returns description of link
#
# The optional argument names the feed format (default 'Atom'); its
# lower-cased form becomes the 'action'.  Nothing is returned when no
# project is selected or when the current action is one of tags, heads,
# forks, tag or search.
sub get_feed_info {
        my $format = shift || 'Atom';
        my %res = (action => lc($format));

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use the 'refs/heads/' prefix (full name) to tell them
        # apart from tag links; this also makes it possible to detect
        # branch links ($hash_base is looked at before $hash)
        my $branch;
        foreach my $candidate ($hash_base, $hash) {
                next unless defined $candidate;
                if ($candidate =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type  = "history of $file_name";
                $type .= "/" if ($action eq 'tree');
                $type .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $type = "log of $branch";
        } else {
                $type = 'log';
        }

        $res{-title} = $type;
        $res{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
        $res{'file_name'} = $file_name;

        return %res;
}
2225
2226## ----------------------------------------------------------------------
2227## git utility subroutines, invoking git commands
2228
# returns path to the core git executable and the --git-dir parameter as list
# (every call also bumps the $number_of_git_cmds counter)
sub git_cmd {
        $number_of_git_cmds++;
        return ($GIT, "--git-dir=$git_dir");
}
2234
# quote the given arguments for passing them to the shell
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Each argument is put in single quotes, with every ' and ! moved outside
# the quotes and backslash-escaped; the results are joined by spaces.
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;

        foreach my $arg (@_) {
                (my $word = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$word'";
        }

        return join(' ', @quoted);
}
2243
# get HEAD ref of given project as hash
# (shorthand for git_get_full_hash with 'HEAD' as the ref)
sub git_get_head_hash {
        my $project = shift;
        return git_get_full_hash($project, 'HEAD');
}
2248
# resolve a ref via git_get_hash, handing all arguments over unchanged
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2252
# like git_get_full_hash, but adds the '--short=7' option so that
# git_get_hash passes it on to git rev-parse
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2256
# Run "git rev-parse --verify -q @options $hash" in the repository of
# $project (located at "$projectroot/$project") and return the first line
# of its output without the line ending, or undef if the command could not
# be started or printed nothing.
# $git_dir is pointed at the project for the duration of the call and is
# put back afterwards, provided it had a defined value before.
sub git_get_hash {
        my ($project, $hash, @options) = @_;
        my $saved_git_dir = $git_dir;
        my $result;

        $git_dir = "$projectroot/$project";
        my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @cmd) {
                $result = <$fd>;
                chomp $result if defined $result;
                close $fd;
        }

        $git_dir = $saved_git_dir if defined $saved_git_dir;
        return $result;
}
2273
# Ask "git cat-file -t" for the type of object $hash.
# Returns the type without trailing newline; returns nothing if the
# command cannot be started or close() reports a failure.
sub git_get_type {
        my ($hash) = @_;

        my @cmd = (git_cmd(), "cat-file", '-t', $hash);
        open my $fd, "-|", @cmd
                or return;
        my $type = <$fd>;
        unless (close $fd) {
                return;
        }
        chomp $type;
        return $type;
}
2284
# repository configuration cache:
# $config_file is the path of the config file whose parsed contents are
# currently held in %config (both are maintained by
# git_get_project_config)
our $config_file = q{};
our %config;
2288
# Add $value under $key in the hash referenced by $hash.
# A key seen once holds its value directly; from the second value on the
# slot holds an anonymous array of all values in insertion order.
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                if (ref $hash->{$key}) {
                        # already a list of values: append
                        push @{ $hash->{$key} }, $value;
                } else {
                        # second value: promote the scalar to a list
                        $hash->{$key} = [ $hash->{$key}, $value ];
                }
        } else {
                # first value: stored bare, not as [ <value> ]
                $hash->{$key} = $value;
        }
}
2302
# Return the configuration of the current repository as a hash, read
# from "git config -z -l".
# If $section_regexp is given, only keys of the form "<section>.<rest>"
# whose section matches it are kept (e.g. 'gitweb').
# Keys that occur several times hold an array reference (see
# hash_set_multi); a key without a value maps to undef.
# Returns an empty list if git cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # with -z each entry is terminated by NUL
        local $/ = "\0";

        # Compile the section filter once per call.  (The former /o
        # modifier compiled it once per process, so a later call with a
        # different section would silently have reused the first one.)
        my $section_re = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # with -z key and value are separated by a newline
                my ($key, $value) = split(/\n/, $keyval, 2);

                hash_set_multi(\%config, $key, $value)
                        if (!defined $section_re || $key =~ $section_re);
        }
        close $fh;

        return %config;
}
2325
# Interpret a config value as a boolean.
# True: no value at all, a decimal number other than "0", and the words
# 'true' / 'yes' in any letter case.  Everything else is false; this
# function never reports an error.
sub config_to_bool {
        my ($val) = @_;

        # bare "section.key" without a value
        return 1 unless defined $val;

        # strip leading and trailing whitespace
        for ($val) {
                s/^\s+//;
                s/\s+$//;
        }

        # section.key = 1
        return $val if ($val =~ /^\d+$/ && $val);

        # section.key = true
        return ($val =~ /^(?:true|yes)$/i);
}
2341
# Convert a config value to a plain decimal number.
# A trailing 'k', 'm' or 'g' (any case) multiplies the digits before it
# by 1024, 1048576 or 1073741824; any other value is returned as is
# (after trimming surrounding whitespace).
sub config_to_int {
        my ($val) = @_;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier_for = (
                'k' =>       1024,
                'm' =>    1048576,
                'g' => 1073741824,
        );

        if ($val =~ /^([0-9]*)([kmg])$/i) {
                return $1 * $multiplier_for{lc $2};
        }
        return $val;
}
2361
# Normalize a config value to an array reference: references are passed
# through, a defined scalar becomes a one-element array, undef becomes
# an empty array.
sub config_to_multi {
        my ($val) = @_;

        return $val     if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2368
# Look up "gitweb.$key" in the configuration of the current repository
# ($git_dir).  $key may be given with or without the "gitweb." prefix.
# $type may be 'bool' or 'int' (optionally written '--bool' / '--int');
# any other type is ignored.
# Returns nothing if $git_dir is unset, the key is empty or contains
# non-word characters, or the variable does not exist.  Otherwise
# returns the raw value, the string 'true' / 'false' for 'bool', or the
# result of config_to_int for 'int'.
# The parsed gitweb section is cached in %config and re-read whenever
# $config_file does not name the current repository's config file.
sub git_get_project_config {
        my ($key, $type) = @_;

        defined $git_dir or return;

        # key sanity check
        $key or return;
        $key =~ s/^gitweb\.//;
        $key =~ m/\W/ and return;

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # get config
        my $wanted_file = "$git_dir/config";
        if (!defined $config_file || $config_file ne $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        exists $config{$full_key} or return;

        # ensure given type
        if (defined $type) {
                if ($type eq 'bool') {
                        # backward compatibility: 'git config --bool' returns true/false
                        return config_to_bool($config{$full_key}) ? 'true' : 'false';
                }
                # only 'int' is left after the sanity check above
                return config_to_int($config{$full_key});
        }
        return $config{$full_key};
}
2407
# Get the object name of the entry $path in tree-ish $base, using
# "git ls-tree".  Trailing slashes on $path are ignored.
# If $type is given, the entry must be of that type ('blob', 'tree', ...).
# Returns undef if $path is empty, git reports failure, there is no such
# entry, the output line cannot be parsed, or the type does not match.
# Calls die_error(500, ...) if git cannot be started.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Take the captures from the match itself, so that an unparsable
        # line can never hand back stale $2/$3 from an earlier match.
        my ($entry_type, $entry_hash) =
                $line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/
                or return undef;

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2434
# Get the path of the entry with object name $hash inside tree-ish
# $base, by scanning the output of "git ls-tree -r -t -z".
# Used to get the 'from' filename for combined diff (merge commit) for
# renames.
# Returns the path of the first matching entry; returns undef if there
# is none or git cannot be started, and nothing if an argument is missing.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # with -z the entries are separated by NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # \Q...\E: compare $hash literally, never as a pattern
                if ($line =~ m/(?:[0-9]+) (?:.+) \Q$hash\E\t(.+)$/) {
                        my $path = $1;
                        close $fd;
                        return $path;
                }
        }
        close $fd;
        return undef;
}
2458
2459## ......................................................................
2460## git utility functions, directly accessing git repository
2461
# Return the description of the project at $path (relative to
# $projectroot): the first line of its "description" file without the
# newline, or, when that file cannot be opened, the 'description' config
# variable.  Sets the global $git_dir to the project as a side effect.
sub git_get_project_description {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/description") {
                return git_get_project_config('description');
        }
        my $descr = <$fd>;
        close $fd;
        chomp $descr if defined $descr;
        return $descr;
}
2475
# Read the content tags of the project at $path (relative to
# $projectroot) from the plain files in its "ctags" directory.
# Returns a hash reference mapping each file name to the first line of
# that file (newline removed; undef for an empty file).  The hash is
# empty if the directory cannot be opened; unreadable files are skipped.
# Sets the global $git_dir to the project as a side effect.
sub git_get_project_ctags {
        my $path = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$path";
        opendir my $dh, "$git_dir/ctags"
                or return $ctags;
        foreach my $tagfile (grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh)) {
                open my $ct, '<', $tagfile or next;
                my $val = <$ct>;
                # an empty file yields undef; don't chomp that
                chomp $val if defined $val;
                close $ct;
                (my $ctag = $tagfile) =~ s#.*/##;
                $ctags->{$ctag} = $val;
        }
        closedir $dh;
        return $ctags;
}
2494
# Build a tag cloud from $ctags, a hash reference of tag => count.
# Tags differing only in letter case are merged: their counts are summed
# and the spelling with the highest individual count is kept as display
# name ('topname').
# Returns an HTML::TagCloud object if that module can be loaded,
# otherwise a reference to the merged hash
# (lowercased tag => { count, topcount, topname }).
sub git_populate_project_tagcloud {
        my ($ctags) = @_;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $merged = ($ctags_lc{lc $tag} ||= {});

                $merged->{count} += $weight;
                if (!$merged->{topcount} || $merged->{topcount} < $weight) {
                        $merged->{topcount} = $weight;
                        $merged->{topname}  = $tag;
                }
        }

        my $have_tagcloud = eval { require HTML::TagCloud; 1; };
        return \%ctags_lc unless $have_tagcloud;

        my $cloud = HTML::TagCloud->new;
        foreach my $lc_tag (sort keys %ctags_lc) {
                # Pad the title with spaces so that the cloud looks
                # less crammed.
                my $title = $ctags_lc{$lc_tag}->{topname};
                $title =~ s/ /&nbsp;/g;
                $title =~ s/^/&nbsp;/g;
                $title =~ s/$/&nbsp;/g;
                $cloud->add($title, $home_link."?by_tag=".$lc_tag,
                            $ctags_lc{$lc_tag}->{count});
        }
        return $cloud;
}
2526
# Render the tag cloud produced by git_populate_project_tagcloud as an
# HTML fragment limited to $count tags.
# An HTML::TagCloud object renders itself via html_and_css; the plain
# hash fallback is rendered as a centered, comma-separated list of links
# to "$home_link?by_tag=<tag>", taken from the tags sorted by ascending
# count.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        # (a leftover debugging print of ref($cloud) to STDERR used to
        # be here; it wrote to the error log on every call)
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                my @tags = sort { $cloud->{$a}->{count} <=> $cloud->{$b}->{count} } keys %$cloud;
                return '<p align="center">' . join (', ', map {
                        "<a href=\"$home_link?by_tag=$_\">$cloud->{$_}->{topname}</a>"
                } splice(@tags, 0, $count)) . '</p>';
        }
}
2539
# Return the clone URLs of the project at $path (relative to
# $projectroot): the lines of its "cloneurl" file or, when that file
# cannot be opened, the value(s) of the 'url' config variable.
# Returns a list in list context and an array reference otherwise.
# Sets the global $git_dir to the project as a side effect.
sub git_get_project_url_list {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/cloneurl") {
                my $from_config = config_to_multi(git_get_project_config('url'));
                return wantarray ? @{ $from_config } : $from_config;
        }
        chomp(my @git_project_url_list = <$fd>);
        close $fd;

        return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2553
# Collect the projects that pass check_export_ok, either by scanning
# $projects_list when it is a directory or by reading it as an index
# file (one url-encoded "path owner" pair per line).
# With a non-empty $filter (a trailing ".git" is ignored) only projects
# below "$filter/" are considered.  Without a filter, and with the
# 'forks' feature enabled, index-file entries that lie below an already
# listed project are left out.
# Returns a list of hash references: { path } from a directory scan,
# { path, owner } from an index file.
sub git_get_projects_list {
        my ($filter) = @_;
        my @list;

        $filter ||= '';
        $filter =~ s/\.git$//;

        my $check_forks = gitweb_check_feature('forks');

        # true if $path starts with $parent and continues with "/....git"
        my $is_fork_of = sub {
                my ($path, $parent) = @_;
                my $parent_len = length($parent);
                return 0 if substr($path, 0, $parent_len) ne $parent;
                return 0 if substr($path, $parent_len) !~ /^\/.*\.git$/;
                return 1;
        };

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list . ($filter ? "/$filter" : '');
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);

                my $wanted = sub {
                        # global variables
                        our $project_maxdepth;
                        our $projectroot;
                        # skip project-list toplevel, if we get it.
                        return if (m!^[/.]$!);
                        # only directories can be git repositories
                        return unless (-d $_);
                        # don't traverse too deep (Find is super slow on os x)
                        my $depth = ($File::Find::name =~ tr!/!!) - $pfxdepth;
                        if ($depth > $project_maxdepth) {
                                $File::Find::prune = 1;
                                return;
                        }

                        my $subdir = substr($File::Find::name, $pfxlen + 1);
                        # we check related file in $projectroot
                        my $path = ($filter ? "$filter/" : '') . $subdir;
                        if (check_export_ok("$projectroot/$path")) {
                                push @list, { path => $path };
                                # no need to look inside a repository
                                $File::Find::prune = 1;
                        }
                };

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => $wanted,
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                my %paths; # listed projects, keyed by path without ".git"
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        next PROJECT unless defined $path;

                        if ($filter ne '') {
                                # looking for forks;
                                next PROJECT
                                        unless $is_fork_of->($path, $filter);
                        } elsif ($check_forks) {
                                # is a fork of a listed project, don't
                                # include it in the list
                                next PROJECT
                                        if grep { $is_fork_of->($path, $_) } keys %paths;
                        }

                        next PROJECT
                                unless check_export_ok("$projectroot/$path");

                        push @list, {
                                path => $path,
                                owner => to_utf8($owner),
                        };
                        (my $forks_path = $path) =~ s/\.git$//;
                        $paths{$forks_path}++;
                }
                close $fd;
        }
        return @list;
}
2656
# Cache of project path => owner read from the $projects_list index
# file; undef until git_get_project_list_from_file has run.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list index file.
# Does nothing when the cache is already set.  The cache stays an empty
# hash when $projects_list is not a plain file or cannot be opened.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # an unreadable file just leaves the cache empty instead
                # of reading from an unopened handle
                open(my $fd, '<', $projects_list)
                        or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # blank line: there is no project to record
                        next unless defined $pr;
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
}
2679
# Return the owner of $project (path relative to $projectroot), or undef
# if $project is empty.  Sources are tried in this order: the
# $projects_list index file, the 'owner' config variable, and finally
# get_file_owner on the repository directory.
# Sets the global $git_dir to the project as a side effect.
sub git_get_project_owner {
        my ($project) = @_;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # load the index-file cache on first use
        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if exists $gitweb_project_owner->{$project};
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
2703
# Determine how long ago the most recently committed branch head of the
# project at $path (relative to $projectroot) was committed, using
# "git for-each-ref" sorted by committer date.
# Returns (age in seconds, age_string(age)); returns (undef, undef) if
# no committer line with a timestamp was read, and nothing if git cannot
# be started or close() reports a failure.
# Sets the global $git_dir to the project as a side effect.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the committer line ends in "<epoch> <+|-hhmm>"
        return (undef, undef)
                unless (defined $most_recent &&
                        $most_recent =~ / (\d+) [-+][01]\d\d\d$/);

        my $age = time - $1;
        return ($age, age_string($age));
}
2724
# Map object names to the refs that point at them, as reported by
# "git show-ref --dereference".
# With $type (e.g. "heads" or "tags") only refs below "refs/$type" are
# requested and recorded.  Ref names are stored without the leading
# "refs/".
# Returns a reference to a hash of object name => [ ref names ];
# returns nothing if git cannot be started or close() reports a failure.
sub git_get_references {
        my $type = shift || "";
        my %refs;

        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                # the array is created on first use
                push @{ $refs{$1} }, $2;
        }
        close $fd or return;
        return \%refs;
}
2747
# Describe $hash relative to tags using "git name-rev --tags".
# Returns the name with the leading "tags/" removed; returns undef if
# $hash is empty, git printed nothing, or the revision cannot be named
# after a tag, and nothing if git cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all: nothing to match against
        return undef unless defined $name_rev;

        # \Q...\E: $hash is compared literally; revisions such as "HEAD^"
        # contain regexp metacharacters
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
2763
2764## ----------------------------------------------------------------------
2765## parse to hash functions
2766
# Break a timestamp into display fields.
#   $epoch - seconds since the epoch
#   $tz    - timezone as "+hhmm" / "-hhmm"; defaults to "-0000"
# Returns a hash with UTC fields (hour, minute, mday, day, month,
# rfc2822, mday-time, iso-8601) and fields in the given timezone
# (hour_local, minute_local, tz_local, iso-tz).
# A $tz that is not of the form [+-]hhmm is treated as offset zero.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # Offset of the timezone in seconds.  The sign applies to hours
        # and minutes alike ("-0330" is 3h30m behind UTC), and the
        # minutes must not be truncated away ("+0530").
        my $tz_offset = 0;
        if ($tz =~ m/^([+\-])([0-9][0-9])([0-9][0-9])$/) {
                my $tz_sign = ($1 eq '-') ? -1 : 1;
                $tz_offset = $tz_sign * (($2 * 60 + $3) * 60);
        }
        my $local = $epoch + $tz_offset;
        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
2798
# Parse the tag object $tag_id as printed by "git cat-file tag".
# Returns a hash with the keys id, object, type, name, author,
# author_epoch, author_tz, author_name, author_email (as far as the
# corresponding header lines are present) and comment (reference to an
# array of the remaining lines, newlines included).
# Returns nothing if git cannot be started, close() reports a failure,
# or the object has no "tag" header line.
sub parse_tag {
        my ($tag_id) = @_;
        my (%tag, @comment);

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
        $tag{'id'} = $tag_id;

        HEADER:
        while (my $line = <$fd>) {
                chomp $line;

                # an empty line ends the header
                last HEADER if $line eq "";

                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                } elsif ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                } elsif ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                } elsif ($line =~ m/--BEGIN/) {
                        # this line already belongs to the comment
                        push @comment, $line;
                        last HEADER;
                }
        }

        # everything after the header is the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
2839
# Parse one commit record as printed by "git rev-list --header".
#   $commit_text - the record: a header line "<id> [<parent>...]", the
#                  commit header fields, an empty line, and the message
#                  with each line indented by four spaces
#   $withparents - if defined, parents are taken from the header line
#                  only; otherwise "parent" header fields are added too
# Returns a hash with id, tree, parents, parent, author*/committer*
# fields, title, title_short, comment (reference to an array of message
# lines without the indent), age, age_string, age_string_date and
# age_string_age.  Returns nothing if the record is empty, does not
# start with an object name, or has no "tree" field.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        return unless @commit_lines;

        my $header = shift @commit_lines;
        return unless $header =~ m/^[0-9a-fA-F]{40}/;
        ($co{'id'}, my @parents) = split ' ', $header;

        # header fields; the loop ends at the empty line that separates
        # them from the message
        while (my $line = shift @commit_lines) {
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^(author|committer) (.*) ([0-9]+) (.*)$/) {
                        # author and committer lines share one format
                        my ($who, $ident, $epoch, $tz) = ($1, $2, $3, $4);
                        $co{$who} = to_utf8($ident);
                        $co{"${who}_epoch"} = $epoch;
                        $co{"${who}_tz"} = $tz;
                        if ($co{$who} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{"${who}_name"}  = $1;
                                $co{"${who}_email"} = $2;
                        } else {
                                $co{"${who}_name"} = $co{$who};
                        }
                }
        }
        return unless defined $co{'tree'};
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # remove added spaces (exactly once per message line)
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }

        # the title is the first non-empty message line
        foreach my $line (@commit_lines) {
                next if $line eq "";

                # Shorten a copy: the substitutions below must not leak
                # into the message stored in $co{'comment'}.
                my $title = $line;
                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        if (length($title) > 50) {
                                $title =~ s/(http|rsync):\/\///;
                        }
                        if (length($title) > 50) {
                                $title =~ s/(master|www|rsync)\.//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/kernel.org:?//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/\/pub\/scm//;
                        }
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        my $commit_date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        if ($age > 60*60*24*7*2) {
                # older than two weeks: the date goes first
                $co{'age_string_date'} = $commit_date;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = $commit_date;
        }
        return %co;
}
2937
# Read and parse the single commit $commit_id via
# "git rev-list --parents --header --max-count=1".
# Returns the hash built by parse_commit_text (parents taken from the
# header line), or an empty hash if git printed nothing or the record
# cannot be parsed.  Calls die_error(500, ...) if git cannot be started.
sub parse_commit {
        my ($commit_id) = @_;
        my %co;

        # records are terminated by NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--",
                or die_error(500, "Open git-rev-list failed");
        # Read the record in scalar context.  Inside an argument list
        # <$fd> is evaluated in list context, so empty output would
        # shift the following argument into the place of the text.
        my $commit_text = <$fd>;
        close $fd;

        %co = parse_commit_text($commit_text, 1)
                if defined $commit_text;

        return %co;
}
2956
# Read and parse up to $maxcount commits (default 1) reachable from
# $commit_id, skipping the first $skip (default 0), via
# "git rev-list --header".  @args are extra rev-list options, the
# global @extra_options are passed as well, and $filename, if true,
# limits the history to that path.
# Returns the commits as hash references (see parse_commit_text): a
# list in list context, an array reference otherwise.
# Calls die_error(500, ...) if git cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
        my @cos;

        $maxcount ||= 1;
        $skip ||= 0;

        # records are terminated by NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--header",
                   @args,
                   "--max-count=$maxcount",
                   "--skip=$skip",
                   @extra_options,
                   $commit_id,
                   "--");
        push @cmd, $filename if $filename;

        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
2984
# Parse one line of git-diff-tree "raw" output.  Three shapes are
# recognized:
#  - ordinary diff line: from_mode, to_mode, from_id, to_id, status,
#    similarity, from_file, to_file (plus file unless renamed/copied)
#  - combined diff line (merge commit): nparents, from_mode and from_id
#    (array references, one entry per parent), to_mode, to_id, status
#    (array reference of letters), to_file
#  - bare object name: commit
# Any other line gives an empty result.
# Returns a hash in list context, a hash reference otherwise.
sub parse_difftree_raw_line {
        my ($line) = @_;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} =
                        ($1, $2, $3, $4, $5, $6);
                my $names = $7;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $names);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        # (the substitution only serves as a match; $line is a private copy)
        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
                my ($colons, $modes, $ids, $letters, $name) = ($1, $2, $3, $4, $5);
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);

                $res{'nparents'}  = length($colons);
                # the last mode / id describes the result, the others the parents
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $letters) ];
                $res{'to_file'}   = unquote($name);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3023
# Return parsed info for a line of git-diff-tree "raw" output.
# A hash reference is taken to be already parsed (or generated by hand)
# and handed back unchanged; anything else is parsed with
# parse_difftree_raw_line.
sub parsed_difftree_line {
        my ($line_or_ref) = @_;

        return $line_or_ref
                if ref($line_or_ref) eq "HASH";
        return parse_difftree_raw_line($line_or_ref);
}
3036
# Parse one line of git-ls-tree output.
# Options (passed as key/value pairs after the line):
#   -l  the line was produced by "ls-tree -l" and carries a size column
#   -z  the line was produced with -z, so the name is taken literally
#       instead of being passed through unquote
# Result keys: mode, type, hash, name, and size with -l.  A line that
# does not have the expected format gives an empty result rather than
# values left over from an earlier regexp match.
# Returns a hash in list context, a hash reference otherwise.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        my $name;
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s) {
                        @res{'mode', 'type', 'hash', 'size'} = ($1, $2, $3, $4);
                        $name = $5;
                }
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s) {
                        @res{'mode', 'type', 'hash'} = ($1, $2, $3);
                        $name = $4;
                }
        }

        if (defined $name) {
                $res{'name'} = $opts{'-z'} ? $name : unquote($name);
        }

        return wantarray ? %res : \%res;
}
3072
# Fill in _two_ hashes, passed by reference as 2nd and 3rd argument
# ($from and $to), with the 'file' name and the 'href' of the "blob" view
# for the pre-image and post-image sides of $diffinfo.
# For a combined diff ($diffinfo->{'nparents'} is true) the $from entries
# are array references with one element per parent, and @parents supplies
# the hash_base of each parent; otherwise they are plain scalars.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") {
                        # new (added) file: there is no pre-image to link to
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                if (!exists $diffinfo->{'from_file'}) {
                        fill_from_file_info($diffinfo, @parents);
                }
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $from_file = $diffinfo->{'from_file'}[$i];
                        $from_file = $diffinfo->{'to_file'}
                                unless defined $from_file;
                        $from->{'file'}[$i] = $from_file;

                        if ($diffinfo->{'status'}[$i] eq "A") {
                                # new (added) file with respect to this parent
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3118
3119## ......................................................................
3120## parse to array of hashes functions
3121
# Run git-for-each-ref over refs/heads, sorted by committer date (newest
# first), and describe each head as a hash with the keys 'fullname',
# 'name', 'id', 'title', 'epoch' and 'age'.
# With a true $limit, git is asked for $limit+1 entries.
# Returns the list of hash references (list context) or a reference to it
# (scalar context); returns nothing if the command cannot be started.
sub git_get_heads_list {
        my ($limit) = @_;
        my @heads;

        my @count_opt = $limit ? ('--count='.($limit+1)) : ();
        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count_opt, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                'refs/heads'
                or return;
        while (my $line = <$fd>) {
                chomp $line;

                # "<id> <refname> <subject>" NUL "<committer> <epoch> <tz>"
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($id, $fullname, $subject) = split(' ', $refinfo, 3);
                my (undef, $epoch) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

                (my $short_name = $fullname) =~ s!^refs/heads/!!;
                my $age = $epoch ? age_string(time - $epoch) : "unknown";

                push @heads, {
                        'fullname' => $fullname,
                        'name'     => $short_name,
                        'id'       => $id,
                        'title'    => $subject || '(no commit message)',
                        'epoch'    => $epoch,
                        'age'      => $age,
                };
        }
        close $fd;

        return wantarray ? @heads : \@heads;
}
3158
# Run git-for-each-ref over refs/tags, sorted by creator date (newest
# first), and describe each tag as a hash with the keys 'fullname', 'name',
# 'type', 'id', 'reftype' and 'refid'.  Tag objects additionally get
# 'subject'; tag objects and commits additionally get 'epoch' and 'age'.
# With a true $limit, git is asked for $limit+1 entries.
# Returns the list of hash references (list context) or a reference to it
# (scalar context); returns nothing if the command cannot be started.
sub git_get_tags_list {
        my ($limit) = @_;
        my @tags;

        my @count_opt = $limit ? ('--count='.($limit+1)) : ();
        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count_opt, '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                chomp $line;

                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $fullname, $refid, $reftype, $subject) =
                        split(' ', $refinfo, 6);
                my (undef, $epoch) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

                (my $short_name = $fullname) =~ s!^refs/tags/!!;

                my %tag = (
                        'fullname' => $fullname,
                        'type'     => $type,
                        'id'       => $id,
                        'name'     => $short_name,
                );
                if ($type eq "tag") {
                        # tag object: record what it points at
                        $tag{'subject'} = $subject;
                        $tag{'reftype'} = $reftype;
                        $tag{'refid'}   = $refid;
                } else {
                        # ref points directly at the object
                        $tag{'reftype'} = $type;
                        $tag{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $tag{'epoch'} = $epoch;
                        $tag{'age'} = $epoch ? age_string(time - $epoch) : "unknown";
                }

                push @tags, \%tag;
        }
        close $fd;

        return wantarray ? @tags : \@tags;
}
3207
3208## ----------------------------------------------------------------------
3209## filesystem-related functions
3210
# Return the owner of $path as taken from the GECOS field of the passwd
# entry for the file's uid: everything up to the first ',' or ';',
# passed through to_utf8().
# Returns undef if $path cannot be stat()ed, or if there is no passwd
# entry (or no GECOS field) for its owner.
sub get_file_owner {
        my $path = shift;

        # without this check a failed stat() leaves the uid undefined, and
        # getpwuid(undef) looks up uid 0, reporting root as the owner
        my @stat = stat($path)
                or return undef;
        my $st_uid = $stat[4];

        my @pwent = getpwuid($st_uid);
        my $gcos = $pwent[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3223
# Print the contents of $filename, passing every line through to_utf8().
# The file is assumed to exist; if it nevertheless cannot be opened,
# nothing is printed.
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        # copy line by line instead of slurping the whole file into a list
        while (my $line = <$fd>) {
                print to_utf8($line);
        }
        close $fd;
}
3232
3233## ......................................................................
3234## mimetype related functions
3235
# Look up the MIME type for $filename in a mime.types-style file.
#
# $filename is the name whose extension (the text after the last '.') is
#           looked up
# $mimemap  is the path of the map file; each non-comment line is
#           "<mimetype> <ext> <ext> ..." separated by whitespace
# Returns the MIME type, or undef if the map file is not readable, the
# name has no extension, or the extension is not listed.  When an
# extension is listed more than once, the last entry wins.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # read into a lexical: a bare while (<$mh>) would overwrite the
        # caller's $_
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                # split on any whitespace, so that both tab- and
                # space-separated map files are understood
                my ($mimetype, @exts) = split(' ', $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        # use the capture only if the match succeeded, never a stale $1
        my ($wanted_ext) = ($filename =~ /\.([^.]*)$/)
                or return undef;
        return $mimemap{$wanted_ext};
}
3258
# Guess the MIME type of $filename from its extension.
# The map file named by $mimetypes_file (if set) is consulted first; when
# that gives no answer, /etc/mime.types is tried.
# Returns undef for names without a '.' and for unknown extensions.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # a relative path is taken relative to the project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');
        return $mime;
}
3275
# Decide on the MIME type of a blob.
# The file name (if given) is tried first via mimetype_guess().  Failing
# that, the contents behind filehandle $fd decide: text gives 'text/plain',
# otherwise a few well-known image extensions are recognized and
# everything else is 'application/octet-stream'.
# Without a filehandle $default_blob_plain_mimetype is returned.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;

        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3302
# Return the content type for a blob: $type if given (and true), otherwise
# whatever blob_mimetype() makes of the filehandle and file name.
# For 'text/plain' the charset from $default_text_plain_charset is
# appended when that variable is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return "$type; charset=$default_text_plain_charset";
}
3313
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# $highlight is a flag: a false value disables guessing altogether
# $mimetype  is accepted but not consulted
# $file_name is the name to guess from; a trailing '.in' is ignored, then
#            the whole basename is tried, then its extension
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);

        # configuration for 'highlight' (http://www.andre-simon.de/)
        # match by basename
        my %highlight_basename = (
                #'Program' => 'py',
                #'Library' => 'py',
                'SConstruct' => 'py', # SCons equivalent of Makefile
                'Makefile' => 'make',
        );
        # match by extension
        # NOTE: every map below must be wrapped in parentheses; a bare map
        # takes the whole rest of the list as its input, which would turn
        # all the alternate extensions into identity mappings
        my %highlight_ext = (
                # main extensions, defining name of syntax;
                # see files in /usr/share/highlight/langDefs/ directory
                (map { $_ => $_ }
                        qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl)),
                # alternate extensions, see /etc/highlight/filetypes.conf
                'h' => 'c',
                (map { $_ => 'cpp' } qw(cxx c++ cc)),
                (map { $_ => 'php' } qw(php3 php4)),
                (map { $_ => 'pl'  } qw(perl pm)), # perhaps also 'cgi'
                'mak' => 'make',
                (map { $_ => 'xml' } qw(xhtml html htm)),
        );

        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # take the extension from this match only, never from a stale $1
        my ($ext) = ($basename =~ /\.([^.]*)$/);
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3354
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# $fd        is the filehandle the blob is currently being read from
# $highlight is a flag: a false value leaves $fd alone
# $syntax    is the syntax name handed to 'highlight'; undef leaves $fd alone
# When highlighting, $fd is closed and reopened on a shell pipeline that
# feeds "git cat-file blob $hash" into the highlighter.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight && defined $syntax);

        close $fd
                or die_error(404, "Reading blob failed");

        # a two-stage pipeline needs the shell, so the command stays a single
        # string; the explicit '-|' mode keeps open() from having to parse
        # the mode out of that string
        my $pipeline = quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
                       "highlight --xhtml --fragment --syntax $syntax";
        open $fd, '-|', $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3368
3369## ======================================================================
3370## functions printing HTML: header, footer, error page
3371
# Build the page title: the site name, followed - as far as they are
# defined - by the project, the action and the file name.  In "tree" view
# a trailing '/' is added to file names that do not already end in one.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        }

        return $title;
}
3389
# Print the HTTP header and the top of the HTML page: the XHTML prologue,
# the <head> (title, base URL, stylesheets, feed links, favicon), the
# optional site header file, the page header with logo and home link and,
# for a project with the 'search' feature enabled, the search form.
#
# Parameters:
#   $status   HTTP status line; defaults to "200 OK"
#   $expires  value for the -expires parameter of the HTTP header
#   %opts     '-no_http_header' => true suppresses the HTTP header
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type;
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        if (defined $cgi->http('HTTP_ACCEPT') &&
            $cgi->http('HTTP_ACCEPT') =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
            $cgi->Accept('application/xhtml+xml') != 0) {
                $content_type = 'application/xhtml+xml';
        } else {
                $content_type = 'text/html';
        }
        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                           -status=> $status, -expires => $expires)
                unless ($opts{'-no_http_header'});
        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        if ($ENV{'PATH_INFO'}) {
                print "<base href=\"".esc_url($base_url)."\" />\n";
        }
        # print out each stylesheet that exist, providing backwards capability
        # for those people who defined $stylesheet in a config file
        if (defined $stylesheet) {
                print '<link rel="stylesheet" type="text/css" href="'.$stylesheet.'"/>'."\n";
        } else {
                foreach my $stylesheet (@stylesheets) {
                        next unless $stylesheet;
                        print '<link rel="stylesheet" type="text/css" href="'.$stylesheet.'"/>'."\n";
                }
        }
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                # the list needs real parentheses: using qw() in their place
                # is a syntax error on newer perls
                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => "$project - $href_params{'-title'} - $format feed",
                                '-type' => "application/$type+xml"
                        );

                        # work on a per-format copy, so that the 'extra_options'
                        # set for the "no merges" link below cannot leak into
                        # the plain link of the next format
                        my %feed_params = (%href_params, 'action' => $type);

                        $link_attr{'-href'} = href(%feed_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        $feed_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%feed_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       $site_name, href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       $site_name, href(project=>undef, action=>"opml"));
        }
        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href="$favicon" type="image/png" />\n);
        }

        print "</head>\n" .
              "<body>\n";

        if (defined $site_header && -f $site_header) {
                insert_file($site_header);
        }

        print "<div class=\"page_header\">\n" .
              $cgi->a({-href => esc_url($logo_url),
                       -title => $logo_label},
                      qq(<img src="$logo" width="72" height="27" alt="git" class="logo"/>));
        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        print " / $action";
                }
                print "\n";
        }
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                if (!defined $searchtext) {
                        $searchtext = "";
                }
                # search from the most specific revision known for this page
                my $search_hash;
                if (defined $hash_base) {
                        $search_hash = $hash_base;
                } elsif (defined $hash) {
                        $search_hash = $hash;
                } else {
                        $search_hash = "HEAD";
                }
                my $action = $my_uri;
                my $use_pathinfo = gitweb_check_feature('pathinfo');
                if ($use_pathinfo) {
                        # the project goes into the form's URL ...
                        $action .= "/".esc_url($project);
                }
                # start_form (not the old startform alias) to match end_form
                # below; newer CGI.pm releases no longer provide startform
                print $cgi->start_form(-method => "get", -action => $action) .
                      "<div class=\"search\">\n" .
                      # ... or else into a hidden 'p' field
                      (!$use_pathinfo &&
                      $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
                      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
                      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
                      $cgi->popup_menu(-name => 'st', -default => 'commit',
                                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
                      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
                      " search:\n",
                      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
                      "<span title=\"Extended regular expression\">" .
                      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                     -checked => $search_use_regexp) .
                      "</span>" .
                      "</div>" .
                      $cgi->end_form() . "\n";
        }
}
3543
# Print the bottom of the HTML page: the page footer (project description
# and feed links, or the OPML/TXT project list links when no project is
# selected), the optional timing information, the optional site footer
# file, the JavaScript includes, and the closing </body> and </html> tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                if (defined $descr) {
                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
                }

                my %href_params = get_feed_info();
                if (!%href_params) {
                        # no feed info for this page: mark the links as generic
                        $feed_class .= ' generic';
                }
                $href_params{'-title'} ||= 'log';

                # the list needs real parentheses: using qw() in their place
                # is a syntax error on newer perls
                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        } else {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        }
        print "</div>\n"; # class="page_footer"

        # $t0 is only set when Time::HiRes could be loaded
        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      Time::HiRes::tv_interval($t0, [Time::HiRes::gettimeofday()]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="$javascript"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } elsif (gitweb_check_feature('javascript-actions')) {
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = fixLinks;\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
3609
3610# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
3611# Example: die_error(404, 'Hash not found')
3612# By convention, use the following status codes (as defined in RFC 2616):
3613# 400: Invalid or missing CGI parameters, or
3614#      requested object exists but has wrong type.
3615# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
3616#      this server or project.
3617# 404: Requested object/revision/project doesn't exist.
3618# 500: The server isn't configured properly, or
3619#      an internal error occurred (e.g. failed assertions caused by bugs), or
3620#      an unknown error occurred (e.g. the git binary died unexpectedly).
3621# 503: The server is currently unavailable (because it is overloaded,
3622#      or down for maintenance).  Generally, this is a temporary state.
sub die_error {
        my ($status, $message, $extra, %opts) = @_;
        $status ||= 500;
        # the message is HTML-escaped here; $extra is printed verbatim
        my $error = esc_html($message) || "Internal Server Error";

        # full HTTP status lines for the status codes used by convention
        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        git_header_html($http_responses{$status}, undef, %opts);

        print "<div class=\"page_body\">\n" .
              "<br /><br />\n" .
              "$status - $error\n" .
              "<br />\n";
        print "<hr />\n" .
              "$extra\n"
                if defined $extra;
        print "</div>\n";

        git_footer_html();

        # leave request processing altogether, unless we were called as an
        # error handler (-error_handler option), in which case just return
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
3653
3654## ----------------------------------------------------------------------
3655## functions printing or outputting HTML: navigation
3656
# Print the navigation bar ("summary | shortlog | log | ...") followed by
# the $extra line.
#
#   $current   name of the current view; it is shown as plain text
#   $suppress  name of a view to leave out of the bar (if true)
#   $head      hash used for the commit/commitdiff links and, for some
#              values of $current, for the shortlog/log links as well
#   $treehead, $treebase
#              'hash' and 'hash_base' of the tree link
#   $extra     HTML for the second line (pager or formats)
# Entries configured through the 'actions' feature are inserted after the
# view they name, with %-placeholders in their links expanded.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' if !defined $extra; # pager or formats

        my @navs = qw(summary shortlog log commit commitdiff tree);
        @navs = grep { $_ ne $suppress } @navs
                if $suppress;

        # href() parameters of each entry
        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;

        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                push @with_head, qw(shortlog log)
                        if $current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x;
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # the 'actions' feature is a flat list of (label, link, position) triples
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        for (my $i = 0; $i < @actions; $i += 3) {
                my ($label, $link, $pos) = @actions[$i .. $i+2];

                # insert the new entry right after each entry named $pos
                my @with_action;
                foreach my $nav (@navs) {
                        push @with_action, $nav;
                        push @with_action, $label if $nav eq $pos;
                }
                @navs = @with_action;

                # expand the placeholders
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries;
        foreach my $nav (@navs) {
                push @entries, $nav eq $current ?
                        $nav : $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
3706
# Return the "first . prev . next" pager as HTML.
# "first" and "prev" are links only when $page > 0, "next" only when
# $has_next_link is true; otherwise the plain word is shown.
# The links replay the current request with a different 'page' parameter.
# $action is accepted but not used.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my ($first, $prev, $next) = ("first", "prev", "next");

        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                  -accesskey => "p", -title => "Alt-p"}, "prev");
        }
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
3732
3733## ......................................................................
3734## functions printing or outputting HTML: div
3735
# Print the <div class="header"> element: a link to the $action view with
# $title as its text ($action itself when $title is empty).
# $hash and $hash_base are added to the link only when they are true.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $label = $title ? $title : $action;
        my $link = $cgi->a({-href => href(%args), -class => "title"}, $label);

        print "<div class=\"header\">\n" .
              $link .
              "\n</div>\n";
}
3749
# Print what format_local_time() returns for the given date fields.
sub print_local_time {
        my $formatted = format_local_time(@_);
        print $formatted;
}
3753
# Format the local time of a date as " (HH:MM TZ)".
# Takes the date as a flat key => value list and uses its 'hour_local',
# 'minute_local' and 'tz_local' fields.  Times before 06:00 get the
# HH:MM part wrapped in <span class="atnight">.
sub format_local_time {
        my %date = @_;

        my $format = $date{'hour_local'} < 6
                ? " (<span class=\"atnight\">%02d:%02d</span> %s)"
                : " (%02d:%02d %s)";

        return sprintf($format,
                $date{'hour_local'}, $date{'minute_local'}, $date{'tz_local'});
}
3767
# Print the author of commit $co in long form: the name as an author
# search link, the author date, and the avatar.
# Options:
#   -tag => NAME     HTML element to wrap the output in (default 'div')
#   -localtime => 1  also show the author's local time after the date
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $html = "<$tag class=\"author_date\">" .
                   format_search_author($author, "author", esc_html($author)) .
                   " [$ad{'rfc2822'}";
        if ($opts{-localtime}) {
                $html .= format_local_time(%ad);
        }
        $html .= "]" . git_get_avatar($co->{'author_email'}, -pad_before => 1)
                     . "</$tag>\n";

        print $html;
}
3783
# Print table rows with the full author and/or committer information, in
# the layout of the 'commit' view (& similar): one row with the name,
# e-mail (both as search links) and avatar, and one row with the date and
# local time.
# Parameters are a commit hash reference, followed by the list of people
# to show ('author', 'committer'); an empty list means both.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') unless @people;

        foreach my $who (@people) {
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};

                my $name_link  = format_search_author($name, $who,
                                         esc_html($name));
                my $email_link = format_search_author($email, $who,
                                         esc_html("<" . $email . ">"));
                my $avatar     = git_get_avatar($email, -size => 'double');

                print "<tr><td>$who</td><td>" .
                      $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td> $wd{'rfc2822'}" .
                      format_local_time(%wd) .
                      "</td>" .
                      "</tr>\n";
        }
}
3811
# Print the "page path" navigation line: a link to the tree root, one link
# per leading directory of $name, and finally the last path component.
#
# Arguments:
#   $name - path of the displayed object inside the repository; when it is
#           undefined only the tree-root link is printed
#   $type - 'blob' or 'tree' turns the last component into a link (to the
#           'blob_plain' resp. 'tree' action); anything else prints it as
#           plain text
#   $hb   - passed as hash_base to every generated link
#
# Reads the globals $cgi, $project and $file_name.
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # Compare against the empty string instead of testing
                        # truth: a leading directory called "0" is false in
                        # boolean context and would otherwise be glued to the
                        # next component without a separator ("0foo").
                        $fullname .= ($fullname ne '' ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # NOTE(review): the links for the last component use the global
                # $file_name rather than $name -- presumably callers always
                # pass $file_name as $name; confirm before changing.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$file_name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$file_name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
3849
# Print the lines of a commit message as HTML, one "<br/>"-terminated line
# per message line.
#
# Arguments:
#   $log  - arrayref of message lines; NOTE: it is modified in place (the
#           title and leading empty lines are shifted off)
#   %opts - optional settings:
#             -remove_title     => drop the first line of the log
#             -remove_signoff   => do not print signoff-like lines
#             -final_empty_line => make sure the output ends with one
#                                  empty line
#
# Lines starting with "Signed-off-by", "Acked-by" or "Cc" (matched case
# insensitively) are printed inside <span class="signoff">.  Runs of empty
# lines are collapsed into one, and empty lines directly following a
# signoff line are not printed.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # true while we are right after a signoff line
        my $empty = 0;   # true if the last printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n"
                                unless $opts{'-remove_signoff'};
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                        # Leave "after signoff" state only on a non-empty line.
                        # Resetting the flag for every non-signoff line (empty
                        # ones included) made the $signoff test above dead code.
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
3898
# Return the link target (what the link points to) of a symlink entry.
#
# The target is the complete output of "git cat-file blob $hash".  Nothing
# is returned when the command cannot be started or when closing the pipe
# reports a failure.
sub git_get_link_target {
        my ($hash) = @_;

        open(my $pipe, "-|", git_cmd(), "cat-file", "blob", $hash)
                or return;
        # slurp the whole blob in one read
        my $target = do { local $/ = undef; <$pipe> };
        close($pipe)
                or return;

        return $target;
}
3916
# Given a link target and the directory (basedir) the link is in, return
# the target of the link relative to the top directory (top tree).
#
# Arguments:
#   $link_target - content of the symlink
#   $basedir     - directory containing the link, relative to the top
#                  tree; empty or undefined for the top tree itself
#
# Returns the normalized path (no '', '.' or '..' components), or nothing
# if that is not possible: the link is absolute, or it leads outside of
# the top directory.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir)
        my $path;
        if (defined $basedir && $basedir ne '') {
                # compare with '' instead of testing truth, so that a
                # directory called "0" is not mistaken for the top tree
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' (but keep a component named "0",
                # which a plain truth test would throw away)
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        if (@path_parts) {
                                pop @path_parts;
                        } else {
                                # link leads outside repository (outside top dir)
                                return;
                        }
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
3956
# Print one tree entry (a row of git_tree), without the enclosing <tr>.
#
# Arguments:
#   $t          - hashref describing the entry; 'mode', 'type', 'hash' and
#                 'name' are read, 'size' only if that key exists
#   $basedir    - prepended verbatim to the entry name to form file_name
#                 parameters (presumably empty or ending in '/' -- confirm
#                 against callers)
#   $hash_base  - when defined, passed along as hash_base and enables the
#                 "history" links
#   $have_blame - true to add a "blame" link for blobs
#
# The cells are: mode, optional size, name (class "list") and the action
# links (class "link").  For symlinks the name cell also shows the link
# target.
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
        my $type = $t->{'type'};
        my $path = "$basedir$t->{'name'}";

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        if ($type eq "blob") {
                # name cell; a symlink additionally gets " -> target"
                my $name_cell =
                        $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                               file_name=>$path, %base_key),
                                -class => "list"}, esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                $name_cell .= " -> ";
                                if (defined $norm_target) {
                                        # target lies inside the repository: link to it
                                        $name_cell .=
                                                $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                       file_name=>$norm_target),
                                                         -title => $norm_target}, esc_path($link_target));
                                } else {
                                        $name_cell .= esc_path($link_target);
                                }
                        }
                }
                print "<td class=\"list\">$name_cell</td>\n";

                # action links, separated by " | "
                my @links = ($cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                                    file_name=>$path, %base_key)},
                                     "blob"));
                if ($have_blame) {
                        push @links, $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                            file_name=>$path, %base_key)},
                                             "blame");
                }
                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                            hash=>$t->{'hash'}, file_name=>$path)},
                                             "history");
                }
                push @links, $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                                    file_name=>$path)},
                                     "raw");
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } elsif ($type eq "tree") {
                print "<td class=\"list\">" .
                      $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                             file_name=>$path,
                                             %base_key)},
                              esc_path($t->{'name'})) .
                      "</td>\n";

                my @links = ($cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                                    file_name=>$path,
                                                    %base_key)},
                                     "tree"));
                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                            file_name=>$path)},
                                             "history");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" . esc_path($t->{'name'}) . "</td>\n";

                my $history = "";
                if (defined $hash_base) {
                        $history = $cgi->a({-href => href(action=>"history",
                                                          hash_base=>$hash_base,
                                                          file_name=>$path)},
                                           "history");
                }
                print "<td class=\"link\">$history</td>\n";
        }
}
4049
4050## ......................................................................
4051## functions printing large fragments of HTML
4052
# Fill in the pre-image file names of a merge (combined) diff entry.
#
# Arguments:
#   $diff    - hashref of a parsed combined diff entry; 'nparents',
#              'status' (arrayref) and 'from_id' (arrayref) are read
#   @parents - ids of the parent commits, in the same order
#
# $diff->{'from_file'} is replaced by a fresh array with one slot per
# parent.  A slot is set via git_get_path_by_hash() only where the status
# for that parent is 'R' or 'C'; all other slots stay undefined.
# Returns $diff.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $nparents = $diff->{'nparents'};
        my $from_file = $diff->{'from_file'} = [ ];
        # pre-extend, so that there is a slot for every parent
        $from_file->[$nparents - 1] = undef;

        for my $i (0 .. $nparents - 1) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4069
# Tell whether a parsed raw difftree line describes a file deletion,
# i.e. whether its 'to_id' is the all-zero object id (40 times '0').
sub is_deleted {
        my ($diffinfo) = @_;
        my $null_id = '0' x 40;

        return $diffinfo->{'to_id'} eq $null_id;
}
4076
# Tell whether a patch belongs to the [previous] raw difftree line, which
# is the case for a patch that was split into several parts.
#   $diffinfo  - hashref of parsed raw diff format
#   $patchinfo - hashref of parsed patch diff format
#                (the same keys as in $diffinfo)
# True only if both are defined and name the same 'to_file'.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_known = defined($diffinfo) && defined($patchinfo);
        return $both_known
                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4087
4088
# Print the list of files changed by a commit as an HTML table
# (class "diff_tree", plus "combined" when there are several parents).
#
# Arguments:
#   $difftree - arrayref of difftree entries; each one is handed to
#               parsed_difftree_line()
#   $hash     - id of the commit being shown, used as hash_base for links
#               to the post-image
#   @parents  - ids of the parents; the first one is used as hash_base for
#               links to the pre-image, and more than one parent selects
#               the combined diff header
#
# Reads the globals $cgi and $action.  In the 'commitdiff' action every
# row gets a "#patchN" link, N counting the rows printed so far.
# An entry with a 'nparents' key is rendered as a combined diff row, any
# other entry according to its 'status' (A, D, M/T, R/C).
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1;
        my $patchno = 0;
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                # rows alternate between the "dark" and "light" classes
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => "#patch$patchno"}, "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent; remember whether a "blob" and
                        # a "history" link make sense for the result
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # A mode of '000000' means "no such side" (added or deleted
                # file); the corresponding variables then stay undefined.
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        # Test the pre-image mode here.  Testing $to_mode_oct
                        # produced a bogus permission string when a non-regular
                        # file became a regular one, and an "uninitialized"
                        # warning for deleted files.
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => "#patch$patchno"}, "patch");
                                print " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => "#patch$patchno"}, "patch");
                                print " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => "#patch$patchno"}, "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => "#patch$patchno"}, "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # the post-image (to_id / to_file) belongs to $hash, not
                        # to the parent, just like the blame and history links
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4391
# Print a whole patchset as HTML, pairing every patch read from $fd with the
# matching raw difftree entry.
#
# Parameters:
#   $fd           - filehandle the patch text is read from, one line at a time
#   $difftree     - reference to an array of raw difftree lines; each entry is
#                   run through parsed_difftree_line() before it is used
#   $hash         - not referenced in this sub
#   @hash_parents - parent hashes; more than one switches on the
#                   combined-diff handling
#
# Everything is written with print; there is no meaningful return value.
sub git_patchset_body {
	my ($fd, $difftree, $hash, @hash_parents) = @_;
	my ($hash_parent) = $hash_parents[0]; # first parent; not used further below

	my $is_combined = (@hash_parents > 1);
	my $patch_idx = 0;    # index into @$difftree of the current raw line
	my $patch_number = 0; # number of patch blocks produced so far
	my $patch_line;       # current (chomp-ed) line read from $fd
	my $diffinfo;         # parsed form of $difftree->[$patch_idx]
	my $to_name;          # file name taken from the "diff" header line
	my (%from, %to);      # filled in by parse_from_to_diffinfo()

	print "<div class=\"patchset\">\n";

	# skip to first patch
	# (if the input ends first, $patch_line is left undefined and the
	# PATCH loop below is never entered)
	while ($patch_line = <$fd>) {
		chomp $patch_line;

		last if ($patch_line =~ m/^diff /);
	}

 PATCH:
	# on entry to every iteration $patch_line holds a "diff ..." header line
	while ($patch_line) {

		# parse "git diff" header line
		if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
			# $1 is from_name, which we do not use
			$to_name = unquote($2);
			$to_name =~ s!^b/!!;
		} elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
			# $1 is 'cc' or 'combined', which we do not use
			$to_name = unquote($2);
		} else {
			$to_name = undef;
		}

		# check if current patch belongs to current raw line
		# and parse raw git-diff line if needed
		if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
			# this is continuation of a split patch
			print "<div class=\"patch cont\">\n";
		} else {
			# advance raw git-diff output if needed
			# ($diffinfo is still undefined for the very first patch,
			# which therefore stays on index 0)
			$patch_idx++ if defined $diffinfo;

			# read and prepare patch information
			$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

			# compact combined diff output can have some patches skipped
			# find which patch (using pathname of result) we are at now;
			if ($is_combined) {
				while ($to_name ne $diffinfo->{'to_file'}) {
					# raw line without a patch of its own: print the
					# simplified placeholder so that its anchor exists
					print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
					      format_diff_cc_simplified($diffinfo, @hash_parents) .
					      "</div>\n";  # class="patch"

					$patch_idx++;
					$patch_number++;

					# ran out of raw lines; $diffinfo keeps its last value
					last if $patch_idx > $#$difftree;
					$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
				}
			}

			# modifies %from, %to hashes
			parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

			# this is first patch for raw difftree line with $patch_idx index
			# we index @$difftree array from 0, but number patches from 1
			print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
		}

		# git diff header
		#assert($patch_line =~ m/^diff /) if DEBUG;
		#assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
		$patch_number++;
		# print "git diff" header
		print format_git_diff_header_line($patch_line, $diffinfo,
		                                  \%from, \%to);

		# print extended diff header
		print "<div class=\"diff extended_header\">\n";
	EXTENDED_HEADER:
		# consume lines up to the "--- " line or the next "diff " header
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

			print format_extended_diff_header_line($patch_line, $diffinfo,
			                                       \%from, \%to);
		}
		print "</div>\n"; # class="diff extended_header"

		# from-file/to-file diff header
		if (! $patch_line) {
			# input ended inside the extended header; 'last' does not run
			# the continue block, so the patch div is closed here
			print "</div>\n"; # class="patch"
			last PATCH;
		}
		# patch without from-file/to-file header and body
		next PATCH if ($patch_line =~ m/^diff /);
		#assert($patch_line =~ m/^---/) if DEBUG;

		# $last_patch_line is the "---" line, $patch_line becomes the line after it
		my $last_patch_line = $patch_line;
		$patch_line = <$fd>;
		chomp $patch_line;
		#assert($patch_line =~ m/^\+\+\+/) if DEBUG;

		print format_diff_from_to_header($last_patch_line, $patch_line,
		                                 $diffinfo, \%from, \%to,
		                                 @hash_parents);

		# the patch itself
	LINE:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			# a new "diff " header starts the next patch
			next PATCH if ($patch_line =~ m/^diff /);

			print format_diff_line($patch_line, \%from, \%to);
		}

	} continue {
		# runs after every iteration, including those left via 'next PATCH'
		print "</div>\n"; # class="patch"
	}

	# for compact combined (--cc) format, with chunk and patch simplification
	# the patchset might be empty, but there might be unprocessed raw lines
	# (the initializer steps past the raw line of the last printed patch,
	# but only if at least one patch block was produced)
	for (++$patch_idx if $patch_number > 0;
	     $patch_idx < @$difftree;
	     ++$patch_idx) {
		# read and prepare patch information
		$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

		# generate anchor for "patch" links in difftree / whatchanged part
		print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
		      format_diff_cc_simplified($diffinfo, @hash_parents) .
		      "</div>\n";  # class="patch"

		$patch_number++;
	}

	# nothing at all was printed above
	if ($patch_number == 0) {
		if (@hash_parents > 1) {
			print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
		} else {
			print "<div class=\"diff nodifferences\">No differences found</div>\n";
		}
	}

	print "</div>\n"; # class="patchset"
}
4542
4543# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4544
# Complete the per-project records in @$projlist and return the usable ones.
#
# For every project that git_get_last_activity() reports activity for, the
# 'age' and 'age_string' fields are set, 'descr'/'descr_long' and 'owner'
# are filled in when not already defined, 'forks' is set when $check_forks
# is true, and 'ctags' is set when the 'ctags' feature is enabled.
# Projects without activity information are left out of the returned list.
# NOTE: the records are modified in place; @$projlist itself keeps all of
# its entries.
sub fill_project_list_info {
	my ($projlist, $check_forks) = @_;
	my $show_ctags = gitweb_check_feature('ctags');
	my @filled;

	foreach my $proj (@$projlist) {
		my $path = $proj->{'path'};

		my @activity = git_get_last_activity($path);
		next unless @activity;
		@{$proj}{'age', 'age_string'} = @activity;

		unless (defined $proj->{'descr'}) {
			my $long_descr = to_utf8(git_get_project_description($path) || "");
			$proj->{'descr_long'} = $long_descr;
			$proj->{'descr'} =
				chop_str($long_descr, $projects_list_description_width, 5);
		}

		unless (defined $proj->{'owner'}) {
			$proj->{'owner'} = git_get_project_owner("$path") || "";
		}

		if ($check_forks) {
			# forks are looked for in a directory named like the
			# project path with its ".git" suffix removed
			my $forks_dir = $path;
			my $has_forks = ($forks_dir =~ s/\.git$//)
			             && ($forks_dir !~ /\/$/)
			             && (-d "$projectroot/$forks_dir");
			$proj->{'forks'} = $has_forks ? "-d $projectroot/$forks_dir" : 0;
		}

		if ($show_ctags) {
			$proj->{'ctags'} = git_get_project_ctags($path);
		}

		push @filled, $proj;
	}

	return @filled;
}
4585
# Print the 'sort by' <th> element that format_sort_th() builds for the
# same arguments (plain heading for the selected order, replay link otherwise).
sub print_sort_th {
	my @th_args = @_;
	print format_sort_th(@th_args);
}
4591
# Build the <th> element for one sortable column and return it as a string.
#
#   $name   - order name this column sorts by
#   $order  - order currently in effect
#   $header - heading text; defaults to $name with its first letter uppercased
#
# The column matching the current order gets a plain heading; any other
# column gets a replay link that selects its order.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header ||= ucfirst($name);

	# already sorted by this column: nothing to link to
	return "<th>$header</th>\n" if $order eq $name;

	my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
	                         -class => "header"}, $header);
	return "<th>" . $sort_link . "</th>\n";
}
4608
# Print the project list as an HTML table (class "project_list").
#
# Parameters:
#   $projlist  - reference to an array of project records; completed via
#                fill_project_list_info() before being shown
#   $order     - sort order ('project', 'descr', 'owner' or 'age');
#                defaults to $default_projects_order, any other value
#                leaves the list in the order it was returned in
#   $from, $to - index range of projects to show (defaults: whole list)
#   $extra     - if defined, printed verbatim in a final table row
#   $no_header - if true, the row of column headings is omitted
#
# Also reads the globals $project, $searchtext and the 'by_tag' CGI parameter
# to filter the rows that are printed.
sub git_project_list_body {
	# actually uses global variable $project
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;

	my $check_forks = gitweb_check_feature('forks');
	my @projects = fill_project_list_info($projlist, $check_forks);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects if (!defined $to || $#projects < $to);

	my %order_info = (
		project => { key => 'path', type => 'str' },
		descr => { key => 'descr_long', type => 'str' },
		owner => { key => 'owner', type => 'str' },
		age => { key => 'age', type => 'num' }
	);
	my $oi = $order_info{$order};
	# an order without an entry above (e.g. 'none') means "do not sort";
	# sorting on an undefined key would only produce warnings
	if (defined $oi) {
		if ($oi->{'type'} eq 'str') {
			@projects = sort {$a->{$oi->{'key'}} cmp $b->{$oi->{'key'}}} @projects;
		} else {
			@projects = sort {$a->{$oi->{'key'}} <=> $b->{$oi->{'key'}}} @projects;
		}
	}

	my $show_ctags = gitweb_check_feature('ctags');
	if ($show_ctags) {
		# sum up tag weights over all projects for the tag cloud
		my %ctags;
		foreach my $p (@projects) {
			foreach my $ct (keys %{$p->{'ctags'}}) {
				$ctags{$ct} += $p->{'ctags'}->{$ct};
			}
		}
		my $cloud = git_populate_project_tagcloud(\%ctags);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	unless ($no_header) {
		print "<tr>\n";
		if ($check_forks) {
			print "<th></th>\n";
		}
		print_sort_th('project', $order, 'Project');
		print_sort_th('descr', $order, 'Description');
		print_sort_th('owner', $order, 'Owner');
		print_sort_th('age', $order, 'Last Change');
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}
	my $alternate = 1;
	my $tagfilter = $cgi->param('by_tag');
	for (my $i = $from; $i <= $to; $i++) {
		my $pr = $projects[$i];

		next if $tagfilter and $show_ctags and not grep { lc $_ eq lc $tagfilter } keys %{$pr->{'ctags'}};
		# NOTE(review): $searchtext is interpolated as a regexp here;
		# confirm it is validated before this sub is reached
		next if $searchtext and not $pr->{'path'} =~ /$searchtext/
			and not $pr->{'descr_long'} =~ /$searchtext/;
		# Weed out forks or non-matching entries of search
		if ($check_forks) {
			my $forkbase = $project; $forkbase ||= ''; $forkbase =~ s#\.git$#/#;
			$forkbase="^$forkbase" if $forkbase;
			next if not $searchtext and not $tagfilter and $show_ctags
				and $pr->{'path'} =~ m#$forkbase.*/.*#; # regexp-safe
		}

		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		if ($check_forks) {
			print "<td>";
			if ($pr->{'forks'}) {
				print "<!-- $pr->{'forks'} -->\n";
				print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "+");
			}
			print "</td>\n";
		}
		print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		                        -class => "list"}, esc_html($pr->{'path'})) . "</td>\n" .
		      "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		                        -class => "list", -title => $pr->{'descr_long'}},
		                        esc_html($pr->{'descr'})) . "</td>\n" .
		      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
		print "<td class=\"". age_class($pr->{'age'}) . "\">" .
		      (defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits") . "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary")}, "summary")   . " | " .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"shortlog")}, "shortlog") . " | " .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"log")}, "log") . " | " .
		      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"tree")}, "tree") .
		      ($pr->{'forks'} ? " | " . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks") : '') .
		      "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n";
		if ($check_forks) {
			print "<td></td>\n";
		}
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4715
# Print the 'log' view body: for each commit a header div, navigation
# links, authorship and the full commit message.
#
# Parameters:
#   $commitlist - reference to an array of commit records (hash references)
#   $from, $to  - index range of commits to show (defaults: whole list)
#   $refs       - passed to format_ref_marker() to decorate each commit
#   $extra      - if true, printed inside a trailing "page_nav" div
sub git_log_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# start at $from, like the other *_body subs do
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		# skip entries for which no commit information is available
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
4755
# Print the 'shortlog' table: one row per commit with its date, author,
# subject and navigation links.
#
# Parameters:
#   $commitlist - reference to an array of commit records (hash references)
#   $from, $to  - index range of commits to show (defaults: whole list)
#   $refs       - passed to format_ref_marker() to decorate each subject
#   $extra      - if defined, printed verbatim in a final row
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	my $last_idx = $#{$commitlist};
	$to = $last_idx if (!defined $to || $last_idx < $to);

	# indexed by the toggle below: rows start "dark" and then alternate
	my @row_class = ('light', 'dark');
	my $alternate = 1;

	print "<table class=\"shortlog\">\n";
	for (my $idx = $from; $idx <= $to; $idx++) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"$row_class[$alternate]\">\n";
		$alternate ^= 1;

		# git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
		my $age_cell =
			"<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n";
		print $age_cell . format_author_html('td', \%co, 10) . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $commit_link =
			$cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
		my $commitdiff_link =
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		my $tree_link =
			$cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $commit_link . " | " . $commitdiff_link . " | " . $tree_link;

		# snapshot links are optional
		my $snapshot_links = format_snapshot_links($commit);
		print " | " . $snapshot_links if defined $snapshot_links;

		print "</td>\n" .
		      "</tr>\n";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4799
# Print the 'history' table for one path: one row per commit with its date,
# author, subject and navigation links.
#
# Parameters:
#   $commitlist - reference to an array of commit records (hash references)
#   $from, $to  - index range of commits to show (defaults: whole list)
#   $refs       - passed to format_ref_marker() to decorate each subject
#   $extra      - if defined, printed verbatim in a final row
#   $file_name  - path whose history is shown
#   $file_hash  - hash of the current version of that path; used for the
#                 "diff to current" link of blobs
#   $ftype      - object type, used as action name and link text
#
# Also reads the global $hash_base for the "diff to current" link.
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	$from = 0 unless defined $from;
	my $last_idx = $#{$commitlist};
	$to = $last_idx if (!defined $to || $to > $last_idx);

	# indexed by the toggle below: rows start "dark" and then alternate
	my @row_class = ('light', 'dark');
	my $alternate = 1;

	print "<table class=\"history\">\n";
	for (my $idx = $from; $idx <= $to; $idx++) {
		my %co = %{$commitlist->[$idx]};
		# entries without commit information produce no row
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"$row_class[$alternate]\">\n";
		$alternate ^= 1;

		my $age_cell =
			"<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n";
		# shortlog:   format_author_html('td', \%co, 10)
		print $age_cell . format_author_html('td', \%co, 15, 3) . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $object_link =
			$cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
		my $commitdiff_link =
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $object_link . " | " . $commitdiff_link;

		if ($ftype eq 'blob') {
			my $blob_current = $file_hash;
			my $blob_parent  = git_get_hash_by_path($commit, $file_name);
			# offer a diff only when both versions are known and differ
			my $differs = defined $blob_current
			           && defined $blob_parent
			           && $blob_current ne $blob_parent;
			if ($differs) {
				my $diff_link =
					$cgi->a({-href => href(action=>"blobdiff",
					                       hash=>$blob_current, hash_parent=>$blob_parent,
					                       hash_base=>$hash_base, hash_parent_base=>$commit,
					                       file_name=>$file_name)},
					        "diff to current");
				print " | " . $diff_link;
			}
		}

		print "</td>\n" .
		      "</tr>\n";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4859
# Print the 'tags' table: one row per tag with its age, name, subject and
# navigation links.
#
# Parameters:
#   $taglist    - reference to an array of tag records (hash references)
#   $from, $to  - index range of tags to show (defaults: whole list)
#   $extra      - if defined, printed verbatim in a final row
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	my $last_idx = $#{$taglist};
	$to = $last_idx if (!defined $to || $last_idx < $to);

	# indexed by the toggle below: rows start "dark" and then alternate
	my @row_class = ('light', 'dark');
	my $alternate = 1;

	print "<table class=\"tags\">\n";
	for (my $idx = $from; $idx <= $to; $idx++) {
		my %tag = %{$taglist->[$idx]};
		my $comment = $tag{'subject'};
		my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

		print "<tr class=\"$row_class[$alternate]\">\n";
		$alternate ^= 1;

		# age column stays empty when the age is unknown
		my $age_cell = defined $tag{'age'}
		             ? "<td><i>$tag{'age'}</i></td>\n"
		             : "<td></td>\n";
		print $age_cell;

		my $name_link =
			$cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
			         -class => "list name"}, esc_html($tag{'name'}));
		print "<td>" . $name_link . "</td>\n" . "<td>";
		if (defined $comment) {
			print format_subject_html($comment, $comment_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}

		print "</td>\n" . "<td class=\"selflink\">";
		# only tag objects get a link to their own 'tag' view
		if ($tag{'type'} eq "tag") {
			print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
		} else {
			print "&nbsp;";
		}

		my $target_link =
			$cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
		print "</td>\n" .
		      "<td class=\"link\">" . " | " . $target_link;

		# extra links depend on what the tag points at
		if ($tag{'reftype'} eq "commit") {
			my $shortlog_link =
				$cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
			my $log_link =
				$cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
			print " | " . $shortlog_link . " | " . $log_link;
		} elsif ($tag{'reftype'} eq "blob") {
			print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}

		print "</td>\n" .
		      "</tr>";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4922
# Print the 'heads' table: one row per head with its age, name and
# navigation links.
#
# Parameters:
#   $headlist   - reference to an array of head records (hash references)
#   $head       - id compared against each record's 'id'; the matching
#                 row gets the "current_head" cell class
#   $from, $to  - index range of heads to show (defaults: whole list)
#   $extra      - if defined, printed verbatim in a final row
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	my $last_idx = $#{$headlist};
	$to = $last_idx if (!defined $to || $last_idx < $to);

	# indexed by the toggle below: rows start "dark" and then alternate
	my @row_class = ('light', 'dark');
	my $alternate = 1;

	print "<table class=\"heads\">\n";
	for (my $idx = $from; $idx <= $to; $idx++) {
		my %ref = %{$headlist->[$idx]};
		my $curr = $ref{'id'} eq $head;

		print "<tr class=\"$row_class[$alternate]\">\n";
		$alternate ^= 1;

		my $age_cell  = "<td><i>$ref{'age'}</i></td>\n";
		my $name_open = $curr ? "<td class=\"current_head\">" : "<td>";
		my $name_link =
			$cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
			         -class => "list name"},esc_html($ref{'name'}));
		my $shortlog_link =
			$cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog");
		my $log_link =
			$cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log");
		my $tree_link =
			$cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'name'})}, "tree");

		print $age_cell .
		      $name_open . $name_link . "</td>\n" .
		      "<td class=\"link\">" .
		      $shortlog_link . " | " . $log_link . " | " . $tree_link .
		      "</td>\n" .
		      "</tr>";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4960
# Print the commit search result table: one row per commit with its date,
# author, subject, the matching lines of the commit message (match
# highlighted) and navigation links.
#
# Parameters:
#   $commitlist - reference to an array of commit records (hash references)
#   $from, $to  - index range of commits to show (defaults: whole list)
#   $extra      - if defined, printed verbatim in a final row
#
# Reads the global $search_regexp to locate the matches.
sub git_search_grep_body {
	my ($commitlist, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	print "<table class=\"commit_search\">\n";
	my $alternate = 1;
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		# entries without commit information produce no row
		if (!%co) {
			next;
		}
		my $commit = $co{'id'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 15, 5) .
		      "<td>" .
		      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
		               -class => "list subject"},
		              chop_and_escape_str($co{'title'}, 50) . "<br/>");
		my $comment = $co{'comment'};
		foreach my $line (@$comment) {
			if ($line =~ m/^(.*?)($search_regexp)(.*)$/i) {
				# $search_regexp may contain capture groups of its own,
				# which shifts the number of the trailing group; $+ is
				# the highest-numbered group that matched, and here that
				# is always the trailing context
				my ($lead, $match, $trail) = ($1, $2, $+);
				$match = chop_str($match, 70, 5, 'center');
				# share what is left of an 80 character budget between
				# both sides of the match, at most 30 characters each
				my $contextlen = int((80 - length($match))/2);
				$contextlen = 30 if ($contextlen > 30);
				$lead  = chop_str($lead,  $contextlen, 10, 'left');
				$trail = chop_str($trail, $contextlen, 10, 'right');

				$lead  = esc_html($lead);
				$match = esc_html($match);
				$trail = esc_html($trail);

				print "$lead<span class=\"match\">$match</span>$trail<br />";
			}
		}
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5020
5021## ======================================================================
5022## ======================================================================
5023## actions
5024
# Action: print the page listing all projects, with the optional home text
# and a project search form above the list.
#
# Reads the 'order' input parameter; an unknown value ends the request
# with a 400 error, an empty project list with a 404 error.
sub git_project_list {
	my $order = $input_params{'order'};
	# match the whole value, so that e.g. "xagex" is rejected
	if (defined $order && $order !~ m/^(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list();
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}
	# start_form is the counterpart of end_form; startform is only its
	# deprecated alias
	print $cgi->start_form(-method => "get") .
	      "<p class=\"projsearch\">Search:\n" .
	      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
	      "</p>" .
	      $cgi->end_form() . "\n";
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5050
# Action: print the page listing the forks of the current $project.
#
# Reads the 'order' input parameter; an unknown value ends the request
# with a 400 error, an empty fork list with a 404 error.
sub git_forks {
	my $order = $input_params{'order'};
	# match the whole value, so that e.g. "xagex" is rejected
	if (defined $order && $order !~ m/^(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	git_print_header_div('summary', "$project forks");
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5068
# Action: print a plain-text project index, one "path owner" line per
# project, with both fields percent-encoded.
sub git_project_index {
	my @projects = git_get_projects_list($project);

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	foreach my $pr (@projects) {
		if (!exists $pr->{'owner'}) {
			$pr->{'owner'} = git_get_project_owner("$pr->{'path'}");
		}

		my ($path, $owner) = ($pr->{'path'}, $pr->{'owner'});
		# a project without a known owner gets an empty owner field
		# instead of triggering "uninitialized value" warnings below
		$owner = '' unless defined $owner;
		# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
		$path  =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
		$owner =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
		$path  =~ s/ /\+/g;
		$owner =~ s/ /\+/g;

		print "$path $owner\n";
	}
}
5092
# Render the summary page of the current project ($project).
#
# The page consists of a metadata table (description, owner, last change,
# clone URLs and, when the 'ctags' feature is on, a content tag cloud),
# an optional README.html include (skipped when $prevent_xss is set), and
# shortlog / tags / heads / forks sections.  Each section shows at most 16
# entries and gets a "..." link to the full view when more are available.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
        my $head = $co{'id'};

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my @forklist;
        my $check_forks = gitweb_check_feature('forks');

        if ($check_forks) {
                @forklist = git_get_projects_list($project);
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td><td>$cd{'rfc2822'}</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my $url_tag = "URL";
        my @url_list = git_get_project_url_list($project);
        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
        foreach my $git_url (@url_list) {
                next unless $git_url;
                # URLs come from a per-project file or are built from the project
                # name, so escape them before embedding them in the page
                print "<tr class=\"metadata_url\"><td>$url_tag</td><td>" .
                      esc_html($git_url) . "</td></tr>\n";
                # only the first URL row carries the "URL" label
                $url_tag = "";
        }

        # Tag cloud
        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my $ctags = git_get_project_ctags($project);
                my $cloud = git_populate_project_tagcloud($ctags);
                print "<tr id=\"metadata_ctags\"><td>Content tags:<br />";
                print "</td>\n<td>" unless %$ctags;
                # the project name ends up inside an attribute value: escape it
                print "<form action=\"$show_ctags\" method=\"post\">" .
                      "<input type=\"hidden\" name=\"p\" value=\"" . esc_html($project) . "\" />" .
                      "Add: <input type=\"text\" name=\"t\" size=\"8\" /></form>";
                print "</td>\n<td>" if %$ctags;
                print git_show_project_tagcloud($cloud, 48);
                print "</td></tr>";
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file("$projectroot/$project/README.html");
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist = $head ? parse_commits($head, 17) : ();
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $#commitlist <=  15 ? undef :
                                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $#taglist <=  15 ? undef :
                              $cgi->a({-href => href(action=>"tags")}, "..."));
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $#headlist <= 15 ? undef :
                               $cgi->a({-href => href(action=>"heads")}, "..."));
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $#forklist <= 15 ? undef :
                                      $cgi->a({-href => href(action=>"forks")}, "..."),
                                      'no_header');
        }

        git_footer_html();
}
5193
# Show a single tag object (identified by $hash): the tagged object with
# links to it, the tagger (when the tag has an 'author'), and the tag
# message.  Reports a 404 error when parse_tag() yields nothing.
sub git_tag {
        # Parse and validate the tag before any output is produced, so that the
        # 404 error page is not preceded by an already-printed page header.
        my %tag = parse_tag($hash);

        if (! %tag) {
                die_error(404, "Unknown tag object");
        }

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);

        git_print_header_div('commit', esc_html($tag{'name'}), $hash);
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                               $tag{'object'}) . "</td>\n" .
              "<td class=\"link\">" . $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                                              $tag{'type'}) . "</td>\n" .
              "</tr>\n";
        if (defined($tag{'author'})) {
                git_print_authorship_rows(\%tag, 'author');
        }
        print "</table>\n\n" .
              "</div>\n";
        print "<div class=\"page_body\">";
        # the tag message, one escaped line per <br/>
        my $comment = $tag{'comment'};
        foreach my $line (@$comment) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
5228
# Shared implementation of the blame views.
#
# Takes one optional argument, the output format:
#   'porcelain'   (default) - run "git blame -p" and render the complete
#                 blame table on the server side;
#   'incremental' - print the plain file contents as a table skeleton that
#                 is expected to be filled in by JavaScript;
#   'data'        - stream the raw "git blame --incremental" output as
#                 text/plain, followed by an "END" line, and return.
# A 'porcelain' request carrying the 'js' CGI parameter is switched to
# 'incremental'.
#
# Uses the global $file_name, $hash_base and $hash; $hash_base defaults to
# the project's head and $hash is looked up by path when not given.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact comparison: a substring match would let through any type
                # merely containing "blob", and would warn on an undefined type
                if (!defined $ftype || $ftype ne 'blob') {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                print while <$fd>;
                close $fd
                        or print "ERROR $!\n";

                # terminator line, optionally followed by timing information
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              Time::HiRes::tv_interval($t0, [Time::HiRes::gettimeofday()]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        # row classes alternate between groups of lines from the same commit
        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit and line-number links are left empty here
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        # read the per-commit metadata lines up to the tab-prefixed
                        # content line; the first value seen for each key is kept
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a group size is present only on the first line of a group
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent commit
                        # when one is known, otherwise to the blamed commit itself
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
5458
# 'blame' action: blame view in the default output format.
sub git_blame {
        return git_blame_common();
}
5462
# 'blame_incremental' action: blame view in the 'incremental' format.
sub git_blame_incremental {
        return git_blame_common('incremental');
}
5466
# 'blame_data' action: blame output in the 'data' format.
sub git_blame_data {
        return git_blame_common('data');
}
5470
# 'tags' action: page listing every tag returned by git_get_tags_list().
# The table is omitted when there are no tags.
sub git_tags {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head_hash,undef,$head_hash);
        git_print_header_div('summary', $project);

        my @all_tags = git_get_tags_list();
        git_tags_body(\@all_tags) if @all_tags;

        git_footer_html();
}
5483
# 'heads' action: page listing every head returned by git_get_heads_list().
# The table is omitted when there are no heads.
sub git_heads {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head_hash,undef,$head_hash);
        git_print_header_div('summary', $project);

        my @all_heads = git_get_heads_list();
        git_heads_body(\@all_heads, $head_hash) if @all_heads;

        git_footer_html();
}
5496
# 'blob_plain' action: send the raw contents of a blob to the client.
#
# Takes one optional argument, the content type to use; when it is not
# given the type is determined by blob_contenttype().  The blob is taken
# from the global $hash, or looked up from $hash_base (default: project
# head) and $file_name when $hash is not defined.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name is sent inside a quoted header parameter: neutralize control
        # characters and backslash-escape '"' and '\' so that an unusual file
        # name cannot terminate the quoted string or break the header.
        $save_as =~ s/[[:cntrl:]]/?/g;
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        # The type may carry parameters such as "; charset=...", so the safe
        # types are matched up to the end of the media type only.
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and pass it through unmodified
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
5549
# 'blob' action: HTML view of a blob.
#
# The blob is taken from the global $hash, or looked up from $hash_base
# (default: project head) and $file_name when $hash is not defined.
# Content that is neither text/* nor gif/png/jpeg and tests as binary is
# handed over to git_blob_plain().  Images are shown through an <img>
# element pointing at the blob_plain view; everything else is printed line
# by line with line-number anchors, optionally syntax highlighted.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: show the (escaped) object name instead
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">" . esc_html($hash) . "</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="$mimetype"!;
                if ($file_name) {
                        # file names are repository content: escape them before
                        # placing them in attribute values
                        my $name_attr = esc_html($file_name);
                        print qq! alt="$name_attr" title="$name_attr"!;
                }
                print qq! src="! .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        } else {
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # with a highlighter in use the line is printed as-is,
                        # otherwise it is HTML-escaped here
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, href(-replay => 1), $nr, $nr, $syntax ? $line : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
5641
# 'tree' action: HTML listing of a tree object.
#
# $hash_base defaults to "HEAD".  The tree is taken from the global $hash,
# or looked up from $hash_base and $file_name, or is $hash_base itself when
# neither is given.  Entries are read from "git ls-tree -z" (with -l when
# the 'show-sizes' feature is on) and printed as alternating dark/light
# table rows, preceded by a ".." row when a parent directory is known.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # entries are NUL-terminated because of the -z option
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD"),
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # the base is not a commit we can parse: forget it and show the
                # (escaped) object name as the title instead
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">" . esc_html($hash) . "</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                # strip the last path component; an empty result means the
                # parent is the top-level tree, which is linked without a path
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                undef $up unless $up;
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
5751
# Build the base name used for a snapshot: "<project>-<version>".
#
# Arguments: project path and the hash / ref name being snapshotted.
# Returns the name in scalar context, and the pair (name, name) in list
# context.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $base = to_utf8($project);
        $base =~ s,([^/])/*\.git$,$1,;
        $base = basename($base);
        # sanitize name
        $base =~ s/[[:cntrl:]]/?/g;

        my $version = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                my $expanded = git_get_full_hash($project, $hash);
                $version = git_get_short_hash($project, $hash)
                        if ($expanded =~ /^$hash/ && length($hash) > 7);
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $version = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                $version = $1
                        if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!);
                $version .= '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $version =~ s!/!.!g;

        # name = project-version_string
        my $snapshot = "$base-$version";

        return ($snapshot, $snapshot) if wantarray;
        return $snapshot;
}
5788
# 'snapshot' action: stream an archive of the tree-ish $hash to the client.
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  The format must be a known,
# enabled and supported one, and $hash must name an existing object that is
# not a blob; otherwise the request ends in die_error().
#
# The archive is produced by "git archive", optionally piped through the
# compressor configured for the format, and copied to STDOUT in raw mode.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # "^{}" peels tags, so the type checked is that of the tagged object
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the archiver before any header is written, so that a failure
        # to launch it is reported before a "200 OK" header has gone out.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # quote characters that are special inside a quoted-string
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # Copy in fixed-size chunks rather than reading the whole archive
        # into memory; read() yields 0 at end of file and undef on error.
        while (read($fd, my $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
5836
# Shared driver for the log-like views.
#
# Parameters:
#   $fmt_name   - name of the view, passed to format_paging_nav() and
#                 git_print_page_nav()
#   $body_subr  - code reference that prints the list of commits
#   $base       - revision to start from; defaults to the project's HEAD
#   $parent     - if defined, only commits in "$parent..$base" are listed
#   $file_name  - if defined, history is limited to this path
#   $file_hash  - object id of that path; looked up from the listed commits
#                 when not given
#
# One page shows up to 100 commits; 101 are requested so that the presence
# of a further page can be detected.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                for (my $i = 0; $i < @commitlist; $i++) {
                        $file_hash = git_get_hash_by_path($commitlist[$i]{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # Call in list context and take the first value, as git_commitdiff
        # does.  NOTE(review): if gitweb_get_feature() returns a list, a
        # scalar-context call could yield an element count instead of the
        # configured limit -- confirm against its definition.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # offer the "patches" link only if the listed commits fit
                # within the limit (a negative limit allows any number)
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project);
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        # the body routine is handed the index range 0..99 of @commitlist
        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
5910
# 'log' action: list commits starting at $hash (restricted to the range
# "$hash_parent..$hash" when $hash_parent is set), with git_log_body
# printing the entries.
sub git_log {
        my @revisions = ($hash, $hash_parent);
        return git_log_generic('log', \&git_log_body, @revisions);
}
5915
# 'commit' action: show a single commit -- authorship, ids of the commit,
# its tree and its parents, the log message and the list of changed files.
#
# The commit is $hash, falling back to $hash_base and then to "HEAD".
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
                or die_error(404, "Unknown commit object");

        my $first_parent = $co{'parent'};
        my $parent_ids   = $co{'parents'}; # array reference

        # navigation links are put together first, before the diff is read
        my $nav_links;
        if (!defined $first_parent) {
                # commit without parents
                $nav_links = '(initial)';
        } elsif (@$parent_ids == 1) {
                # ordinary commit
                $nav_links = '(parent: ' .
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$first_parent)},
                                esc_html(substr($first_parent, 0, 7))) .
                        ')';
        } else {
                # merge: one link per parent
                my @merge_links = map {
                        $cgi->a({-href => href(action=>"commit",
                                               hash=>$_)},
                                esc_html(substr($_, 0, 7)));
                } @$parent_ids;
                $nav_links = '(merge: ' . join(' ', @merge_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parent_ids <= 1) {
                $nav_links .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # a commit without parents is diffed with --root,
        # a merge is shown as a combined diff (-c)
        my $diff_base = defined $first_parent ? $first_parent : "--root";
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parent_ids <= 1 ? $diff_base : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        chomp(my @difftree = <$fd>);
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # a page addressed by a full 40-digit id may be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;

        my $refs = git_get_references();
        my $ref_marker = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $nav_links);

        my $title = esc_html($co{'title'}) . $ref_marker;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        # header table: authorship, commit id, tree, parents
        print qq{<div class="title_text">\n} .
              qq{<table class="object_header">\n};
        git_print_authorship_rows(\%co);
        print '<tr><td>commit</td><td class="sha1">' . $co{'id'} . "</td></tr>\n";
        print "<tr>" .
              "<td>tree</td>" .
              qq{<td class="sha1">} .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
                       class => "list"}, $co{'tree'}) .
              "</td>" .
              qq{<td class="link">} .
              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
                      "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td>" .
              "</tr>\n";

        for my $parent_id (@$parent_ids) {
                print "<tr>" .
                      "<td>parent</td>" .
                      qq{<td class="sha1">} .
                      $cgi->a({-href => href(action=>"commit", hash=>$parent_id),
                               class => "list"}, $parent_id) .
                      "</td>" .
                      qq{<td class="link">} .
                      $cgi->a({-href => href(action=>"commit", hash=>$parent_id)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$parent_id)}, "diff") .
                      "</td>" .
                      "</tr>\n";
        }
        print "</table>" .
              "</div>\n";

        # log message
        print qq{<div class="page_body">\n};
        git_print_log($co{'comment'});
        print "</div>\n";

        # changed files
        git_difftree_body(\@difftree, $hash, @$parent_ids);

        git_footer_html();
}
6029
# 'object' action: work out the type of the requested object and redirect
# to the view named after that type.
#
# The object is identified either by
#  - $hash or $hash_base alone, or
#  - $hash_base together with $file_name.
# Anything else is answered with a 400 error.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                close $fd
                        or die_error(404, "Object does not exist");
                # Check the command's result before touching $type: when
                # cat-file prints nothing, $type is undef and must not be
                # chomped or used as an action name.
                defined $type
                        or die_error(404, "Object does not exist");
                chomp $type;

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                # drop trailing slashes from the path
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
6076
# 'blobdiff' action: show the difference between two versions of one file.
#
# Parameter: output format, 'html' (default) or 'plain'.
#
# The file is looked up in the diff between $hash_parent_base and $hash_base,
# selected either by $file_name (and $file_parent) or by the blob id $hash.
# The diff must identify exactly one file; otherwise the request ends in
# die_error().
sub git_blobdiff {
        my $format = shift || 'html';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                # \Q...\E: $hash is matched literally, never as a pattern
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever was not given from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status, like every other die_error() call here
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">$hash vs $hash_parent</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # quote characters that are special inside a quoted-string,
                # the same way git_snapshot does for its file name
                (my $patch_name = "$file_name") =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # rewrite the patch header (up to and including the "+++" line)
                # so that blob ids used as names become file names
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
6208
# 'blobdiff_plain' action: the blob diff in its 'plain' output format.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
6212
# 'commitdiff' action and its variants: show the changes made by a commit.
#
# Named parameters:
#   -format => 'html' (default), 'plain' or 'patch'
#   -single => true to limit 'patch' output to one patch
#
# The commit is $hash (falling back to $hash_base, then "HEAD"); it is
# compared against $hash_parent when that is set.  For merge commits the
# html and plain formats use a combined diff ('--cc', or '-c' on request).
# The 'patch' format runs git-format-patch and requires the 'patches'
# feature to be enabled.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of them
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$hash_parent)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$co{'parent'})},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$_)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                # '-c' and '--cc' are diff-tree options selecting a combined
                # diff, not revisions: they must not be used to build a
                # "parent..commit" range for format-patch.
                if ($hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # NOTE(review): $refs is not used below; the call is kept in
                # case git_get_references() has side effects -- confirm and drop.
                my $refs = git_get_references("tags");
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";
                # quote characters that are special inside a quoted-string,
                # the same way git_snapshot does for its file name
                $filename =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";
                # same quoting as for the 'plain' format above
                $filename =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit parent commit, diff against all parents
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
6437
# 'commitdiff_plain' action: the commit diff in its 'plain' output format.
sub git_commitdiff_plain {
        my %options = ('-format' => 'plain');
        return git_commitdiff(%options);
}
6441
6442# format-patch-style patches
# 'patch' action: the commit diff in 'patch' format with the -single flag set.
sub git_patch {
        return git_commitdiff('-format' => 'patch',
                              '-single' => 1);
}
6446
# 'patches' action: the commit diff in 'patch' format, without the
# -single flag.
sub git_patches {
        my %options = ('-format' => 'patch');
        return git_commitdiff(%options);
}
6450
# 'history' action: log of the commits touching $file_name, starting at
# $hash_base (restricted to "$hash_parent_base..$hash_base" when the
# former is set), with git_history_body printing the entries.
# $hash is passed on as the object id of the file.
sub git_history {
        my @revisions = ($hash_base, $hash_parent_base);
        my @file      = ($file_name, $hash);
        return git_log_generic('history', \&git_history_body,
                               @revisions, @file);
}
6456
# Action handler for 'search': print an HTML page with the search results.
#
# Works on request globals rather than on arguments:
#   $searchtext        - text to look for (required)
#   $searchtype        - 'commit' (default), 'author', 'committer',
#                        'pickaxe' or 'grep'
#   $search_use_regexp - true to treat $searchtext as a regular expression
#   $search_regexp     - pattern used to highlight matches in 'grep' output
#   $hash              - commit whose history (commit/author/committer) or
#                        tree (grep) is searched; defaults to the project head
#   $page              - result page for the commit/author/committer search
#
# Errors are reported through die_error(): 403 when search (or the requested
# pickaxe/grep variant) is disabled, 400 when no search text was given, 404
# when $hash does not name a commit, and 500 when the git command needed for
# pickaxe/grep cannot be started.
#
# NOTE(review): the pickaxe "git log" invocation is not given $hash, so it
# presumably searches from git's default starting point -- confirm that this
# is intended.
sub git_search {
        gitweb_check_feature('search') or die_error(403, "Search is disabled");
        if (!defined $searchtext) {
                die_error(400, "Text field is empty");
        }
        if (!defined $hash) {
                $hash = git_get_head_hash($project);
        }
        my %co = parse_commit($hash);
        if (!%co) {
                die_error(404, "Unknown commit object");
        }
        if (!defined $page) {
                $page = 0;
        }

        $searchtype ||= 'commit';

        # Start the git command for pickaxe/grep before any output is sent,
        # so that a failure can still be reported as a proper error page.
        my $fd;
        if ($searchtype eq 'pickaxe') {
                # pickaxe may take all resources of your box and run for several minutes
                # with every query - so decide by yourself how public you make this feature
                gitweb_check_feature('pickaxe')
                    or die_error(403, "Pickaxe is disabled");
                open $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                        '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                        ($search_use_regexp ? '--pickaxe-regex' : ())
                        or die_error(500, "Open git-log failed");
        } elsif ($searchtype eq 'grep') {
                gitweb_check_feature('grep')
                    or die_error(403, "Grep is disabled");
                # '-e' keeps a pattern that starts with '-' from being
                # interpreted as a git-grep option.
                open $fd, '-|', git_cmd(), 'grep', '-n',
                        ($search_use_regexp ? ('-E', '-i') : '-F'),
                        '-e', $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");
        }

        git_header_html();

        # search type => option handed to parse_commits()
        my %log_option_for = (
                'commit'    => "--grep=",
                'author'    => "--author=",
                'committer' => "--committer=",
        );
        if (defined(my $greptype = $log_option_for{$searchtype})) {
                $greptype .= $searchtext;
                # ask for one commit more than fits on a page (100) to find
                # out whether there is a next page
                my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                               $greptype, '--regexp-ignore-case',
                                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

                my $paging_nav = '';
                if ($page > 0) {
                        $paging_nav .=
                                $cgi->a({-href => href(action=>"search", hash=>$hash,
                                                       searchtext=>$searchtext,
                                                       searchtype=>$searchtype)},
                                        "first");
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                } else {
                        $paging_nav .= "first";
                        $paging_nav .= " &sdot; prev";
                }
                my $next_link = '';
                if ($#commitlist >= 100) {
                        $next_link =
                                $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                         -accesskey => "n", -title => "Alt-n"}, "next");
                        $paging_nav .= " &sdot; $next_link";
                } else {
                        $paging_nav .= " &sdot; next";
                }

                git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);
                if ($page == 0 && !@commitlist) {
                        print "<p>No match.</p>\n";
                } else {
                        git_search_grep_body(\@commitlist, 0, 99, $next_link);
                }
        }

        if ($searchtype eq 'pickaxe') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"pickaxe search\">\n";
                my $alternate = 1;
                local $/ = "\n";
                # from here on %co holds the commit whose table row is open
                undef %co;

                # Close the table row of the commit currently held in %co
                # (no-op when no row has been opened yet).
                my $finish_commit_row = sub {
                        return unless %co;
                        print "</td>\n" .
                              "<td class=\"link\">" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                              " | " .
                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                        print "</td>\n" .
                              "</tr>\n";
                };

                while (my $line = <$fd>) {
                        chomp $line;
                        next unless $line;

                        my %set = parse_difftree_raw_line($line);
                        if (defined $set{'commit'}) {
                                # a commit id line starts a new row
                                $finish_commit_row->();

                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                %co = parse_commit($set{'commit'});
                                my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                                      "<td><i>$author</i></td>\n" .
                                      "<td>" .
                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                              -class => "list subject"},
                                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        } elsif (defined $set{'to_id'}) {
                                # an all-zero id means there is no resulting blob to link to
                                next if ($set{'to_id'} =~ m/^0{40}$/);

                                # fall back to 'to_file' when 'file' is not set,
                                # the same way git_feed picks the file name
                                my $shown_file = $set{'file'} || $set{'to_file'};
                                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                              -class => "list"},
                                              "<span class=\"match\">" . esc_path($shown_file) . "</span>") .
                                      "<br/>\n";
                        }
                }
                close $fd;

                # finish last commit
                $finish_commit_row->();

                print "</table>\n";
        }

        if ($searchtype eq 'grep') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"grep_search\">\n";
                my $alternate = 1;
                my $matches = 0;
                local $/ = "\n";
                my $lastfile = '';
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($file, $lno, $ltext, $binary);
                        # stop reading once the listing gets too long
                        last if ($matches++ > 1000);
                        if ($line =~ /^Binary file (.+) matches$/) {
                                $file = $1;
                                $binary = 1;
                        } else {
                                # the first colon-separated field is discarded
                                (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
                        }
                        if ($file ne $lastfile) {
                                # new file: close the previous row, open the next one
                                $lastfile and print "</td></tr>\n";
                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                print "<td class=\"list\">".
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file"),
                                                -class => "list"}, esc_path($file));
                                print "</td><td>\n";
                                $lastfile = $file;
                        }
                        if ($binary) {
                                print "<div class=\"binary\">Binary file</div>\n";
                        } else {
                                $ltext = untabify($ltext);
                                # wrap the matching part of the line in a "match" span
                                if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                        $ltext = esc_html($1, -nbsp=>1);
                                        $ltext .= '<span class="match">';
                                        $ltext .= esc_html($2, -nbsp=>1);
                                        $ltext .= '</span>';
                                        $ltext .= esc_html($3, -nbsp=>1);
                                } else {
                                        $ltext = esc_html($ltext, -nbsp=>1);
                                }
                                print "<div class=\"pre\">" .
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file").'#l'.$lno,
                                                -class => "linenr"}, sprintf('%4i', $lno))
                                        . ' ' .  $ltext . "</div>\n";
                        }
                }
                if ($lastfile) {
                        print "</td></tr>\n";
                        if ($matches > 1000) {
                                print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                        }
                } else {
                        print "<div class=\"diff nodifferences\">No matches found</div>\n";
                }
                close $fd;

                print "</table>\n";
        }
        git_footer_html();
}
6673
# Action handler: print the help page describing the available search
# types.  The 'grep' and 'pickaxe' entries are only listed when the
# corresponding feature is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general introduction plus the always available 'commit' search
        print <<'HELP_INTRO';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        if (gitweb_check_feature('grep')) {
                print <<'HELP_GREP';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        print <<'HELP_PEOPLE';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        if (gitweb_check_feature('pickaxe')) {
                print <<'HELP_PICKAXE';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
6717
# Action handler: 'shortlog' view.  Delegates to git_log_generic(), using
# git_shortlog_body() as the body renderer and the request globals $hash
# and $hash_parent as the selection.
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
6722
6723## ......................................................................
6724## feeds (RSS, Atom; OPML)
6725
# Print a web feed (RSS 2.0 or Atom) of recent commits.
#
# Parameters:
#   $format - 'rss' or 'atom'; defaults to 'atom'.  Any other value ends
#             in die_error(400).
#
# The feed covers the commits returned by parse_commits() for $hash (or
# 'HEAD' when $hash is not set), limited to $file_name when that is set.
# When the request carries If-Modified-Since and the newest commit is not
# newer than that date, only a "304 Not Modified" header is printed (this
# needs HTTP::Date or Time::ParseDate to parse the date).  For HEAD requests
# only the HTTP header is printed.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                %latest_date   = parse_date($latest_epoch);
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # both date parsers are optional; without either of
                        # them the full feed is always sent
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title is built from request data and is put into XML below,
        # so it has to be escaped just like $descr and $owner
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (defined $descr) {
                $descr = esc_html($descr);
        } else {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                # guard on the variable that is actually printed
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for my $i (0 .. $#commitlist) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'});

                # get list of changed files; a commit whose diff-tree cannot
                # be read is left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        # print an escaped copy; do not modify the commit
                        # data through the loop alias
                        print esc_html($line) . "\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
6981
# Action handler: print the feed in RSS format (see git_feed).
sub git_rss {
        my $format = 'rss';
        return git_feed($format);
}
6985
# Action handler: print the feed in Atom format (see git_feed).
sub git_atom {
        my $format = 'atom';
        return git_feed($format);
}
6989
# Action handler: print an OPML document with one RSS outline per project.
#
# Projects come from git_get_projects_list(); a project is left out when
# its head hash cannot be determined or its head commit cannot be parsed.
# Sets the global $git_dir to each project's directory while iterating.
sub git_opml {
        my @list = git_get_projects_list();

        # $site_name goes into XML text below, so escape it first
        my $title = esc_html($site_name);

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;
                my $head = git_get_head_hash($proj{'path'});
                next if !defined $head;

                # parse_commit() is called after pointing $git_dir at this project
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                next if !%co;

                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                # the URLs end up in XML attribute values: escape them as well
                my $rss  = esc_html(href('project' => $proj{'path'}, 'action' => 'rss', -full => 1));
                my $html = esc_html(href('project' => $proj{'path'}, 'action' => 'summary', -full => 1));
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}