gitweb / gitweb.perlon commit Merge branch 'maint-1.7.1' into maint-1.7.2 (6a7f71d)
   1#!/usr/bin/perl
   2
   3# gitweb - simple web interface to track changes in git repositories
   4#
   5# (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
   6# (C) 2005, Christian Gierke
   7#
   8# This program is licensed under the GPLv2
   9
  10use strict;
  11use warnings;
  12use CGI qw(:standard :escapeHTML -nosticky);
  13use CGI::Util qw(unescape);
  14use CGI::Carp qw(fatalsToBrowser set_message);
  15use Encode;
  16use Fcntl ':mode';
  17use File::Find qw();
  18use File::Basename qw(basename);
  19binmode STDOUT, ':utf8';
  20
# Start-of-request timestamp as returned by Time::HiRes::gettimeofday().
# Stays undefined when Time::HiRes cannot be loaded, so code that reports
# timings must cope with an undefined $t0.
our $t0;
if (eval { require Time::HiRes; 1; }) {
        $t0 = [Time::HiRes::gettimeofday()];
}
# Running count of git commands executed; incremented by the code that
# runs them (e.g. evaluate_git_version).
our $number_of_git_cmds = 0;

BEGIN {
        # Only done when running under mod_perl (MOD_PERL is set);
        # presumably this precompiles CGI.pm's methods once at startup.
        CGI->compile() if $ENV{'MOD_PERL'};
}

# "++GIT_VERSION++" looks like a build-time placeholder -- presumably it is
# substituted when gitweb.cgi is generated from this file.
our $version = "++GIT_VERSION++";
  32
  33our ($my_url, $my_uri, $base_url, $path_info, $home_link);
  34sub evaluate_uri {
  35        our $cgi;
  36
  37        our $my_url = $cgi->url();
  38        our $my_uri = $cgi->url(-absolute => 1);
  39
  40        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
  41        # needed and used only for URLs with nonempty PATH_INFO
  42        our $base_url = $my_url;
  43
  44        # When the script is used as DirectoryIndex, the URL does not contain the name
  45        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
  46        # have to do it ourselves. We make $path_info global because it's also used
  47        # later on.
  48        #
  49        # Another issue with the script being the DirectoryIndex is that the resulting
  50        # $my_url data is not the full script URL: this is good, because we want
  51        # generated links to keep implying the script name if it wasn't explicitly
  52        # indicated in the URL we're handling, but it means that $my_url cannot be used
  53        # as base URL.
  54        # Therefore, if we needed to strip PATH_INFO, then we know that we have
  55        # to build the base URL ourselves:
  56        our $path_info = $ENV{"PATH_INFO"};
  57        if ($path_info) {
  58                if ($my_url =~ s,\Q$path_info\E$,, &&
  59                    $my_uri =~ s,\Q$path_info\E$,, &&
  60                    defined $ENV{'SCRIPT_NAME'}) {
  61                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
  62                }
  63        }
  64
  65        # target of the home link on top of all pages
  66        our $home_link = $my_uri || "/";
  67}
  68
# NOTE(review): the "++NAME++" strings in this section look like build-time
# placeholders -- presumably substituted when gitweb.cgi is generated.

# Core git executable to use.
# This can be just "git" if your web server has a sensible PATH.
our $GIT = "++GIT_BINDIR++/git";

# Absolute filesystem path that is prepended to the project path.
#our $projectroot = "/pub/scm";
our $projectroot = "++GITWEB_PROJECTROOT++";

# Filesystem traversal limit used when building the project list;
# the depth is counted relative to $projectroot.
our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";

# Text of the home link shown at the top of every page.
our $home_link_str = "++GITWEB_HOME_LINK_STR++";

# Name of your site or organization, shown in page titles.
# Replace this with something more descriptive for clearer bookmarks.
# When empty, falls back to "<SERVER_NAME> Git" (or "Untitled Git").
our $site_name = "++GITWEB_SITENAME++"
                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";

# Filename of HTML text to include at the top of each page.
our $site_header = "++GITWEB_SITE_HEADER++";
# HTML text to include on the home page.
our $home_text = "++GITWEB_HOMETEXT++";
# Filename of HTML text to include at the bottom of each page.
our $site_footer = "++GITWEB_SITE_FOOTER++";

# URIs of the stylesheets.
our @stylesheets = ("++GITWEB_CSS++");
# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
# Left undefined by default.
our $stylesheet = undef;
# URI of the Git logo (72x27 pixels).
our $logo = "++GITWEB_LOGO++";
# URI of the Git favicon, assumed to be of type image/png.
our $favicon = "++GITWEB_FAVICON++";
# URI of gitweb.js (JavaScript code for gitweb).
our $javascript = "++GITWEB_JS++";

# URI and label (title) of the Git logo link.
#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
#our $logo_label = "git documentation";
our $logo_url = "http://git-scm.com/";
our $logo_label = "git homepage";

# Source of the projects list.
our $projects_list = "++GITWEB_LIST++";

# Width (in characters) of the "Description" column of the projects list.
our $projects_list_description_width = 25;

# Default sort order of the projects list.
# Valid values are none, project, descr, owner, and age.
our $default_projects_order = "project";

# Show a repository only if this file exists in it
# (only effective if this variable evaluates to true).
our $export_ok = "++GITWEB_EXPORT_OK++";

# Show a repository only if this subroutine returns true
# when given the path to the project, for example:
#    sub { return -e "$_[0]/git-daemon-export-ok"; }
our $export_auth_hook = undef;

# Only allow viewing of repositories that are also shown on the overview page.
our $strict_export = "++GITWEB_STRICT_EXPORT++";

# List of git base URLs used to build the URLs a project can be fetched
# from, i.e. the full URL is "$git_base_url/$project".
# Empty entries (e.g. an unset build-time value) are dropped.
our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");

# Default MIME type for blob_plain, and default charset for text/plain blobs.
our $default_blob_plain_mimetype = 'text/plain';
our $default_text_plain_charset  = undef;

# File to use for guessing MIME types before trying /etc/mime.types
# (relative to the current git repository).
our $mimetypes_file = undef;

# Assume this charset if a line contains non-UTF-8 characters.
# It should be a valid encoding (see Encode::Supported(3pm) for the list)
# in which every byte sequence is valid, for example 'iso-8859-1' aka
# 'latin1' (it is decoded without checking, so it could even be 'utf-8'
# to get the old behavior).
our $fallback_encoding = 'latin1';

# Rename detection options for git-diff and git-diff-tree:
# - the default is '-M', with a cost proportional to
#   (number of removed files) * (number of new files).
# - more costly is '-C' (which implies '-M'), with a cost proportional to
#   (number of changed files + number of removed files) * (number of new files)
# - even more costly is '-C', '--find-copies-harder', with a cost of
#   (number of files in the original tree) * (number of new files)
# - one might also want to include the '-B' option, e.g. '-B', '-M'
our @diff_opts = ('-M'); # taken from git_commit

# Disables features that would allow repository owners to inject script into
# the gitweb domain.
our $prevent_xss = 0;

 168# information about snapshot formats that gitweb is capable of serving
 169our %known_snapshot_formats = (
 170        # name => {
 171        #       'display' => display name,
 172        #       'type' => mime type,
 173        #       'suffix' => filename suffix,
 174        #       'format' => --format for git-archive,
 175        #       'compressor' => [compressor command and arguments]
 176        #                       (array reference, optional)
 177        #       'disabled' => boolean (optional)}
 178        #
 179        'tgz' => {
 180                'display' => 'tar.gz',
 181                'type' => 'application/x-gzip',
 182                'suffix' => '.tar.gz',
 183                'format' => 'tar',
 184                'compressor' => ['gzip']},
 185
 186        'tbz2' => {
 187                'display' => 'tar.bz2',
 188                'type' => 'application/x-bzip2',
 189                'suffix' => '.tar.bz2',
 190                'format' => 'tar',
 191                'compressor' => ['bzip2']},
 192
 193        'txz' => {
 194                'display' => 'tar.xz',
 195                'type' => 'application/x-xz',
 196                'suffix' => '.tar.xz',
 197                'format' => 'tar',
 198                'compressor' => ['xz'],
 199                'disabled' => 1},
 200
 201        'zip' => {
 202                'display' => 'zip',
 203                'type' => 'application/x-zip',
 204                'suffix' => '.zip',
 205                'format' => 'zip'},
 206);
 207
 208# Aliases so we understand old gitweb.snapshot values in repository
 209# configuration.
 210our %known_snapshot_format_aliases = (
 211        'gzip'  => 'tgz',
 212        'bzip2' => 'tbz2',
 213        'xz'    => 'txz',
 214
 215        # backward compatibility: legacy gitweb config support
 216        'x-gzip' => undef, 'gz' => undef,
 217        'x-bzip2' => undef, 'bz2' => undef,
 218        'x-zip' => undef, '' => undef,
 219);
 220
# Pixel sizes for icons and avatars. If the default font sizes or line
# heights are changed, it may be appropriate to change these values too,
# via $GITWEB_CONFIG.
our %avatar_size = (
        'default' => 16,
        'double'  => 32
);

# Maximum system load at which gitweb still answers queries.
# If the server load exceeds this value, a "503 server busy" error is
# returned (see check_loadavg).
# If gitweb cannot determine the server load, it is taken to be 0.
# Leave it undefined (or set it to 'undef') to turn off load checking.
our $maxload = 300;
 234
# Site-wide feature defaults are defined here; override them in
# $GITWEB_CONFIG as necessary.
our %feature = (
        # feature => {
        #       'sub' => feature-sub (subroutine),
        #       'override' => allow-override (boolean),
        #       'default' => [ default options...] (array reference)}
        #
        # If a feature is overridable (i.e. allow-override has a true value)
        # and a project is selected, feature-sub is called with the default
        # options as parameters; its return value is the effective setting
        # of the feature for that project.
        #
        # If there is no 'sub' key (no feature-sub), the feature cannot be
        # overridden.
        #
        # Use gitweb_get_feature(<feature>) to retrieve the <feature> value
        # (an array) or gitweb_check_feature(<feature>) to check whether
        # <feature> is enabled.

        # Enable the 'blame' blob view, showing the last commit that modified
        # each line in the file. This can be very CPU-intensive.

        # To enable system wide, put in $GITWEB_CONFIG
        # $feature{'blame'}{'default'} = [1];
        # To allow a project specific setting, enable override in $GITWEB_CONFIG
        # $feature{'blame'}{'override'} = 1;
        # and set in the project config gitweb.blame = 0|1;
        'blame' => {
                'sub' => sub { feature_bool('blame', @_) },
                'override' => 0,
                'default' => [0]},

        # Enable the 'snapshot' link, providing a compressed archive of any
        # tree. This can potentially generate high traffic if you have large
        # projects.

        # The value is a list of formats defined in %known_snapshot_formats
        # that you wish to offer.
        # To disable system wide, put in $GITWEB_CONFIG
        # $feature{'snapshot'}{'default'} = [];
        # To allow a project specific setting, enable override in $GITWEB_CONFIG
        # $feature{'snapshot'}{'override'} = 1;
        # and set in the project config a comma-separated list of formats,
        # or "none" to disable.  Example: gitweb.snapshot = tbz2,zip;
        'snapshot' => {
                'sub' => \&feature_snapshot,
                'override' => 0,
                'default' => ['tgz']},

        # Enable text search, which lists the commits whose author,
        # committer or commit text matches a given string.  Enabled by default.
        # Project specific override is not supported.
        'search' => {
                'override' => 0,
                'default' => [1]},

        # Enable grep search, which lists the files in the currently selected
        # tree that contain the given string. Enabled by default. This can be
        # potentially CPU-intensive, of course.

        # To enable system wide, put in $GITWEB_CONFIG
        # $feature{'grep'}{'default'} = [1];
        # To allow a project specific setting, enable override in $GITWEB_CONFIG
        # $feature{'grep'}{'override'} = 1;
        # and set in the project config gitweb.grep = 0|1;
        'grep' => {
                'sub' => sub { feature_bool('grep', @_) },
                'override' => 0,
                'default' => [1]},

        # Enable the pickaxe search, which lists the commits that modified
        # a given string in a file. This can be a practical and much faster
        # alternative to 'blame', but it is still potentially CPU-intensive.

        # To enable system wide, put in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'default'} = [1];
        # To allow a project specific setting, enable override in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'override'} = 1;
        # and set in the project config gitweb.pickaxe = 0|1;
        'pickaxe' => {
                'sub' => sub { feature_bool('pickaxe', @_) },
                'override' => 0,
                'default' => [1]},

        # Enable showing the size of blobs in a 'tree' view, in a separate
        # column, similar to what 'ls -l' does.  This costs a bit of I/O.

        # To disable system wide, put in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'default'} = [0];
        # To allow a project specific setting, enable override in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'override'} = 1;
        # and set in the project config gitweb.showsizes = 0|1;
        # (note: the project config key has no dash, unlike the feature name)
        'show-sizes' => {
                'sub' => sub { feature_bool('showsizes', @_) },
                'override' => 0,
                'default' => [1]},

        # Make gitweb use an alternative format of the URLs which can be
        # more readable and natural-looking: the project name is embedded
        # directly in the path and the query string contains other
        # auxiliary information. All gitweb installations recognize
        # URLs in either format; this configures in which format gitweb
        # generates links.

        # To enable system wide, put in $GITWEB_CONFIG
        # $feature{'pathinfo'}{'default'} = [1];
        # Project specific override is not supported.

        # Note that you will need to change the default location of CSS,
        # favicon, logo and possibly other files to an absolute URL. Also,
        # if gitweb.cgi serves as your indexfile, you will need to force
        # $my_uri to contain the script name in your $GITWEB_CONFIG.
        'pathinfo' => {
                'override' => 0,
                'default' => [0]},

        # Make gitweb consider projects in project root subdirectories
        # to be forks of existing projects. Given project $projname.git,
        # projects matching $projname/*.git will not be shown in the main
        # projects list; instead a '+' mark will be added to $projname
        # there and a 'forks' view will be enabled for the project, listing
        # all the forks. If the project list is taken from a file, forks have
        # to be listed after the main project.

        # To enable system wide, put in $GITWEB_CONFIG
        # $feature{'forks'}{'default'} = [1];
        # Project specific override is not supported.
        'forks' => {
                'override' => 0,
                'default' => [0]},

        # Insert custom links into the action bar of all project pages.
        # This mainly enables you to link to third-party scripts integrating
        # into gitweb, e.g. git-browser for graphical history representation
        # or a custom web-based repository administration interface.

        # The 'default' value consists of a list of triplets in the form
        # (label, link, position) where position is the label after which
        # to insert the link and link is a format string where %n expands
        # to the project name, %f to the project path within the filesystem,
        # %h to the current hash (h gitweb parameter) and %b to the current
        # hash base (hb gitweb parameter); %% expands to %.

        # To enable system wide, put in $GITWEB_CONFIG e.g.
        # $feature{'actions'}{'default'} = [('graphiclog',
        #       '/git-browser/by-commit.html?r=%n', 'summary')];
        # Project specific override is not supported.
        'actions' => {
                'override' => 0,
                'default' => []},

        # Allow gitweb to scan the project content tags described in ctags/
        # of the project repository, and display the popular Web 2.0-ish
        # "tag cloud" near the project list. Note that this is something
        # COMPLETELY different from the normal Git tags.

        # gitweb by itself can show existing tags, but it does not handle
        # tagging itself; you need an external application for that.
        # For an example script, check Girocco's cgi/tagproj.cgi.
        # You may want to install the HTML::TagCloud Perl module to get
        # a pretty tag cloud instead of just a list of tags.

        # To enable system wide, put in $GITWEB_CONFIG
        # $feature{'ctags'}{'default'} = ['path_to_tag_script'];
        # Project specific override is not supported.
        'ctags' => {
                'override' => 0,
                'default' => [0]},

        # The maximum number of patches in a patchset generated in patch
        # view. Set this to 0 or undef to disable patch view, or to a
        # negative number to remove any limit.

        # To disable system wide, put in $GITWEB_CONFIG
        # $feature{'patches'}{'default'} = [0];
        # To allow a project specific setting, enable override in $GITWEB_CONFIG
        # $feature{'patches'}{'override'} = 1;
        # and set in the project config gitweb.patches = 0|n;
        # where n is the maximum number of patches allowed in a patchset.
        'patches' => {
                'sub' => \&feature_patches,
                'override' => 0,
                'default' => [16]},

        # Avatar support. When this feature is enabled, views such as
        # shortlog or commit will display an avatar associated with
        # the email of the committer(s) and/or author(s).

        # Currently available providers are gravatar and picon.
        # If an unknown provider is specified, the feature is disabled.

        # Gravatar depends on Digest::MD5.
        # Picon currently relies on the indiana.edu database.

        # To enable system wide, put in $GITWEB_CONFIG
        # $feature{'avatar'}{'default'} = ['<provider>'];
        # where <provider> is either gravatar or picon.
        # To allow a project specific setting, enable override in $GITWEB_CONFIG
        # $feature{'avatar'}{'override'} = 1;
        # and set in the project config gitweb.avatar = <provider>;
        'avatar' => {
                'sub' => \&feature_avatar,
                'override' => 0,
                'default' => ['']},

        # Enable displaying how much time and how many git commands
        # it took to generate and display a page.  Disabled by default.
        # Project specific override is not supported.
        'timed' => {
                'override' => 0,
                'default' => [0]},

        # Enable turning some links into links to actions which require
        # JavaScript to run (like 'blame_incremental').  Not enabled by
        # default.  Project specific override is currently not supported.
        'javascript-actions' => {
                'override' => 0,
                'default' => [0]},

        # Syntax highlighting support. This is based on Daniel Svensson's
        # and Sham Chukoury's work in gitweb-xmms2.git.
        # It requires the 'highlight' program to be present in $PATH,
        # and is therefore disabled by default.

        # To enable system wide, put in $GITWEB_CONFIG
        # $feature{'highlight'}{'default'} = [1];
        # NOTE(review): the entry has a feature-sub reading the 'highlight'
        # project config key, so a per-project override via
        # $feature{'highlight'}{'override'} = 1 looks possible -- confirm.

        'highlight' => {
                'sub' => sub { feature_bool('highlight', @_) },
                'override' => 0,
                'default' => [0]},
);
 467
 468sub gitweb_get_feature {
 469        my ($name) = @_;
 470        return unless exists $feature{$name};
 471        my ($sub, $override, @defaults) = (
 472                $feature{$name}{'sub'},
 473                $feature{$name}{'override'},
 474                @{$feature{$name}{'default'}});
 475        # project specific override is possible only if we have project
 476        our $git_dir; # global variable, declared later
 477        if (!$override || !defined $git_dir) {
 478                return @defaults;
 479        }
 480        if (!defined $sub) {
 481                warn "feature $name is not overridable";
 482                return @defaults;
 483        }
 484        return $sub->(@defaults);
 485}
 486
 487# A wrapper to check if a given feature is enabled.
 488# With this, you can say
 489#
 490#   my $bool_feat = gitweb_check_feature('bool_feat');
 491#   gitweb_check_feature('bool_feat') or somecode;
 492#
 493# instead of
 494#
 495#   my ($bool_feat) = gitweb_get_feature('bool_feat');
 496#   (gitweb_get_feature('bool_feat'))[0] or somecode;
 497#
 498sub gitweb_check_feature {
 499        return (gitweb_get_feature(@_))[0];
 500}
 501
 502
 503sub feature_bool {
 504        my $key = shift;
 505        my ($val) = git_get_project_config($key, '--bool');
 506
 507        if (!defined $val) {
 508                return ($_[0]);
 509        } elsif ($val eq 'true') {
 510                return (1);
 511        } elsif ($val eq 'false') {
 512                return (0);
 513        }
 514}
 515
 516sub feature_snapshot {
 517        my (@fmts) = @_;
 518
 519        my ($val) = git_get_project_config('snapshot');
 520
 521        if ($val) {
 522                @fmts = ($val eq 'none' ? () : split /\s*[,\s]\s*/, $val);
 523        }
 524
 525        return @fmts;
 526}
 527
 528sub feature_patches {
 529        my @val = (git_get_project_config('patches', '--int'));
 530
 531        if (@val) {
 532                return @val;
 533        }
 534
 535        return ($_[0]);
 536}
 537
 538sub feature_avatar {
 539        my @val = (git_get_project_config('avatar'));
 540
 541        return @val ? @val : @_;
 542}
 543
 544# checking HEAD file with -e is fragile if the repository was
 545# initialized long time ago (i.e. symlink HEAD) and was pack-ref'ed
 546# and then pruned.
 547sub check_head_link {
 548        my ($dir) = @_;
 549        my $headfile = "$dir/HEAD";
 550        return ((-e $headfile) ||
 551                (-l $headfile && readlink($headfile) =~ /^refs\/heads\//));
 552}
 553
 554sub check_export_ok {
 555        my ($dir) = @_;
 556        return (check_head_link($dir) &&
 557                (!$export_ok || -e "$dir/$export_ok") &&
 558                (!$export_auth_hook || $export_auth_hook->($dir)));
 559}
 560
 561# process alternate names for backward compatibility
 562# filter out unsupported (unknown) snapshot formats
 563sub filter_snapshot_fmts {
 564        my @fmts = @_;
 565
 566        @fmts = map {
 567                exists $known_snapshot_format_aliases{$_} ?
 568                       $known_snapshot_format_aliases{$_} : $_} @fmts;
 569        @fmts = grep {
 570                exists $known_snapshot_formats{$_} &&
 571                !$known_snapshot_formats{$_}{'disabled'}} @fmts;
 572}
 573
 574our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);
 575sub evaluate_gitweb_config {
 576        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
 577        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
 578        # die if there are errors parsing config file
 579        if (-e $GITWEB_CONFIG) {
 580                do $GITWEB_CONFIG;
 581                die $@ if $@;
 582        } elsif (-e $GITWEB_CONFIG_SYSTEM) {
 583                do $GITWEB_CONFIG_SYSTEM;
 584                die $@ if $@;
 585        }
 586}
 587
 588# Get loadavg of system, to compare against $maxload.
 589# Currently it requires '/proc/loadavg' present to get loadavg;
 590# if it is not present it returns 0, which means no load checking.
 591sub get_loadavg {
 592        if( -e '/proc/loadavg' ){
 593                open my $fd, '<', '/proc/loadavg'
 594                        or return 0;
 595                my @load = split(/\s+/, scalar <$fd>);
 596                close $fd;
 597
 598                # The first three columns measure CPU and IO utilization of the last one,
 599                # five, and 10 minute periods.  The fourth column shows the number of
 600                # currently running processes and the total number of processes in the m/n
 601                # format.  The last column displays the last process ID used.
 602                return $load[0] || 0;
 603        }
 604        # additional checks for load average should go here for things that don't export
 605        # /proc/loadavg
 606
 607        return 0;
 608}
 609
 610# version of the core git binary
 611our $git_version;
 612sub evaluate_git_version {
 613        our $git_version = qx("$GIT" --version) =~ m/git version (.*)$/ ? $1 : "unknown";
 614        $number_of_git_cmds++;
 615}
 616
 617sub check_loadavg {
 618        if (defined $maxload && get_loadavg() > $maxload) {
 619                die_error(503, "The load average on the server is too high");
 620        }
 621}
 622
 623# ======================================================================
 624# input validation and dispatch
 625
# Input parameters can be collected from a variety of sources (presently, CGI
# and PATH_INFO), so we define an %input_params hash that collects them all
# together during validation: this allows subsequent uses (e.g. href()) to be
# agnostic of the parameter origin.

our %input_params = ();

# Input parameters are stored with the long parameter name as key. This
# mapping is also used in the href subroutine to convert parameters to their
# CGI equivalent, and since the href() usage is the most frequent one, we
# store the name -> CGI key mapping here, instead of the reverse.
#
# XXX: Warning: If you touch this, check whether the search form needs
# updating, too.

# Kept as an ordered list in addition to the hash below, because the
# position of the entries matters (see the note on the last entry).
our @cgi_param_mapping = (
        project => "p",
        action => "a",
        file_name => "f",
        file_parent => "fp",
        hash => "h",
        hash_parent => "hp",
        hash_base => "hb",
        hash_parent_base => "hpb",
        page => "pg",
        order => "o",
        searchtext => "s",
        searchtype => "st",
        snapshot_format => "sf",
        extra_options => "opt",
        search_use_regexp => "sr",
        # this must be last entry (for manipulation from JavaScript)
        javascript => "js"
);
# Same mapping as a hash, for lookup by long parameter name.
our %cgi_param_mapping = @cgi_param_mapping;
 661
 662# we will also need to know the possible actions, for validation
 663our %actions = (
 664        "blame" => \&git_blame,
 665        "blame_incremental" => \&git_blame_incremental,
 666        "blame_data" => \&git_blame_data,
 667        "blobdiff" => \&git_blobdiff,
 668        "blobdiff_plain" => \&git_blobdiff_plain,
 669        "blob" => \&git_blob,
 670        "blob_plain" => \&git_blob_plain,
 671        "commitdiff" => \&git_commitdiff,
 672        "commitdiff_plain" => \&git_commitdiff_plain,
 673        "commit" => \&git_commit,
 674        "forks" => \&git_forks,
 675        "heads" => \&git_heads,
 676        "history" => \&git_history,
 677        "log" => \&git_log,
 678        "patch" => \&git_patch,
 679        "patches" => \&git_patches,
 680        "rss" => \&git_rss,
 681        "atom" => \&git_atom,
 682        "search" => \&git_search,
 683        "search_help" => \&git_search_help,
 684        "shortlog" => \&git_shortlog,
 685        "summary" => \&git_summary,
 686        "tag" => \&git_tag,
 687        "tags" => \&git_tags,
 688        "tree" => \&git_tree,
 689        "snapshot" => \&git_snapshot,
 690        "object" => \&git_object,
 691        # those below don't need $project
 692        "opml" => \&git_opml,
 693        "project_list" => \&git_project_list,
 694        "project_index" => \&git_project_index,
 695);
 696
 697# finally, we have the hash of allowed extra_options for the commands that
 698# allow them
 699our %allowed_options = (
 700        "--no-merges" => [ qw(rss atom log shortlog history) ],
 701);
 702
 703# fill %input_params with the CGI parameters. All values except for 'opt'
 704# should be single values, but opt can be an array. We should probably
 705# build an array of parameters that can be multi-valued, but since for the time
 706# being it's only this one, we just single it out
 707sub evaluate_query_params {
 708        our $cgi;
 709
 710        while (my ($name, $symbol) = each %cgi_param_mapping) {
 711                if ($symbol eq 'opt') {
 712                        $input_params{$name} = [ $cgi->param($symbol) ];
 713                } else {
 714                        $input_params{$name} = $cgi->param($symbol);
 715                }
 716        }
 717}
 718
 719# now read PATH_INFO and update the parameter list for missing parameters
 720sub evaluate_path_info {
 721        return if defined $input_params{'project'};
 722        return if !$path_info;
 723        $path_info =~ s,^/+,,;
 724        return if !$path_info;
 725
 726        # find which part of PATH_INFO is project
 727        my $project = $path_info;
 728        $project =~ s,/+$,,;
 729        while ($project && !check_head_link("$projectroot/$project")) {
 730                $project =~ s,/*[^/]*$,,;
 731        }
 732        return unless $project;
 733        $input_params{'project'} = $project;
 734
 735        # do not change any parameters if an action is given using the query string
 736        return if $input_params{'action'};
 737        $path_info =~ s,^\Q$project\E/*,,;
 738
 739        # next, check if we have an action
 740        my $action = $path_info;
 741        $action =~ s,/.*$,,;
 742        if (exists $actions{$action}) {
 743                $path_info =~ s,^$action/*,,;
 744                $input_params{'action'} = $action;
 745        }
 746
 747        # list of actions that want hash_base instead of hash, but can have no
 748        # pathname (f) parameter
 749        my @wants_base = (
 750                'tree',
 751                'history',
 752        );
 753
 754        # we want to catch
 755        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
 756        my ($parentrefname, $parentpathname, $refname, $pathname) =
 757                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?(.+?)(?::(.+))?$/);
 758
 759        # first, analyze the 'current' part
 760        if (defined $pathname) {
 761                # we got "branch:filename" or "branch:dir/"
 762                # we could use git_get_type(branch:pathname), but:
 763                # - it needs $git_dir
 764                # - it does a git() call
 765                # - the convention of terminating directories with a slash
 766                #   makes it superfluous
 767                # - embedding the action in the PATH_INFO would make it even
 768                #   more superfluous
 769                $pathname =~ s,^/+,,;
 770                if (!$pathname || substr($pathname, -1) eq "/") {
 771                        $input_params{'action'} ||= "tree";
 772                        $pathname =~ s,/$,,;
 773                } else {
 774                        # the default action depends on whether we had parent info
 775                        # or not
 776                        if ($parentrefname) {
 777                                $input_params{'action'} ||= "blobdiff_plain";
 778                        } else {
 779                                $input_params{'action'} ||= "blob_plain";
 780                        }
 781                }
 782                $input_params{'hash_base'} ||= $refname;
 783                $input_params{'file_name'} ||= $pathname;
 784        } elsif (defined $refname) {
 785                # we got "branch". In this case we have to choose if we have to
 786                # set hash or hash_base.
 787                #
 788                # Most of the actions without a pathname only want hash to be
 789                # set, except for the ones specified in @wants_base that want
 790                # hash_base instead. It should also be noted that hand-crafted
 791                # links having 'history' as an action and no pathname or hash
 792                # set will fail, but that happens regardless of PATH_INFO.
 793                $input_params{'action'} ||= "shortlog";
 794                if (grep { $_ eq $input_params{'action'} } @wants_base) {
 795                        $input_params{'hash_base'} ||= $refname;
 796                } else {
 797                        $input_params{'hash'} ||= $refname;
 798                }
 799        }
 800
 801        # next, handle the 'parent' part, if present
 802        if (defined $parentrefname) {
 803                # a missing pathspec defaults to the 'current' filename, allowing e.g.
 804                # someproject/blobdiff/oldrev..newrev:/filename
 805                if ($parentpathname) {
 806                        $parentpathname =~ s,^/+,,;
 807                        $parentpathname =~ s,/$,,;
 808                        $input_params{'file_parent'} ||= $parentpathname;
 809                } else {
 810                        $input_params{'file_parent'} ||= $input_params{'file_name'};
 811                }
 812                # we assume that hash_parent_base is wanted if a path was specified,
 813                # or if the action wants hash_base instead of hash
 814                if (defined $input_params{'file_parent'} ||
 815                        grep { $_ eq $input_params{'action'} } @wants_base) {
 816                        $input_params{'hash_parent_base'} ||= $parentrefname;
 817                } else {
 818                        $input_params{'hash_parent'} ||= $parentrefname;
 819                }
 820        }
 821
 822        # for the snapshot action, we allow URLs in the form
 823        # $project/snapshot/$hash.ext
 824        # where .ext determines the snapshot and gets removed from the
 825        # passed $refname to provide the $hash.
 826        #
 827        # To be able to tell that $refname includes the format extension, we
 828        # require the following two conditions to be satisfied:
 829        # - the hash input parameter MUST have been set from the $refname part
 830        #   of the URL (i.e. they must be equal)
 831        # - the snapshot format MUST NOT have been defined already (e.g. from
 832        #   CGI parameter sf)
 833        # It's also useless to try any matching unless $refname has a dot,
 834        # so we check for that too
 835        if (defined $input_params{'action'} &&
 836                $input_params{'action'} eq 'snapshot' &&
 837                defined $refname && index($refname, '.') != -1 &&
 838                $refname eq $input_params{'hash'} &&
 839                !defined $input_params{'snapshot_format'}) {
 840                # We loop over the known snapshot formats, checking for
 841                # extensions. Allowed extensions are both the defined suffix
 842                # (which includes the initial dot already) and the snapshot
 843                # format key itself, with a prepended dot
 844                while (my ($fmt, $opt) = each %known_snapshot_formats) {
 845                        my $hash = $refname;
 846                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
 847                                next;
 848                        }
 849                        my $sfx = $1;
 850                        # a valid suffix was found, so set the snapshot format
 851                        # and reset the hash parameter
 852                        $input_params{'snapshot_format'} = $fmt;
 853                        $input_params{'hash'} = $hash;
 854                        # we also set the format suffix to the one requested
 855                        # in the URL: this way a request for e.g. .tgz returns
 856                        # a .tgz instead of a .tar.gz
 857                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
 858                        last;
 859                }
 860        }
 861}
 862
 863our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
 864     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
 865     $searchtext, $search_regexp);
 866sub evaluate_and_validate_params {
 867        our $action = $input_params{'action'};
 868        if (defined $action) {
 869                if (!validate_action($action)) {
 870                        die_error(400, "Invalid action parameter");
 871                }
 872        }
 873
 874        # parameters which are pathnames
 875        our $project = $input_params{'project'};
 876        if (defined $project) {
 877                if (!validate_project($project)) {
 878                        undef $project;
 879                        die_error(404, "No such project");
 880                }
 881        }
 882
 883        our $file_name = $input_params{'file_name'};
 884        if (defined $file_name) {
 885                if (!validate_pathname($file_name)) {
 886                        die_error(400, "Invalid file parameter");
 887                }
 888        }
 889
 890        our $file_parent = $input_params{'file_parent'};
 891        if (defined $file_parent) {
 892                if (!validate_pathname($file_parent)) {
 893                        die_error(400, "Invalid file parent parameter");
 894                }
 895        }
 896
 897        # parameters which are refnames
 898        our $hash = $input_params{'hash'};
 899        if (defined $hash) {
 900                if (!validate_refname($hash)) {
 901                        die_error(400, "Invalid hash parameter");
 902                }
 903        }
 904
 905        our $hash_parent = $input_params{'hash_parent'};
 906        if (defined $hash_parent) {
 907                if (!validate_refname($hash_parent)) {
 908                        die_error(400, "Invalid hash parent parameter");
 909                }
 910        }
 911
 912        our $hash_base = $input_params{'hash_base'};
 913        if (defined $hash_base) {
 914                if (!validate_refname($hash_base)) {
 915                        die_error(400, "Invalid hash base parameter");
 916                }
 917        }
 918
 919        our @extra_options = @{$input_params{'extra_options'}};
 920        # @extra_options is always defined, since it can only be (currently) set from
 921        # CGI, and $cgi->param() returns the empty array in array context if the param
 922        # is not set
 923        foreach my $opt (@extra_options) {
 924                if (not exists $allowed_options{$opt}) {
 925                        die_error(400, "Invalid option parameter");
 926                }
 927                if (not grep(/^$action$/, @{$allowed_options{$opt}})) {
 928                        die_error(400, "Invalid option parameter for this action");
 929                }
 930        }
 931
 932        our $hash_parent_base = $input_params{'hash_parent_base'};
 933        if (defined $hash_parent_base) {
 934                if (!validate_refname($hash_parent_base)) {
 935                        die_error(400, "Invalid hash parent base parameter");
 936                }
 937        }
 938
 939        # other parameters
 940        our $page = $input_params{'page'};
 941        if (defined $page) {
 942                if ($page =~ m/[^0-9]/) {
 943                        die_error(400, "Invalid page parameter");
 944                }
 945        }
 946
 947        our $searchtype = $input_params{'searchtype'};
 948        if (defined $searchtype) {
 949                if ($searchtype =~ m/[^a-z]/) {
 950                        die_error(400, "Invalid searchtype parameter");
 951                }
 952        }
 953
 954        our $search_use_regexp = $input_params{'search_use_regexp'};
 955
 956        our $searchtext = $input_params{'searchtext'};
 957        our $search_regexp;
 958        if (defined $searchtext) {
 959                if (length($searchtext) < 2) {
 960                        die_error(403, "At least two characters are required for search parameter");
 961                }
 962                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
 963        }
 964}
 965
 966# path to the current git repository
 967our $git_dir;
 968sub evaluate_git_dir {
 969        our $git_dir = "$projectroot/$project" if $project;
 970}
 971
 972our (@snapshot_fmts, $git_avatar);
 973sub configure_gitweb_features {
 974        # list of supported snapshot formats
 975        our @snapshot_fmts = gitweb_get_feature('snapshot');
 976        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);
 977
 978        # check that the avatar feature is set to a known provider name,
 979        # and for each provider check if the dependencies are satisfied.
 980        # if the provider name is invalid or the dependencies are not met,
 981        # reset $git_avatar to the empty string.
 982        our ($git_avatar) = gitweb_get_feature('avatar');
 983        if ($git_avatar eq 'gravatar') {
 984                $git_avatar = '' unless (eval { require Digest::MD5; 1; });
 985        } elsif ($git_avatar eq 'picon') {
 986                # no dependencies
 987        } else {
 988                $git_avatar = '';
 989        }
 990}
 991
 992# custom error handler: 'die <message>' is Internal Server Error
 993sub handle_errors_html {
 994        my $msg = shift; # it is already HTML escaped
 995
 996        # to avoid infinite loop where error occurs in die_error,
 997        # change handler to default handler, disabling handle_errors_html
 998        set_message("Error occured when inside die_error:\n$msg");
 999
1000        # you cannot jump out of die_error when called as error handler;
1001        # the subroutine set via CGI::Carp::set_message is called _after_
1002        # HTTP headers are already written, so it cannot write them itself
1003        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
1004}
1005set_message(\&handle_errors_html);
1006
# dispatch
#
# Pick a default for $action when none was requested, check that the action
# is known and that a project is present when the action needs one, then
# call the handler registered in %actions.
sub dispatch {
	unless (defined $action) {
		# in order of preference: type of the requested object, type of
		# the requested path, project summary, list of projects
		$action =
			  defined $hash
			? git_get_type($hash)
			: (defined $hash_base && defined $file_name)
			? git_get_type("$hash_base:$file_name")
			: defined $project
			? 'summary'
			: 'project_list';
	}

	die_error(400, "Unknown action")
		unless defined($actions{$action});

	# only these actions can work without a project
	my $works_without_project =
		($action =~ m/^(?:opml|project_list|project_index)$/);
	die_error(400, "Project needed")
		if (!$works_without_project && !$project);

	$actions{$action}->();
}
1029
# Restart the per-request bookkeeping: take a new start timestamp (only if
# $t0 is already defined) and zero the count of git commands.
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	if (defined $t0) {
		$t0 = [Time::HiRes::gettimeofday()];
	}
	$number_of_git_cmds = 0;
}
1035
# Serve one request: run the per-request setup steps in their fixed order
# and finally hand over to dispatch().
sub run_request {
	reset_timer();

	# request URL, then the load check
	evaluate_uri();
	check_loadavg();

	# collect parameters: query string first, then PATH_INFO, then
	# validate them and derive $git_dir
	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1051
# by default a process handles exactly one request
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
# name of the class used to create the request object
our $CGI = 'CGI';
our $cgi;

# Switch to CGI::Fast for request objects and replace $is_last_request
# with a counting closure.
sub configure_as_fcgi {
	require CGI::Fast;
	our $CGI = 'CGI::Fast';

	# let each child service 100 requests
	my $served = 0;
	our $is_last_request = sub {
		$served += 1;
		return $served > 100;
	};
}
# Decide from the script name and from @ARGV whether to run as FastCGI,
# and optionally set up the FCGI::ProcManager hooks.
sub evaluate_argv {
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return unless (@ARGV);

	# handler for --nproc: silently does nothing when FCGI::ProcManager
	# cannot be loaded
	my $use_proc_manager = sub {
		my ($opt_name, $n_processes) = @_;
		eval { require FCGI::ProcManager; 1; }
			or return;
		my $manager = FCGI::ProcManager->new({
			n_processes => $n_processes,
		});
		our $pre_listen_hook    = sub { $manager->pm_manage()        };
		our $pre_dispatch_hook  = sub { $manager->pm_pre_dispatch()  };
		our $post_dispatch_hook = sub { $manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i'      => $use_proc_manager,
	);
}
1086
# Top-level driver: evaluate command line, configuration and git version
# once, then create request objects and serve them with run_request() until
# no further object is returned or $is_last_request says to stop.  The
# optional hooks are called before listening and around each request.
sub run {
	evaluate_argv();
	evaluate_gitweb_config();
	evaluate_git_version();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list ||= $projectroot;

	$pre_listen_hook->()
		if $pre_listen_hook;

 REQUEST:
	while ($cgi = $CGI->new()) {
		$pre_dispatch_hook->()
			if $pre_dispatch_hook;

		run_request();

		# call the *post*-dispatch hook here; calling the pre-dispatch
		# hook a second time would leave the post-dispatch hook unused
		$post_dispatch_hook->()
			if $post_dispatch_hook;

		last REQUEST if ($is_last_request->());
	}

 DONE_GITWEB:
	1;
}
1114
run();

# wrapped in a subroutine processing requests,
# e.g. mod_perl with ModPerl::Registry, or PSGI with Plack::App::WrapCGI:
# hand control back to the wrapper
return if defined caller;

# pure CGI script, serving single request
exit;
1125
1126## ======================================================================
1127## action links
1128
# Build a gitweb URL from named parameters (the names of @cgi_param_mapping,
# e.g. project, action, hash, file_name).  'project' defaults to the current
# $project.  Returns the URL as a string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		# take over every parameter of the current request that the
		# caller did not pass explicitly; only the names are needed
		foreach my $name (keys %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_url($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot
		# (the action may be absent, so test for that first)
		my $is_snapshot = defined $params{'action'} &&
			$params{'action'} eq 'snapshot';

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_url($params{'action'}) unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
			|| $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_url($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# a name containing '..' stays in the query
						# string, as '..' separates the two halves
						# of the path_info form
						$href .= ":/".esc_url($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_url($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_url($params{'hash_base'});
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_url($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_url($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly; @cgi_param_mapping is walked
	# as (name, symbol) pairs, which fixes the order of the query string
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	return $href;
}
1246
1247
1248## ======================================================================
1249## validation, quoting/unquoting and escaping
1250
# Return the action name if it is a key of %actions, undef otherwise
# (also for a false argument).
sub validate_action {
	my ($input) = @_;
	return undef unless $input;
	return exists $actions{$input} ? $input : undef;
}
1256
# Return the project name if it is acceptable, undef otherwise.  The checks
# are made in this order: well-formed pathname, existing directory below
# $projectroot, check_export_ok(), and - only with $strict_export -
# membership in the projects list.
sub validate_project {
	my ($input) = @_;
	return undef unless $input;

	my $dir = "$projectroot/$input";
	return undef unless validate_pathname($input);
	return undef unless -d $dir;
	return undef unless check_export_ok($dir);
	return undef if ($strict_export && !project_in_list($input));

	return $input;
}
1268
# Return the pathname if it is acceptable, undef otherwise (also for a
# false argument).
sub validate_pathname {
	my ($input) = @_;
	return undef unless $input;

	# no '.' or '..' as elements of path, i.e. no '.' nor '..'
	# at the beginning, at the end, and between slashes.
	# also this catches doubled slashes
	my $has_bad_element = ($input =~ m!(^|/)(|\.|\.\.)(/|$)!);
	# no null characters
	my $has_nul = ($input =~ m!\0!);

	return undef if ($has_bad_element || $has_nul);
	return $input;
}
1284
# Return the ref name if it is acceptable, undef otherwise (also for a
# false argument).
sub validate_refname {
	my ($input) = @_;
	return undef unless $input;

	# textual hashes are O.K.
	return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

	# it must be correct pathname
	my $refname = validate_pathname($input);
	return undef unless $refname;

	# restrictions on ref name according to git-check-ref-format
	return undef
		if $refname =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

	return $refname;
}
1301
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Input for which utf8::valid() is false is decoded from
# $fallback_encoding instead; undef is passed through.
sub to_utf8 {
	my ($str) = @_;
	return undef unless defined $str;

	return decode($fallback_encoding, $str, Encode::FB_DEFAULT)
		unless utf8::valid($str);

	utf8::decode($str);
	return $str;
}
1315
# quote unsafe chars, but keep the slash, even when it's not
# correct, but quoted slashes look too horrible in bookmarks
#
# Spaces become '+'; undef is passed through.
sub esc_param {
	my ($str) = @_;
	return undef unless defined $str;

	$str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$str =~ tr/ /+/;
	return $str;
}
1325
# quote unsafe chars in whole URL, so some characters cannot be quoted
#
# Spaces become '+'; undef is passed through.
sub esc_url {
	my ($str) = @_;
	return undef unless defined $str;

	$str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$str =~ tr/ /+/;
	return $str;
}
1334
# quote unsafe characters in HTML attributes
#
# Delegates to esc_html() with unchanged arguments: for XHTML
# conformance escaping '"' to '&quot;' is not enough.
sub esc_attr {
	return esc_html(@_);
}
1341
# replace invalid utf8 character with SUBSTITUTION sequence
#
# Escapes a string for HTML output.  With the -nbsp option spaces are
# turned into &nbsp;.  Control characters other than tab are replaced by
# what quot_cec() returns.  undef is passed through.
sub esc_html {
	my ($str, %opts) = @_;
	return undef unless defined $str;

	my $text = to_utf8($str);
	$text = $cgi->escapeHTML($text);
	$text =~ s/ /&nbsp;/g
		if $opts{'-nbsp'};
	$text =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
	return $text;
}
1357
# quote control characters and escape filename to HTML
#
# With the -nbsp option spaces are turned into &nbsp;.  Every control
# character, tab included, is replaced by what quot_cec() returns.
# undef is passed through.
sub esc_path {
	my ($str, %opts) = @_;
	return undef unless defined $str;

	my $text = to_utf8($str);
	$text = $cgi->escapeHTML($text);
	$text =~ s/ /&nbsp;/g
		if $opts{'-nbsp'};
	$text =~ s|([[:cntrl:]])|quot_cec($1)|eg;
	return $text;
}
1373
# Make control characters "printable", using character escape codes (CEC)
#
# Takes a single character followed by options.  Characters with a
# well-known escape are shown as that escape (e.g. '\n'); all others as a
# backslash followed by their code in two hexadecimal digits.  Unless the
# -nohtml option is set, the result is wrapped in <span class="cntrl">.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# %02x, not %2x: codes below 0x10 must be padded with a zero,
	# not with a space
	my $chr = ( (exists $es{$cntrl})
		    ? $es{$cntrl}
		    : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1398
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR)
#
# Returns a decimal character reference for codepoint 0x2400 plus the
# character's code, wrapped in <span class="cntrl"> unless the -nohtml
# option is set.
sub quot_upr {
	my ($cntrl, %opts) = @_;

	my $chr = sprintf('&#%04d;', 0x2400+ord($cntrl));
	return $opts{-nohtml}
		? $chr
		: "<span class=\"cntrl\">$chr</span>";
}
1412
# Translate what followed a backslash in a quoted filename: up to three
# octal digits give the character with that code, a known escape letter
# gives its control character, anything else stands for itself.
sub unq {
	my ($seq) = @_;
	my %es = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# octal char sequence
	return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

	# C escape sequence, aka character escape code;
	# otherwise a quoted ordinary character
	return exists $es{$seq} ? $es{$seq} : $seq;
}

# git may return quoted and escaped filenames
#
# A string enclosed in double quotes loses the quotes and has its
# backslash escapes expanded; any other string is returned unchanged.
sub unquote {
	my ($str) = @_;

	# nothing to do unless the whole string is quoted
	return $str unless $str =~ m/^"(.*)"$/;

	(my $name = $1) =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $name;
}
1448
# escape tabs (convert tabs to spaces)
#
# Each tab is replaced by as many spaces as are needed to reach the next
# multiple of 8 columns.
sub untabify {
	my ($line) = @_;

	for (my $pos = index($line, "\t");
	     $pos != -1;
	     $pos = index($line, "\t")) {
		# between 1 and 8 spaces, never zero
		my $width = 8 - ($pos % 8);
		substr($line, $pos, 1, ' ' x $width);
	}

	return $line;
}
1462
# Count the entries returned by git_get_projects_list() whose 'path' equals
# the given project; the result is 0 for an empty list.
sub project_in_list {
	my ($project) = @_;

	my @projects = git_get_projects_list();
	return 0 unless @projects;

	my $matches = grep { $_->{'path'} eq $project } @projects;
	return $matches;
}
1468
1469## ----------------------------------------------------------------------
1470## HTML aware string manipulation
1471
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Arguments: string, $len, $add_len (default 10) and the side that is
# kept, 'left' | 'center' | 'right' (default 'right').
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right';

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# allow only $len chars, but don't cut a word if it would fit in $add_len
	# if it doesn't fit, cut it if it's still longer than the dots we would add
	# remove chopped character entities entirely

	# return early if chopping wouldn't make string shorter;
	# the filler is 5 characters long in the middle, 4 at either end
	my $in_center  = ($where eq 'center');
	my $filler_len = $in_center ? 5 : 4;
	return $str if ($len + $filler_len >= length($str));

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if $in_center;

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	if ($where eq 'left') {
		# keep the end of the string
		$str =~ m/^(.*?)($begre)$/;
		my ($lead, $body) = ($1, $2);
		$lead = " ..." if (length($lead) > 4);
		return $lead . $body;
	}

	if ($in_center) {
		# keep both ends of the string
		$str =~ m/^($endre)(.*)$/;
		my ($left, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($mid, $right) = ($1, $2);
		$mid = " ... " if (length($mid) > 5);
		return $left . $mid . $right;
	}

	# keep the beginning of the string
	$str =~ m/^($endre)(.*)$/;
	my ($body, $tail) = ($1, $2);
	$tail = "... " if (length($tail) > 4);
	return $body . $tail;
}
1531
# Takes the same arguments as chop_str.  The (possibly chopped) string is
# HTML-escaped; if it did get chopped, it is additionally wrapped in a <span>
# whose title attribute carries the full text, with control characters
# replaced by '?'.
sub chop_and_escape_str {
        my ($str) = @_;

        my $chopped = chop_str(@_);
        # chop_str() returns a to_utf8()-converted string; convert the
        # original the same way, otherwise a non-ASCII string that was not
        # chopped at all can compare as different, and the title attribute
        # would be built from the unconverted string.
        $str = to_utf8($str);
        if ($chopped eq $str) {
                return esc_html($chopped);
        } else {
                $str =~ s/[[:cntrl:]]/?/g;
                return $cgi->span({-title=>$str}, esc_html($chopped));
        }
}
1546
1547## ----------------------------------------------------------------------
1548## functions returning short strings
1549
# Map an age (in seconds) to a CSS class name:
#   undefined age     -> "noage"
#   less than 2 hours -> "age0"
#   less than 2 days  -> "age1"
#   anything older    -> "age2"
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1564
# Turn an age in seconds into a human readable "nn units ago" string.
# The largest unit of which the age spans more than two is used (years,
# months, weeks, days, hours, min, sec); an age of two seconds or less
# gives " right now" (with its leading space).
sub age_string {
        my ($age) = @_;

        return int($age/60/60/24/365) . " years ago"
                if $age > 60*60*24*365*2;
        return int($age/60/60/24/(365/12)) . " months ago"
                if $age > 60*60*24*(365/12)*2;
        return int($age/60/60/24/7) . " weeks ago"
                if $age > 60*60*24*7*2;
        return int($age/60/60/24) . " days ago"
                if $age > 60*60*24*2;
        return int($age/60/60) . " hours ago"
                if $age > 60*60*2;
        return int($age/60) . " min ago"
                if $age > 60*2;
        return int($age) . " sec ago"
                if $age > 2;

        return " right now";
}
1596
# Extra file-type bit masks (octal), in the style of the S_IF* masks that
# Fcntl ':mode' provides.
use constant {
        S_IFINVALID => 0030000, # not referenced in this part of the file
        S_IFGITLINK => 0160000, # file type tested by S_ISGITLINK()
};
1601
# Predicate for submodule/subproject entries (a commit object reference):
# true when the file-type bits of $mode equal S_IFGITLINK.
sub S_ISGITLINK {
        my ($mode) = @_;
        my $type_bits = $mode & S_IFMT;

        return $type_bits == S_IFGITLINK;
}
1608
# Convert a file mode given as an octal string into a symbolic, ls-like
# mode string.  Types other than submodule, directory, symlink and regular
# file yield '----------'.
sub mode_str {
        my ($octal) = @_;
        my $mode = oct $octal;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # regular file: git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1630
# Convert a file mode given as an octal string into a short file type name:
# "submodule", "directory", "symlink", "file" or "unknown".
# An argument that is not made of octal digits only is returned unchanged.
sub file_type {
        my ($mode) = @_;

        return $mode unless $mode =~ m/^[0-7]+$/;
        my $bits = oct $mode;

        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "file"      if S_ISREG($bits);
        return "unknown";
}
1653
# Convert a file mode given as an octal string into a file type description.
# Same names as file_type, except that a regular file with the user-execute
# bit set is described as "executable".
# An argument that is not made of octal digits only is returned unchanged.
sub file_type_long {
        my ($mode) = @_;

        return $mode unless $mode =~ m/^[0-7]+$/;
        my $bits = oct $mode;

        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "unknown"   unless S_ISREG($bits);

        return ($bits & S_IXUSR) ? "executable" : "file";
}
1680
1681
1682## ----------------------------------------------------------------------
1683## functions returning short HTML fragments, or transforming HTML fragments
1684## which don't belong to other sections
1685
# Format one line of a commit message: the line is HTML-escaped (spaces
# turned into non-breaking ones) and every stand-alone run of 8 to 40 hex
# digits is turned into a link to the "object" action for that id.
sub format_log_line_html {
        my ($text) = @_;

        my $link_to_object = sub {
                my ($sha) = @_;
                return $cgi->a({-href => href(action=>"object", hash=>$sha),
                                -class => "text"}, $sha);
        };

        my $html = esc_html($text, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{$link_to_object->($1)}eg;

        return $html;
}
1698
# format marker of refs pointing to given object
#
# $refs is a hash reference mapping an object id to an array reference of
# ref names (e.g. "tags/v2.6.11^{}" or "heads/next"); $id is the object to
# look up.  Returns ' <span class="refs">...</span>' holding one linked
# marker per ref, or "" if no ref points to $id.  $refs is left unmodified.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $ref_entry (@{$refs->{$id}}) {
                        # Work on a copy: the loop variable aliases the element
                        # stored in $refs, so stripping the "^{}" suffix in
                        # place would alter the caller's data and make a later
                        # call for the same id miss the "indirect" marker.
                        my $ref = $ref_entry;

                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name);
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        # link target is the full ref name
                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, $name);

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1758
# Format a title line as a link to $href (class "list subject"), followed
# by $extra (e.g. ref markers; defaults to '').  When $short is shorter than
# $long, the short text is shown and the long one, with control characters
# replaced by '?', goes into the link's title attribute; otherwise the long
# text is shown as is.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my @attrs = (-href => $href, -class => "list subject");
        my $shown = $long;

        if (length($short) < length($long)) {
                $shown = $short;
                $long =~ s/[[:cntrl:]]/?/g;
                push @attrs, -title => to_utf8($long);
        }

        return $cgi->a({@attrs}, esc_html($shown)) . $extra;
}
1774
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is keyed by the lowercased email and is shared by all avatar
# engines, which are free to use it as preferred: picon_url stores the
# complete URL, gravatar_url only the part before the size. Since only one
# avatar engine is used for any given page, there's no risk for cache
# conflicts.
our %avatar_cache = ();
1782
# Return the picon URL for the given email, built on the picon search
# service at http://www.cs.indiana.edu/picons/search.html
# The email is lowercased and split at '@'; the resulting URL is kept in
# %avatar_cache so it is only computed once per address.
sub picon_url {
        my ($address) = @_;
        my $email = lc $address;

        return $avatar_cache{$email} if $avatar_cache{$email};

        my ($user, $domain) = split('@', $email);
        my $url = join('',
                "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/",
                "$domain/$user/",
                "users+domains+unknown/up/single");

        $avatar_cache{$email} = $url;
        return $url;
}
1796
# Return the gravatar URL for the given email at the given size.
# Only the size-independent part of the URL (which involves the MD5 digest
# of the lowercased email) is kept in %avatar_cache, so a cached entry can
# be reused for any size.
sub gravatar_url {
        my ($email, $size) = @_;
        $email = lc $email;

        unless ($avatar_cache{$email}) {
                my $digest = Digest::MD5::md5_hex($email);
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" . $digest . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1809
# Return the <img> markup of the avatar for $email, or "" when the
# configured avatar provider ($git_avatar) yields no URL.
# Options:
#   -size       => key into %avatar_size (falls back to 'default')
#   -pad_before => true to put "&nbsp;" in front of the image
#   -pad_after  => true to put "&nbsp;" behind the image
sub git_get_avatar {
        my ($email, %opts) = @_;

        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

        # Other providers can be added by extending this table. If no
        # provider puts something in $url, we assume avatars are completely
        # disabled/unavailable.
        my %url_from = (
                'gravatar' => sub { gravatar_url($email, $size) },
                'picon'    => sub { picon_url($email) },
        );
        my $url = exists $url_from{$git_avatar} ? $url_from{$git_avatar}->() : "";
        return "" unless $url;

        my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
        my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";
        my $img = qq{<img width="$size" class="avatar" src="} .
                  esc_url($url) .
                  qq{" alt="" />};

        return $pre_white . $img . $post_white;
}
1838
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype ('author' or 'committer') selects the search and the wording
# of the link title.  When the 'search' feature is not enabled, $displaytext
# is returned unchanged.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        return $displaytext unless gitweb_check_feature('search');

        my %verb_for = ('author' => "authored", 'committer' => "committed");
        my $performed = exists $verb_for{$searchtype} ? $verb_for{$searchtype} : "";

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                                      searchtext=>$author,
                                      searchtype=>$searchtype),
                        class=>"list",
                        title=>"Search for commits $performed by $author"},
                       $displaytext);
}
1861
# Format the author of commit $co inside an HTML element named $tag with
# class "author".  The author name is chopped and escaped according to the
# remaining optional arguments (see chop_str), preceded by the author's
# avatar, and the whole is passed through format_search_author.
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name   = $co->{'author_name'};
        my $author = chop_and_escape_str($name, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);

        return "<$tag class=\"author\">" .
               format_search_author($name, "author", $avatar . $author) .
               "</$tag>";
}
1875
# Format a git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names at the end of $line are dropped and replaced by the
# escaped names from $from / $to, linked where an href is available.
# A true $diffinfo->{'nparents'} marks a combined diff, which shows only
# the "to" name; an ordinary diff shows "a/<from> b/<to>".
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                  esc_path($to->{'file'}))
                        : esc_path($to->{'file'}); # file was deleted (no href)
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $from->{'href'}
                        ? $cgi->a({-href => $from->{'href'}, -class => "path"},
                                  'a/' . esc_path($from->{'file'}))
                        : 'a/' . esc_path($from->{'file'}); # file was added (no href)
                $line .= ' ';
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                  'b/' . esc_path($to->{'file'}))
                        : 'b/' . esc_path($to->{'file'}); # file was deleted
        }

        return "<div class=\"diff header\">$line</div>\n";
}
1911
# Format one extended diff header line (the lines before the patch itself):
# - "copy|rename from|to <path>": the path is replaced by the linked,
#   escaped name from $from / $to (when that side has an href)
# - a line ending in a 6-digit mode gets the file type description appended
# - "index <hash>,<hash>..<hash>" (combined diff) and
#   "index <hash>..<hash>" (ordinary diff): hashes are shortened to 7
#   characters and linked, or shown as 0000000 where no href exists
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;
        my $null_id = '0' x 7;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                 esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }

        # match single <mode>
        if (my ($mode) = $line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($mode) .
                         ')</span>';
        }

        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                my @parent_ids;
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $id_html = $from->{'href'}[$i]
                                ? $cgi->a({-href=>$from->{'href'}[$i],
                                           -class=>"hash"},
                                          substr($diffinfo->{'from_id'}[$i],0,7))
                                : $null_id;
                        push @parent_ids, $id_html;
                }
                my $to_html = $to->{'href'}
                        ? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                  substr($diffinfo->{'to_id'},0,7))
                        : $null_id;

                $line = 'index ' . join(',', @parent_ids) . '..' . $to_html;

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}..[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff
                my $from_link = $from->{'href'}
                        ? $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                  substr($diffinfo->{'from_id'},0,7))
                        : $null_id;
                my $to_link = $to->{'href'}
                        ? $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                  substr($diffinfo->{'to_id'},0,7))
                        : $null_id;

                my ($from_id, $to_id) = @{$diffinfo}{'from_id', 'to_id'};
                $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
1977
# Format the from-file/to-file diff header ("--- ..." and "+++ ..." lines).
# For an ordinary diff, $from_line becomes one "diff from_file" row; for a
# combined diff (true $diffinfo->{'nparents'}) there is one such row per
# parent, each with a numbered link to the blobdiff against that parent
# (@parents supplies the parents' commit ids).  $to_line becomes the single
# "diff to_file" row.  Lines not naming an a/ or b/ path (e.g. /dev/null)
# are passed through unchanged.  Returns the rows as one HTML string.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my @rows;

        #assert($from_line =~ m/^---/) if DEBUG;
        if ($diffinfo->{'nparents'}) {
                # combined diff (merge commit)
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $row = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                my $parent_no = $i + 1;
                                my $diff_link =
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . $parent_no},
                                                $parent_no);
                                my $file_link =
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                                $row = '--- ' . $diff_link . '/' . $file_link;
                        }
                        push @rows, qq!<div class="diff from_file">$row</div>\n!;
                }
        } else {
                # ordinary (single parent) diff
                my $row = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($row =~ m!^--- "?a/!) {
                        $row = '--- a/' .
                               ($from->{'href'}
                                ? $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                          esc_path($from->{'file'}))
                                : esc_path($from->{'file'}));
                }
                push @rows, qq!<div class="diff from_file">$row</div>\n!;
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        my $to_row = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($to_row =~ m!^\+\+\+ "?b/!) {
                $to_row = '+++ b/' .
                          ($to->{'href'}
                           ? $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                     esc_path($to->{'file'}))
                           : esc_path($to->{'file'}));
        }
        push @rows, qq!<div class="diff to_file">$to_row</div>\n!;

        return join('', @rows);
}
2043
# Create the note shown for a patch that the combined diff simplified away:
# a "diff --cc <file>" header (the file name links to its blob unless the
# file is deleted) followed by a "Simple merge" notice.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $file_html = is_deleted($diffinfo)
                ? esc_path($diffinfo->{'to_file'})
                : $cgi->a({-href => href(action=>"blob",
                                         hash_base=>$hash,
                                         hash=>$diffinfo->{'to_id'},
                                         file_name=>$diffinfo->{'to_file'}),
                           -class => "path"},
                          esc_path($diffinfo->{'to_file'}));

        return "<div class=\"diff header\">" .
               "diff --cc " .
               $file_html .
               "</div>\n" . # class="diff header"
               "<div class=\"diff nodifferences\">" .
               "Simple merge" .
               "</div>\n"; # class="diff nodifferences"
}
2068
# format patch (diff) line (not to be used for diff headers)
#
# $line is one line of patch body; $from and $to are optional hash
# references whose 'href' entries are used to link chunk headers to the
# corresponding source lines.  Returns the line wrapped in
# <div class="diff ...">, where the extra class (add, rem, chunk_header,
# incomplete, or none) reflects the kind of line.
sub format_diff_line {
        my $line = shift;
        my ($from, $to) = @_;
        my $diff_class = "";

        chomp $line;

        # an array reference in $from->{'href'} marks a combined diff
        if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
                # combined diff
                # the line prefix has as many characters as $from has hrefs
                my $prefix = substr($line, 0, scalar @{$from->{'href'}});
                if ($line =~ m/^\@{3}/) {
                        $diff_class = " chunk_header";
                } elsif ($line =~ m/^\\/) {
                        $diff_class = " incomplete";
                } elsif ($prefix =~ tr/+/+/) {
                        # tr counts the '+' in the prefix: at least one means addition
                        $diff_class = " add";
                } elsif ($prefix =~ tr/-/-/) {
                        $diff_class = " rem";
                }
        } else {
                # assume ordinary diff
                my $char = substr($line, 0, 1);
                if ($char eq '+') {
                        $diff_class = " add";
                } elsif ($char eq '-') {
                        $diff_class = " rem";
                } elsif ($char eq '@') {
                        $diff_class = " chunk_header";
                } elsif ($char eq "\\") {
                        $diff_class = " incomplete";
                }
        }
        $line = untabify($line);
        if ($from && $to && $line =~ m/^\@{2} /) {
                # ordinary chunk header: "@@ -<start>[,<lines>] +<start>[,<lines>] @@<section>"
                my ($from_text, $from_start, $from_lines, $to_text, $to_start, $to_lines, $section) =
                        $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

                $from_lines = 0 unless defined $from_lines;
                $to_lines   = 0 unless defined $to_lines;

                # link each range to its starting line ("#l<n>" anchor) in the file view
                if ($from->{'href'}) {
                        $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
                                             -class=>"list"}, $from_text);
                }
                if ($to->{'href'}) {
                        $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                             -class=>"list"}, $to_text);
                }
                $line = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
                        "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
                return "<div class=\"diff$diff_class\">$line</div>\n";
        } elsif ($from && $to && $line =~ m/^\@{3}/) {
                # combined chunk header: "@@@ <range> <range> ... @@@<section>"
                my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;
                my (@from_text, @from_start, @from_nlines, $to_text, $to_start, $to_nlines);

                @from_text = split(' ', $ranges);
                for (my $i = 0; $i < @from_text; ++$i) {
                        # drop the leading sign, split "<start>,<lines>"; the
                        # trailing 0 is the line count when none is given
                        ($from_start[$i], $from_nlines[$i]) =
                                (split(',', substr($from_text[$i], 1)), 0);
                }

                # the last range belongs to the "to" side
                $to_text   = pop @from_text;
                $to_start  = pop @from_start;
                $to_nlines = pop @from_nlines;

                $line = "<span class=\"chunk_info\">$prefix ";
                for (my $i = 0; $i < @from_text; ++$i) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>"$from->{'href'}[$i]#l$from_start[$i]",
                                                  -class=>"list"}, $from_text[$i]);
                        } else {
                                $line .= $from_text[$i];
                        }
                        $line .= " ";
                }
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                          -class=>"list"}, $to_text);
                } else {
                        $line .= $to_text;
                }
                $line .= " $prefix</span>" .
                         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
                return "<div class=\"diff$diff_class\">$line</div>\n";
        }
        # any other line: escape it as a whole
        return "<div class=\"diff$diff_class\">" . esc_html($line, -nbsp=>1) . "</div>\n";
}
2157
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# The formats offered are those listed in @snapshot_fmts.
sub format_snapshot_links {
        my ($hash) = @_;
        my $num_fmts = @snapshot_fmts;

        # no snapshot format available
        return undef if $num_fmts == 0;

        if ($num_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                # i.e. "_snapshot_"
                my ($fmt) = @snapshot_fmts;
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links;
        foreach my $fmt (@snapshot_fmts) {
                push @links, $cgi->a({
                        -href => href(
                                action=>"snapshot",
                                hash=>$hash,
                                snapshot_format=>$fmt
                        )
                }, $known_snapshot_formats{$fmt}{'display'});
        }
        return "snapshot (" . join(' ', @links) . ")";
}
2192
2193## ......................................................................
2194## functions returning values to be passed, perhaps after some
2195## transformation, to other functions; e.g. returning arguments to href()
2196
# Returns a hash to be passed to href() to generate the gitweb feed URL;
# its -title key holds the description of the link.
# The optional argument is the feed format name (default 'Atom'); its
# lowercased form becomes the action.  Returns nothing when no project is
# selected, or for the tags, heads, forks, tag and search actions.
sub get_feed_info {
        my $format = shift || 'Atom';
        my %res = (action => lc($format));

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branches refs uses 'refs/heads/' prefix (fullname) to differentiate
        # from tag links; this also makes possible to detect branch links
        my $branch;
        foreach my $candidate ($hash_base, $hash) {
                next unless defined $candidate;
                if ($candidate =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type  = "history of $file_name";
                $type .= "/" if ($action eq 'tree');
                $type .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $type = "log of $branch";
        } else {
                $type = 'log';
        }

        $res{-title} = $type;
        $res{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
        $res{'file_name'} = $file_name;

        return %res;
}
2232
2233## ----------------------------------------------------------------------
2234## git utility subroutines, invoking git commands
2235
# Returns, as a list, the path to the core git executable and the
# --git-dir parameter for the current $git_dir.  Every call is counted
# in $number_of_git_cmds.
sub git_cmd {
        $number_of_git_cmds += 1;
        return ($GIT, "--git-dir=$git_dir");
}
2241
# Quote the given arguments for passing them to the shell: each argument
# is wrapped in single quotes, with every ' and ! inside it escaped, and
# the results are joined with spaces.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;

        foreach my $arg (@_) {
                # work on a copy so the caller's argument stays untouched
                (my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }

        return join(' ', @quoted);
}
2250
# Get the full hash that HEAD of the given project resolves to
# (see git_get_hash for the return value).
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2255
# Resolve a revision to its hash: passes all arguments
# (project, revision, extra options) straight on to git_get_hash.
sub git_get_full_hash {
        my @rev_parse_args = @_;
        return git_get_hash(@rev_parse_args);
}
2259
# Like git_get_full_hash, but appends '--short=7' to the arguments passed
# on to git_get_hash.
sub git_get_short_hash {
        my @rev_parse_args = (@_, '--short=7');
        return git_get_hash(@rev_parse_args);
}
2263
# Run "git rev-parse --verify -q <options> <hash>" in the repository
# $projectroot/$project and return the first line of its output (chomped),
# or undef when the command could not be started or printed nothing.
# $git_dir is pointed at the project for the duration of the call and is
# put back afterwards if it was defined before.
sub git_get_hash {
        my ($project, $hash, @options) = @_;
        my $saved_git_dir = $git_dir;
        my $result;

        $git_dir = "$projectroot/$project";
        my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @cmd) {
                $result = <$fd>;
                chomp $result if defined $result;
                close $fd;
        }
        $git_dir = $saved_git_dir if defined $saved_git_dir;

        return $result;
}
2280
# Ask "git cat-file -t" for the type of the given object.
# Returns the first output line without its newline; returns nothing when
# the pipe cannot be opened or closing it reports failure.
sub git_get_type {
	my ($hash) = @_;

	my @cmd = (git_cmd(), "cat-file", '-t', $hash);
	open(my $pipe, "-|", @cmd)
		or return;
	my $type = <$pipe>;
	close($pipe)
		or return;
	chomp $type;
	return $type;
}
2291
# repository configuration cache, filled by git_get_project_config():
#   %config      - parsed configuration of the repository read last
#   $config_file - path of the config file %config was read for
#                  ('' until the first read)
our %config;
our $config_file = '';
2295
# Store $value under $key in the hash referenced by $hash, keeping
# repeated keys:
#   - first value for a key is stored directly (not wrapped in an array)
#   - second value turns the entry into [ <first>, <second> ]
#   - further values are appended to that array
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key}) {
		if (ref $hash->{$key}) {
			push @{$hash->{$key}}, $value;
		} else {
			$hash->{$key} = [ $hash->{$key}, $value ];
		}
	} else {
		$hash->{$key} = $value;
	}
}
2309
# Return the configuration of the current repository as a hash, read from
# NUL-separated "git config -z -l" output.
#
# $section_regexp (optional) limits the result to keys of matching
# sections, e.g. 'gitweb' keeps only "gitweb.*" keys.
# Keys that occur several times are collected by hash_set_multi().
# Returns nothing when the git command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compiled once per call.  The previous /o flag compiled the pattern
	# once per process, so under a persistent interpreter (mod_perl) the
	# first section ever requested would have been used for all later calls.
	my $section_re = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	# "git config -z" terminates each key/value record with NUL
	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# key and value are separated by the first newline; a key without
		# a value has no newline, leaving $value undefined
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $section_re || $key =~ $section_re);
	}
	close $fh;

	return %config;
}
2332
# Interpret a config value as a boolean.
# True:  no value at all, a non-zero number, 'true' or 'yes' (any case).
# False: everything else; a strange value is never treated as an error.
sub config_to_bool {
	my ($val) = @_;

	# "section.key" given without "= value"
	if (!defined $val) {
		return 1;
	}

	# trim surrounding whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	my $nonzero_number = ($val =~ /^\d+$/ && $val);    # section.key = 1
	return ($nonzero_number ||
	        ($val =~ /^(?:true|yes)$/i));              # section.key = true
}
2348
# Convert a config value to a plain decimal number.
# An optional suffix 'k', 'm' or 'g' (any case) multiplies the number by
# 1024, 1048576 or 1073741824.  Values that do not look like
# <digits><suffix> are returned unchanged (after whitespace trimming).
# An undefined value (key present without a value) is returned as undef.
sub config_to_int {
	my $val = shift;

	# nothing to convert; bail out before the substitutions below would
	# emit "uninitialized value" warnings
	return $val unless defined $val;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
		my %multiplier = (
			'k' =>       1024,
			'm' =>    1048576,
			'g' => 1073741824,
		);
		# a bare suffix such as "k" has an empty number part; count it as 0
		# explicitly instead of multiplying an empty string
		$num = 0 unless length $num;
		return $num * $multiplier{lc $unit};
	}
	return $val;
}
2368
# Normalise a config value to an array reference:
#   a reference is returned as is, a defined scalar becomes [ $val ],
#   undef becomes an empty array.
sub config_to_multi {
	my ($val) = @_;

	return $val     if ref($val);
	return [ $val ] if defined($val);
	return [];
}
2375
# Return the value of the "gitweb.<key>" config variable of the current
# repository ($git_dir).
#
#   $key  - variable name, with or without the "gitweb." prefix; keys
#           containing non-word characters are rejected
#   $type - optional 'bool' or 'int' (a leading "--" is accepted); any
#           other type is ignored
#
# Returns nothing if $git_dir is unset, the key is empty/invalid or the
# variable does not exist.  With type 'bool' the result is the string
# 'true' or 'false'; with 'int' it is converted by config_to_int();
# otherwise the stored value is returned as is.
#
# The parsed "gitweb" section is cached in %config and re-read whenever
# $config_file does not name the config file of the current $git_dir.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);
	my $full_key = "gitweb.$key";

	# type sanity check: only 'bool' and 'int' are honoured
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# refresh the cache when it belongs to another repository
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	return unless exists $config{$full_key};

	# ensure given type
	if (defined $type) {
		if ($type eq 'bool') {
			# backward compatibility: 'git config --bool' returns true/false
			return config_to_bool($config{$full_key}) ? 'true' : 'false';
		}
		if ($type eq 'int') {
			return config_to_int($config{$full_key});
		}
	}
	return $config{$full_key};
}
2414
# Get the object name (hash) of $path at the given ref / tree-ish $base,
# using the first line of "git ls-tree <base> -- <path>".
#
#   $type - optional; when given, the entry must be of this type
#           (as printed by ls-tree, e.g. 'blob' or 'tree')
#
# Returns undef when no path is given, git reports failure, the path does
# not exist at $base, the output line has an unexpected format, or the
# type does not match.  Dies via die_error() if git cannot be started.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift || return undef;
	my $type = shift;

	# ls-tree on "dir/" would list the directory contents, not its entry
	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# Take the fields from the match result itself: reading $2/$3 after
	# an unchecked match would pick up values left by an earlier match
	# whenever this line does not have the expected format.
	my ($entry_type, $entry_hash) =
		($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/)
		or return undef;

	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2441
# Get the path of the entry with the given hash at the given tree-ish
# (ref), searching the recursive "git ls-tree -r -t -z" listing.
# Used to get the 'from' filename for combined diff (merge commit) for
# renames.
#
# Returns the path of the first matching entry, or undef/nothing when an
# argument is missing, git cannot be started or no entry matches.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# -z output: entries are NUL-terminated and paths are not quoted
	local $/ = "\0";

	# '<mode> <type> <hash>\t<path>'
	# $hash is matched literally (\Q..\E) and the pattern is anchored to
	# the start of the record; /s lets the path contain newlines, which
	# are legal in -z output.
	my $entry_re = qr/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s;

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
		if ($line =~ $entry_re) {
			my $path = $1;
			close $fd;
			return $path;
		}
	}
	close $fd;
	return undef;
}
2465
2466## ......................................................................
2467## git utility functions, directly accessing git repository
2468
# Return the description of the project at $path (relative to
# $projectroot): the first line of its "description" file without the
# trailing newline, or, when that file cannot be opened, the value of the
# 'description' gitweb config variable.
# Side effect: sets the global $git_dir to the project's directory.
sub git_get_project_description {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";
	my $descr_file = "$git_dir/description";
	open(my $fh, '<', $descr_file)
		or return git_get_project_config('description');
	my $descr = <$fh>;
	close $fh;

	chomp $descr if defined $descr;
	return $descr;
}
2482
# Read the content tags of the project at $path (relative to $projectroot).
# Every regular file in "<git_dir>/ctags" is one tag: the file name is the
# tag, the first line of the file its value (used as a weight by the tag
# cloud code).
#
# Returns a hash reference { tag => value }; it is empty when the ctags
# directory cannot be opened.  Unreadable tag files are skipped.
# Side effect: sets the global $git_dir to the project's directory.
sub git_get_project_ctags {
	my $path = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$path";
	opendir my $dh, "$git_dir/ctags"
		or return $ctags;
	foreach my $tagfile (grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh)) {
		open my $ct, '<', $tagfile or next;
		my $val = <$ct>;
		close $ct;

		if (defined $val) {
			chomp $val;
		} else {
			# Empty tag file: readline gave undef.  Store 0, which is
			# what the undef evaluated to in the numeric tag-cloud
			# arithmetic, but without "uninitialized value" warnings.
			$val = 0;
		}

		(my $ctag = $tagfile) =~ s#.*/##;
		$ctags->{$ctag} = $val;
	}
	closedir $dh;
	return $ctags;
}
2501
# Build the data for a tag cloud from a { tag => weight } hash reference.
#
# Tags differing only in case are merged under their lowercased name; the
# merged entry records the summed weight ('count'), the largest single
# weight ('topcount') and the spelling that had it ('topname').
#
# Returns an HTML::TagCloud object when that module can be loaded,
# otherwise a reference to the merged hash.
sub git_populate_project_tagcloud {
	my $ctags = shift;

	# First, merge different-cased tags; tags vote on casing
	my %ctags_lc;
	foreach my $tag (keys %$ctags) {
		my $weight = $ctags->{$tag};
		my $entry = ($ctags_lc{lc $tag} ||= {});
		$entry->{count} += $weight;
		if (!$entry->{topcount} || $entry->{topcount} < $weight) {
			$entry->{topcount} = $weight;
			$entry->{topname} = $tag;
		}
	}

	# HTML::TagCloud is optional; fall back to the raw data without it
	my $have_tagcloud = eval { require HTML::TagCloud; 1; };
	return \%ctags_lc unless $have_tagcloud;

	my $cloud = HTML::TagCloud->new;
	foreach my $tag_lc (sort keys %ctags_lc) {
		# Pad the title with spaces so that the cloud looks
		# less crammed.
		my $title = $ctags_lc{$tag_lc}->{topname};
		$title =~ s/ /&nbsp;/g;
		$title =~ s/^/&nbsp;/g;
		$title =~ s/$/&nbsp;/g;
		$cloud->add($title, $home_link."?by_tag=".$tag_lc, $ctags_lc{$tag_lc}->{count});
	}
	return $cloud;
}
2533
# Render the tag cloud produced by git_populate_project_tagcloud().
#
#   $cloud - HTML::TagCloud object, or hash reference of merged tags
#   $count - maximum number of tags to show
#
# Returns an HTML fragment: the module's own markup for an
# HTML::TagCloud object, otherwise a centered paragraph of
# comma-separated links to "$home_link?by_tag=<tag>".
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;

	# (a leftover debugging print of ref($cloud) to STDERR used to be
	# here; it wrote a line to the server error log on every call)

	if (ref $cloud eq 'HTML::TagCloud') {
		return $cloud->html_and_css($count);
	} else {
		# NOTE(review): the sort is ascending by count, so the first
		# $count entries are the least used tags -- confirm this is intended.
		my @tags = sort { $cloud->{$a}->{count} <=> $cloud->{$b}->{count} } keys %$cloud;
		return '<p align="center">' . join (', ', map {
			$cgi->a({-href=>"$home_link?by_tag=$_"}, $cloud->{$_}->{topname})
		} splice(@tags, 0, $count)) . '</p>';
	}
}
2546
# Return the clone URLs of the project at $path (relative to
# $projectroot): the lines of its "cloneurl" file, or, when that file
# cannot be opened, the values of the 'url' gitweb config variable.
# In list context a list is returned, otherwise an array reference.
# Side effect: sets the global $git_dir to the project's directory.
sub git_get_project_url_list {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/cloneurl") {
		my $from_config = config_to_multi(git_get_project_config('url'));
		return wantarray ? @$from_config : $from_config;
	}

	my @git_project_url_list = <$fd>;
	close $fd;
	chomp @git_project_url_list;

	return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2560
# Return the list of projects as hash references with a 'path' key (and
# an 'owner' key when read from a file).
#
# $projects_list may be
#   - a directory: it is searched (following symlinks, at most
#     $project_maxdepth levels deep) for directories accepted by
#     check_export_ok(); the search does not descend into accepted ones
#   - a file: one project per line, "<url-encoded path> <url-encoded owner>"
#
# $filter (optional, a trailing ".git" is dropped) restricts the result
# to projects below "$filter/", i.e. to forks of that project.  Without a
# filter, and with the 'forks' feature enabled, projects read from a file
# that are forks of a project listed earlier are left out.
sub git_get_projects_list {
	my ($filter) = @_;
	my @list;

	$filter ||= '';
	$filter =~ s/\.git$//;

	my $check_forks = gitweb_check_feature('forks');

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list . ($filter ? "/$filter" : '');
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);

		my $visit = sub {
			# global variables
			our $project_maxdepth;
			our $projectroot;
			# skip project-list toplevel, if we get it.
			return if (m!^[/.]$!);
			# only directories can be git repositories
			return unless (-d $_);
			# don't traverse too deep (Find is super slow on os x)
			my $depth = ($File::Find::name =~ tr!/!!) - $pfxdepth;
			if ($depth > $project_maxdepth) {
				$File::Find::prune = 1;
				return;
			}

			my $subdir = substr($File::Find::name, $pfxlen + 1);
			# we check related file in $projectroot
			my $path = ($filter ? "$filter/" : '') . $subdir;
			if (check_export_ok("$projectroot/$path")) {
				push @list, { path => $path };
				$File::Find::prune = 1;
			}
		};

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => $visit,
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		my %paths;
		open my $fd, '<', $projects_list or return;

		# true when $candidate is "<base>/<something>.git"
		my $is_fork_of = sub {
			my ($candidate, $base) = @_;
			return 0 if (substr($candidate, 0, length($base)) ne $base);
			return (substr($candidate, length($base)) =~ /^\/.*\.git$/);
		};

	PROJECT:
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			$path = unescape($path);
			$owner = unescape($owner);
			next PROJECT if (!defined $path);

			if ($filter ne '') {
				# looking for forks;
				next PROJECT unless $is_fork_of->($path, $filter);
			} elsif ($check_forks) {
				foreach my $known_project (keys %paths) {
					# is a fork, don't include it in
					# the list
					next PROJECT if $is_fork_of->($path, $known_project);
				}
			}

			if (check_export_ok("$projectroot/$path")) {
				my $pr = {
					path => $path,
					owner => to_utf8($owner),
				};
				push @list, $pr;
				# remember it as a possible parent of later forks
				(my $forks_path = $path) =~ s/\.git$//;
				$paths{$forks_path}++;
			}
		}
		close $fd;
	}
	return @list;
}
2663
# Cache of project owners read from the $projects_list file:
# { project path => owner }, or undef while nothing has been read yet.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from $projects_list, once per process: the
# call does nothing when the cache is already defined.  If $projects_list
# is not a plain file, or cannot be opened, the cache is left as an empty
# hash.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	if (-f $projects_list) {
		# an unreadable file means "no owners known", not a read from a
		# filehandle that was never opened
		open(my $fd, '<', $projects_list)
			or return;
		while (my $line = <$fd>) {
			chomp $line;
			my ($pr, $ow) = split ' ', $line;
			# blank line: there is no project to record an owner for
			next unless defined $pr;
			$pr = unescape($pr);
			$ow = unescape($ow);
			$gitweb_project_owner->{$pr} = to_utf8($ow);
		}
		close $fd;
	}
	return;
}
2686
# Return the owner of $project, taken from the first source that
# provides one:
#   1. the projects list file (cached in $gitweb_project_owner)
#   2. the 'owner' gitweb config variable of the repository
#   3. get_file_owner() on the repository directory
# Returns undef for an empty project name.
# Side effect: sets the global $git_dir to the project's directory.
sub git_get_project_owner {
	my ($project) = @_;

	return undef unless $project;
	$git_dir = "$projectroot/$project";

	git_get_project_list_from_file()
		unless defined $gitweb_project_owner;

	my $owner;
	$owner = $gitweb_project_owner->{$project}
		if exists $gitweb_project_owner->{$project};
	$owner = git_get_project_config('owner')
		unless defined $owner;
	$owner = get_file_owner("$git_dir")
		unless defined $owner;

	return $owner;
}
2710
# Find the age of the most recent commit on any branch (refs/heads) of
# the project at $path, from the committer line that
# "git for-each-ref --sort=-committerdate --count=1" prints.
#
# Returns ($age_in_seconds, age_string($age)) on success, (undef, undef)
# when no timestamp can be found in the output, and nothing when git
# cannot be started or reports failure.
# Side effect: sets the global $git_dir to the project's directory.
sub git_get_last_activity {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";
	my @cmd = (git_cmd(), 'for-each-ref',
	           '--format=%(committer)',
	           '--sort=-committerdate',
	           '--count=1',
	           'refs/heads');
	open(my $fd, "-|", @cmd) or return;
	my $most_recent = <$fd>;
	close $fd or return;

	# the committer line ends in "<epoch> <+-hhmm>"
	unless (defined $most_recent &&
	        $most_recent =~ / (\d+) [-+][01]\d\d\d$/) {
		return (undef, undef);
	}
	my $age = time - $1;
	return ($age, age_string($age));
}
2731
# Map object names to the refs pointing at them, from
# "git show-ref --dereference" output.
#
#   $type - optional ref namespace below "refs/" (the command is then
#           limited to "refs/$type")
#
# Returns a hash reference { <40-hex id> => [ ref names without the
# leading "refs/" ] }, or nothing when git cannot be started or reports
# failure.
sub git_get_references {
	my $type = shift || "";
	my %refs;

	# use -- <pattern> if $type
	my @pattern = $type ? ("--", "refs/$type") : ();

	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
		or return;

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
		# the list for a new id springs into existence on first push
		push @{ $refs{$1} }, $2;
	}
	close $fd or return;
	return \%refs;
}
2754
# Describe $hash relative to tags using "git name-rev --tags".
# Returns the part after "tags/" from the output line "<hash> tags/<name>",
# or undef when no hash is given, git prints nothing, or the output has
# another form.  Returns nothing when git cannot be started.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# no output at all: nothing to match (avoids matching against undef)
	return undef unless defined $name_rev;

	# \Q..\E: $hash is compared literally, never interpreted as a pattern
	if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
		return $1;
	} else {
		# catches also '$hash undefined' output
		return undef;
	}
}
2770
2771## ----------------------------------------------------------------------
2772## parse to hash functions
2773
# Break an epoch timestamp into the date/time strings used by gitweb.
#
#   $epoch - seconds since the Unix epoch
#   $tz    - timezone offset as "+hhmm" / "-hhmm" (default "-0000")
#
# Returns a hash with
#   hour, minute, mday, day, month        - UTC fields (day/month as names)
#   rfc2822, mday-time, iso-8601          - UTC formatted strings
#   hour_local, minute_local, tz_local,
#   iso-tz                                - time shifted by the $tz offset
# A $tz that does not have the "+hhmm" form is treated as zero offset.
sub parse_date {
	my $epoch = shift;
	my $tz = shift || "-0000";

	my %date;
	my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
	my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
	$date{'hour'} = $hour;
	$date{'minute'} = $min;
	$date{'mday'} = $mday;
	$date{'day'} = $days[$wday];
	$date{'month'} = $months[$mon];
	$date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
	                     $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
	$date{'mday-time'} = sprintf "%d %s %02d:%02d",
	                     $mday, $months[$mon], $hour ,$min;
	$date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
	                     1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

	# Offset in seconds.  The sign applies to hours AND minutes, and the
	# minutes must not be lost to truncation: the former expression
	# "int $1 + ($2/60)" parsed as int($1 + $2/60), so e.g. +0530 was
	# handled as +05:00 and -0330 as -02:00.
	my $offset = 0;
	if (my ($tz_sign, $tz_hour, $tz_min) =
	        ($tz =~ m/^([+\-])([0-9][0-9])([0-9][0-9])$/)) {
		$offset = ($tz_hour * 60 + $tz_min) * 60;
		$offset = -$offset if ($tz_sign eq '-');
	}
	my $local = $epoch + $offset;
	($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
	$date{'hour_local'} = $hour;
	$date{'minute_local'} = $min;
	$date{'tz_local'} = $tz;
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$year, $mon+1, $mday,
	                          $hour, $min, $sec, $tz);
	return %date;
}
2805
# Parse the tag object $tag_id as printed by "git cat-file tag".
#
# Returns a hash with 'id', the header fields found ('object', 'type',
# 'name', and for a tagger line 'author', 'author_epoch', 'author_tz',
# 'author_name', 'author_email') and 'comment' (array reference with the
# remaining lines, newlines kept).
# Returns nothing when git cannot be started or reports failure, or when
# the object has no "tag <name>" line.
sub parse_tag {
	my ($tag_id) = @_;
	my (%tag, @comment);

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
	$tag{'id'} = $tag_id;

HEADER:
	while (my $line = <$fd>) {
		chomp $line;
		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
			next HEADER;
		}
		if ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
			next HEADER;
		}
		if ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
			next HEADER;
		}
		if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				$tag{'author_name'}  = $1;
				$tag{'author_email'} = $2;
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
			next HEADER;
		}
		if ($line =~ m/--BEGIN/) {
			# this line already belongs to the comment
			push @comment, $line;
			last HEADER;
		}
		# the empty line separates header and comment
		last HEADER if ($line eq "");
	}

	# everything that is left is the comment
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag;
}
2846
# Parse one commit record as printed by "git rev-list --header".
#
#   $commit_text - the record: "<id> [<parent ids>]" line, header lines,
#                  an empty line, then the message indented by 4 spaces
#   $withparents - when defined, parents are taken from the first line
#                  only (rev-list --parents); otherwise "parent" header
#                  lines are collected as well
#
# Returns a hash with id, tree, parents (array ref), parent (first
# parent), author*/committer* fields, title, title_short, comment (array
# ref of message lines with the indent removed), age, age_string,
# age_string_date and age_string_age.
# Returns nothing when the text is empty, does not start with an object
# id, or has no tree line.
sub parse_commit_text {
	my ($commit_text, $withparents) = @_;
	my @commit_lines = split '\n', $commit_text;
	my %co;

	pop @commit_lines; # Remove '\0'

	if (! @commit_lines) {
		return;
	}

	my $header = shift @commit_lines;
	if ($header !~ m/^[0-9a-fA-F]{40}/) {
		return;
	}
	($co{'id'}, my @parents) = split ' ', $header;
	# header lines; the loop stops at the empty line before the message
	# (an empty string is false)
	while (my $line = shift @commit_lines) {
		last if $line eq "\n";
		if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
			$co{'tree'} = $1;
		} elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
			push @parents, $1;
		} elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
			$co{'author'} = to_utf8($1);
			$co{'author_epoch'} = $2;
			$co{'author_tz'} = $3;
			if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'author_name'}  = $1;
				$co{'author_email'} = $2;
			} else {
				$co{'author_name'} = $co{'author'};
			}
		} elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
			$co{'committer'} = to_utf8($1);
			$co{'committer_epoch'} = $2;
			$co{'committer_tz'} = $3;
			if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'committer_name'}  = $1;
				$co{'committer_email'} = $2;
			} else {
				$co{'committer_name'} = $co{'committer'};
			}
		}
	}
	if (!defined $co{'tree'}) {
		return;
	};
	$co{'parents'} = \@parents;
	$co{'parent'} = $parents[0];

	# The title is the first non-empty message line.  It is derived from
	# a COPY of the line: a foreach variable aliases the array element, so
	# editing it in place used to leak the shortened title (and a second
	# round of indent stripping) into $co{'comment'}.
	foreach my $line (@commit_lines) {
		(my $title = $line) =~ s/^    //;
		if ($title ne "") {
			$co{'title'} = chop_str($title, 80, 5);
			# remove leading stuff of merges to make the interesting part visible
			if (length($title) > 50) {
				$title =~ s/^Automatic //;
				$title =~ s/^merge (of|with) /Merge ... /i;
				if (length($title) > 50) {
					$title =~ s/(http|rsync):\/\///;
				}
				if (length($title) > 50) {
					$title =~ s/(master|www|rsync)\.//;
				}
				if (length($title) > 50) {
					$title =~ s/kernel.org:?//;
				}
				if (length($title) > 50) {
					$title =~ s/\/pub\/scm//;
				}
			}
			$co{'title_short'} = chop_str($title, 50, 5);
			last;
		}
	}
	if (! defined $co{'title'} || $co{'title'} eq "") {
		$co{'title'} = $co{'title_short'} = '(no commit message)';
	}
	# remove added spaces (here the in-place edit through the alias is
	# intended: every message line loses its 4-space indent exactly once)
	foreach my $line (@commit_lines) {
		$line =~ s/^    //;
	}
	$co{'comment'} = \@commit_lines;

	my $age = time - $co{'committer_epoch'};
	$co{'age'} = $age;
	$co{'age_string'} = age_string($age);
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
	# older than two weeks: the date is the primary string, the relative
	# age the secondary one; otherwise the other way round
	if ($age > 60*60*24*7*2) {
		$co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
		$co{'age_string_age'} = $co{'age_string'};
	} else {
		$co{'age_string_date'} = $co{'age_string'};
		$co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
	}
	return %co;
}
2944
# Fetch and parse a single commit.
# Runs "git rev-list --parents --header --max-count=1 <commit_id> --" and
# hands the output to parse_commit_text() with parents taken from the
# first line.  Returns the parsed commit hash (see parse_commit_text);
# dies via die_error() when git cannot be started.
sub parse_commit {
	my ($commit_id) = @_;

	# rev-list --header terminates each commit record with NUL
	local $/ = "\0";

	my @cmd = (git_cmd(), "rev-list",
	           "--parents",
	           "--header",
	           "--max-count=1",
	           $commit_id,
	           "--");
	open(my $fd, "-|", @cmd)
		or die_error(500, "Open git-rev-list failed");
	# all records are read (list context) and passed on as leading arguments
	my @records = <$fd>;
	my %co = parse_commit_text(@records, 1);
	close $fd;

	return %co;
}
2963
# Fetch and parse a series of commits with "git rev-list --header".
#
#   $commit_id - starting revision
#   $maxcount  - maximum number of commits (default 1)
#   $skip      - number of commits to skip first (default 0)
#   $filename  - optional path limiter
#   @args      - additional rev-list options
#
# The global @extra_options are passed to rev-list as well.
# Returns the parsed commits (hash references, see parse_commit_text) as
# a list in list context, otherwise as an array reference.
# Dies via die_error() when git cannot be started.
sub parse_commits {
	my ($commit_id, $maxcount, $skip, $filename, @args) = @_;
	my @cos;

	$maxcount ||= 1;
	$skip ||= 0;

	# rev-list --header terminates each commit record with NUL
	local $/ = "\0";

	my @cmd = (git_cmd(), "rev-list",
	           "--header",
	           @args,
	           "--max-count=$maxcount",
	           "--skip=$skip",
	           @extra_options,
	           $commit_id,
	           "--");
	push @cmd, $filename if $filename;

	open(my $fd, "-|", @cmd)
		or die_error(500, "Open git-rev-list failed");
	while (my $record = <$fd>) {
		push @cos, +{ parse_commit_text($record) };
	}
	close $fd;

	return wantarray ? @cos : \@cos;
}
2991
# Parse one line of git-diff-tree "raw" output.  Three forms are known:
#   - ordinary diff line  -> from_mode, to_mode, from_id, to_id, status,
#                            similarity, from_file, to_file (plus 'file'
#                            unless the entry is a rename or copy)
#   - combined diff line (merge commit)
#                         -> nparents, from_mode/from_id/status (array
#                            refs, one element per parent), to_mode,
#                            to_id, to_file
#   - bare 40-hex id      -> commit
# Any other line gives an empty result.
# Returns the hash in list context, otherwise a reference to it.
sub parse_difftree_raw_line {
	my ($line) = @_;
	my %res;

	# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M	ls-files.c'
	# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M	rev-tree.c'
	if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
		@res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} =
			($1, $2, $3, $4, $5, $6);
		my $paths = $7;
		if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
			# two tab-separated names: source and destination
			($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
		} else {
			$res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
		}
	}
	# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR	git-gui/git-gui.sh'
	# combined diff (for merge commit)
	elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
		my ($colons, $mode_list, $id_list, $status_chars, $name) = ($1, $2, $3, $4, $5);
		# one colon per parent; the last mode/id describes the result
		my @modes = split(' ', $mode_list);
		my @ids   = split(' ', $id_list);
		$res{'nparents'}  = length($colons);
		$res{'to_mode'}   = pop @modes;
		$res{'from_mode'} = \@modes;
		$res{'to_id'}     = pop @ids;
		$res{'from_id'}   = \@ids;
		$res{'status'}    = [ split('', $status_chars) ];
		$res{'to_file'}   = unquote($name);
	}
	# 'c512b523472485aef4fff9e57b229d9d243c967f'
	elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
		$res{'commit'} = $1;
	}

	return wantarray ? %res : \%res;
}
3030
# Accept either a raw git-diff-tree line or already parsed diff info.
# A hash reference (pre-parsed, or generated by hand) is returned
# unchanged; anything else is run through parse_difftree_raw_line().
sub parsed_difftree_line {
	my ($line_or_ref) = @_;

	return $line_or_ref
		if (ref($line_or_ref) eq "HASH");
	return parse_difftree_raw_line($line_or_ref);
}
3043
# Parse one line (entry) of git-ls-tree output.
#
#   $line - the entry
#   %opts - '-l' => true: the entry has a size column ("ls-tree -l")
#           '-z' => true: the name is taken verbatim ("ls-tree -z");
#                         otherwise it is passed through unquote()
#
# Returns a hash with mode, type, hash, name (and size with -l), as a
# list in list context and as a hash reference otherwise.  A line that
# does not have the expected format gives an empty hash.
sub parse_ls_tree_line {
	my $line = shift;
	my %opts = @_;
	my %res;

	# The fields are taken from the match result itself.  Reading $1..$5
	# after an unchecked match would return whatever an earlier
	# successful match left behind when this line does not match.
	my ($mode, $type, $hash, $size, $name);
	if ($opts{'-l'}) {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717	panic.c'
		($mode, $type, $hash, $size, $name) =
			($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s);
	} else {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
		($mode, $type, $hash, $name) =
			($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);
	}

	if (defined $mode) {
		$res{'mode'} = $mode;
		$res{'type'} = $type;
		$res{'hash'} = $hash;
		$res{'size'} = $size if ($opts{'-l'});
		if ($opts{'-z'}) {
			$res{'name'} = $name;
		} else {
			$res{'name'} = unquote($name);
		}
	}

	return wantarray ? %res : \%res;
}
3079
# Fill in _two_ hashes describing the "from" and "to" side of a diff entry;
# references to them are passed as the 2nd and 3rd argument.  The remaining
# arguments are the parent commits, used for combined diffs.
#
# Each hash gets a 'file' entry and, when the file exists on that side, an
# 'href' entry linking to its "blob" view.  For a combined diff the "from"
# entries are array references with one element per parent.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") {
                        # new (added) file: nothing to link to on the "from" side
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                unless (exists $diffinfo->{'from_file'}) {
                        fill_from_file_info($diffinfo, @parents);
                }
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the resulting name when the parent has none
                        if (defined $diffinfo->{'from_file'}[$i]) {
                                $from->{'file'}[$i] = $diffinfo->{'from_file'}[$i];
                        } else {
                                $from->{'file'}[$i] = $diffinfo->{'to_file'};
                        }

                        if ($diffinfo->{'status'}[$i] eq "A") {
                                # new (added) file relative to this parent
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3125
3126## ......................................................................
3127## parse to array of hashes functions
3128
# List the branches under refs/heads, most recently committed first, as
# reported by "git for-each-ref".
#
# Argument: optional limit; when set, at most limit+1 refs are requested.
#
# Returns a list (list context) or array reference (scalar context) of hash
# references with the keys 'fullname', 'name', 'id', 'title', 'epoch' and
# 'age'.  Returns nothing when the git command cannot be started.
sub git_get_heads_list {
        my $limit = shift;
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                'refs/heads'
                or return;
        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $name, $title) = split(' ', $refinfo, 3);
                # split() drops a trailing empty field, so the committer part
                # may be undefined; do not run the pattern match on it then
                my ($committer, $epoch, $tz) = defined $committerinfo
                        ? ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/)
                        : ();
                $ref_item{'fullname'}  = $name;
                $name =~ s!^refs/heads/!!;

                $ref_item{'name'}  = $name;
                $ref_item{'id'}    = $hash;
                # test for emptiness, not truth: a subject of "0" is a real title
                $ref_item{'title'} = (defined $title && $title ne '')
                        ? $title : '(no commit message)';
                $ref_item{'epoch'} = $epoch;
                if ($epoch) {
                        $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                } else {
                        $ref_item{'age'} = "unknown";
                }

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3165
# List the refs under refs/tags, newest creator date first, as reported by
# "git for-each-ref".
#
# Argument: optional limit; when set, at most limit+1 refs are requested.
#
# Returns a list (list context) or array reference (scalar context) of hash
# references with the keys 'fullname', 'name', 'id', 'type', 'reftype' and
# 'refid'; tag objects also get 'subject', and tags or commits get 'epoch'
# and 'age'.  Returns nothing when the git command cannot be started.
sub git_get_tags_list {
        my $limit = shift;
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                # When the creator field is empty the line ends in NUL and
                # split() drops the trailing empty field, leaving $creatorinfo
                # undefined; skip the match instead of matching against undef.
                my ($creator, $epoch, $tz) = defined $creatorinfo
                        ? ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/)
                        : ();
                $ref_item{'fullname'} = $name;
                $name =~ s!^refs/tags/!!;

                $ref_item{'type'} = $type;
                $ref_item{'id'} = $id;
                $ref_item{'name'} = $name;
                if ($type eq "tag") {
                        # tag object: report what it points at
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # ref points directly at the object
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        if ($epoch) {
                                $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                        } else {
                                $ref_item{'age'} = "unknown";
                        }
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3214
3215## ----------------------------------------------------------------------
3216## filesystem-related functions
3217
# Return the owner of $path as recorded in the password database: the GECOS
# field of the owning user, cut at the first ',' or ';' and converted with
# to_utf8().  Returns undef when the path cannot be stat()ed or the owning
# uid has no GECOS entry.
sub get_file_owner {
        my $path = shift;

        # Without this check a failed stat() leaves the uid undefined, and
        # getpwuid() would then look up uid 0 and report root as the owner.
        my @st = stat($path)
                or return undef;
        my $st_uid = $st[4];

        # field 6 of the passwd entry is the GECOS field
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3230
# Print the contents of $filename to the current output handle, passing
# every line through to_utf8().  Callers are expected to pass an existing
# file; if it nevertheless cannot be opened, a warning is emitted and
# nothing is printed.
sub insert_file {
        my $filename = shift;

        my $fd;
        unless (open $fd, '<', $filename) {
                warn "gitweb: cannot open '$filename': $!\n";
                return;
        }
        # stream line by line instead of slurping the whole file into a list
        while (my $line = <$fd>) {
                print to_utf8($line);
        }
        close $fd;
}
3239
3240## ......................................................................
3241## mimetype related functions
3242
# Look up the MIME type of $filename by its extension (the text after the
# last '.') in a mime.types-style file.
#
# Arguments: the file name to classify, and the path of the map file.  Each
# non-comment line of the map is "<mimetype> <ext> <ext> ...", separated by
# any whitespace (tabs or spaces).
#
# Returns the MIME type, or undef when the map is unreadable, the name has
# no extension, or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # Take the extension from the match result; reading $1 after a
        # failed match would give the capture of some earlier match.
        my ($ext) = $filename =~ /\.([^.]*)$/;
        return undef unless defined $ext;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        while (my $entry = <$mh>) {
                next if $entry =~ m/^#/; # skip comments
                # split on any whitespace: many mime.types files separate
                # the type from its extensions with spaces, not tabs
                my ($mimetype, @exts) = split(' ', $entry);
                foreach my $known_ext (@exts) {
                        $mimemap{$known_ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$ext};
}
3265
# Guess the MIME type of $filename from its extension.  The map configured
# in $mimetypes_file is consulted first (a relative path is resolved inside
# the current project's directory), then /etc/mime.types.  Returns undef
# for names without a '.' or when neither map gives a type.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # an absolute path is used as is; a relative one
                # is relative to project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime = mimetype_guess_file($filename, '/etc/mime.types')
                unless $mime;
        return $mime;
}
3282
# Determine the MIME type of a blob.
# Arguments: an open filehandle on the blob (may be false) and its file
# name (may be empty).  The file name is tried first via mimetype_guess();
# without a usable handle $default_blob_plain_mimetype is returned;
# otherwise the -T test and a few well-known image suffixes decide.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case
        $fd or return $default_blob_plain_mimetype;

        return 'text/plain'               if -T $fd;
        return 'application/octet-stream' unless $filename;
        return 'image/png'                if $filename =~ m/\.png$/i;
        return 'image/gif'                if $filename =~ m/\.gif$/i;
        return 'image/jpeg'               if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3309
# Build the Content-Type value for a blob.  A type passed as third argument
# is used as is, otherwise blob_mimetype() decides.  For 'text/plain' the
# charset from $default_text_plain_charset is appended when that is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name)
                unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);

        return $type . "; charset=$default_text_plain_charset";
}
3320
# Guess the syntax name to hand to the syntax highlighter for a file.
#
# Arguments: $highlight (true when highlighting is enabled), $mimetype
# (currently unused), and the file name.  A trailing '.in' is ignored.
# The base name is tried first, then the extension after the last '.'.
#
# Returns the syntax name, or undef if no highlighting should be done.
# The name of syntax can (in the future) depend on syntax highlighter used.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);

        # configuration for 'highlight' (http://www.andre-simon.de/)
        # match by basename
        my %highlight_basename = (
                #'Program' => 'py',
                #'Library' => 'py',
                'SConstruct' => 'py', # SCons equivalent of Makefile
                'Makefile' => 'make',
        );
        # match by extension
        # NOTE: every map() is parenthesised on purpose.  map takes the whole
        # rest of the list as its input, so without the parentheses the first
        # map would swallow all following entries and map each to itself.
        my %highlight_ext = (
                # main extensions, defining name of syntax;
                # see files in /usr/share/highlight/langDefs/ directory
                (map { $_ => $_ }
                        qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl)),
                # alternate extensions, see /etc/highlight/filetypes.conf
                'h' => 'c',
                (map { $_ => 'cpp' } qw(cxx c++ cc)),
                (map { $_ => 'php' } qw(php3 php4)),
                (map { $_ => 'pl'  } qw(perl pm)), # perhaps also 'cgi'
                'mak' => 'make',
                (map { $_ => 'xml' } qw(xhtml html htm)),
        );

        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # use the match result, not $1: after a failed match $1 would still
        # hold the capture of an earlier, unrelated match
        my ($ext) = $basename =~ /\.([^.]*)$/;
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3361
# Run the syntax highlighter on the current blob ($hash) and return a
# filehandle reading its output.  When highlighting is disabled or no
# syntax is known, the filehandle passed in is returned unchanged;
# otherwise it is closed and reopened on a "git cat-file | highlight" pipe.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        if (!$highlight || !defined $syntax) {
                return $fd;
        }

        close $fd
                or die_error(404, "Reading blob failed");

        my $pipeline = quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
                       "highlight --xhtml --fragment --syntax $syntax |";
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3375
3376## ======================================================================
3377## functions printing HTML: header, footer, error page
3378
# Compose the page title from the site name and, as far as each is defined,
# the current project, action and file name.  A '/' is appended to the file
# name in "tree" view unless the name already ends in one.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        }

        return $title;
}
3396
# Print the top of every HTML page: the HTTP header (unless suppressed),
# the XHTML prologue and <head> section, the optional site header file,
# the page header with logo and breadcrumb, and the search form.
#
# Arguments:
#   $status   HTTP status line, defaults to "200 OK"
#   $expires  value for the -expires header option
#   %opts     '-no_http_header' => true suppresses the HTTP header
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type;
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        if (defined $cgi->http('HTTP_ACCEPT') &&
            $cgi->http('HTTP_ACCEPT') =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
            $cgi->Accept('application/xhtml+xml') != 0) {
                $content_type = 'application/xhtml+xml';
        } else {
                $content_type = 'text/html';
        }
        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                           -status=> $status, -expires => $expires)
                unless ($opts{'-no_http_header'});
        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        if ($ENV{'PATH_INFO'}) {
                print "<base href=\"".esc_url($base_url)."\" />\n";
        }
        # print out each stylesheet that exist, providing backwards capability
        # for those people who defined $stylesheet in a config file
        if (defined $stylesheet) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($stylesheet).'"/>'."\n";
        } else {
                foreach my $stylesheet (@stylesheets) {
                        next unless $stylesheet;
                        print '<link rel="stylesheet" type="text/css" href="'.esc_url($stylesheet).'"/>'."\n";
                }
        }
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                # The list must be parenthesised: using a bare qw() as the
                # loop list is a syntax error in newer perl versions.
                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # feed with all commits
                        $href_params{'action'} = $type;
                        $link_attr{'-href'} = href(%href_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        # same feed without merge commits; 'extra_options' stays
                        # set in %href_params for the following iteration
                        $href_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%href_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
        }

        print "</head>\n" .
              "<body>\n";

        if (defined $site_header && -f $site_header) {
                insert_file($site_header);
        }

        print "<div class=\"page_header\">\n" .
              $cgi->a({-href => esc_url($logo_url),
                       -title => $logo_label},
                      qq(<img src=").esc_url($logo).qq(" width="72" height="27" alt="git" class="logo"/>));
        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        print " / $action";
                }
                print "\n";
        }
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                if (!defined $searchtext) {
                        $searchtext = "";
                }
                # search from the most specific revision known for this page
                my $search_hash;
                if (defined $hash_base) {
                        $search_hash = $hash_base;
                } elsif (defined $hash) {
                        $search_hash = $hash;
                } else {
                        $search_hash = "HEAD";
                }
                # target of the form; named so that it does not shadow the
                # global $action used for the breadcrumb above
                my $form_action = $my_uri;
                my $use_pathinfo = gitweb_check_feature('pathinfo');
                if ($use_pathinfo) {
                        $form_action .= "/".esc_url($project);
                }
                # start_form() is the supported spelling; the startform()
                # alias is gone from newer CGI.pm releases
                print $cgi->start_form(-method => "get", -action => $form_action) .
                      "<div class=\"search\">\n" .
                      (!$use_pathinfo &&
                      $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
                      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
                      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
                      $cgi->popup_menu(-name => 'st', -default => 'commit',
                                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
                      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
                      " search:\n",
                      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
                      "<span title=\"Extended regular expression\">" .
                      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                     -checked => $search_use_regexp) .
                      "</span>" .
                      "</div>" .
                      $cgi->end_form() . "\n";
        }
}
3550
# Print the bottom of every HTML page: the footer with the project
# description and feed links (or the OPML/TXT project list links when no
# project is selected), the optional timing information, the optional site
# footer file, the JavaScript includes, and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                if (defined $descr) {
                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
                }

                my %href_params = get_feed_info();
                if (!%href_params) {
                        $feed_class .= ' generic';
                }
                $href_params{'-title'} ||= 'log';

                # The list must be parenthesised: using a bare qw() as the
                # loop list is a syntax error in newer perl versions.
                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        } else {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        }
        print "</div>\n"; # class="page_footer"

        # $t0 is only set when Time::HiRes could be loaded
        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      Time::HiRes::tv_interval($t0, [Time::HiRes::gettimeofday()]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } elsif (gitweb_check_feature('javascript-actions')) {
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = fixLinks;\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
3616
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# The status code defaults to 500.  A code that is not in the list above is
# still shown in the page body, but the HTTP response is sent as 500 so that
# an error page never goes out with a "200 OK" status.
# The error message is HTML-escaped; the detailed description is printed
# as is.  Further arguments are options passed on to git_header_html();
# unless '-error_handler' is set, control jumps to DONE_GITWEB afterwards.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # an unknown code would otherwise become undef, which
        # git_header_html() replaces by its "200 OK" default
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
3660
3661## ----------------------------------------------------------------------
3662## functions printing or outputting HTML: navigation
3663
# Print the navigation bar of a project page.
#
# Arguments:
#   $current   name of the current view; printed as plain text, not a link
#   $suppress  name of a standard view to leave out of the bar
#   $head      hash used for the commit/commitdiff links and, for some
#              current views, for the shortlog/log links
#   $treehead  hash for the tree link
#   $treebase  hash base for the tree link
#   $extra     HTML printed on the second line (pager or formats)
#
# Entries configured through the 'actions' feature are inserted after the
# view they name as position; %n, %f, %h, %b and %% in their link are
# expanded.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters of every entry, keyed by its label
        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;

        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                push @with_head, qw(shortlog log)
                        if $current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x;
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        # the feature value is a flat list of (label, link, position) triples
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # insert the label right after every entry named $pos
                my @with_label;
                foreach my $nav (@navs) {
                        push @with_label, $nav;
                        push @with_label, $label if $nav eq $pos;
                }
                @navs = @with_label;
                # expand the placeholders
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries;
        foreach my $nav (@navs) {
                push @entries, ($nav eq $current ?
                        $nav : $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav"));
        }

        print "<div class=\"page_nav\">\n" .
                join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
3713
# Build the "first / prev / next" pager for a paged view and return it as
# an HTML string.  $page is the zero-based number of the current page;
# "first" and "prev" are links only past page 0, "next" only when
# $has_next_link is true.  The $action argument is accepted but not used.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my $backward = ($page > 0)
                ? $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
                  " &sdot; " .
                  $cgi->a({-href => href(-replay=>1, page=>$page-1),
                           -accesskey => "p", -title => "Alt-p"}, "prev")
                : "first &sdot; prev";

        my $forward = $has_next_link
                ? " &sdot; " .
                  $cgi->a({-href => href(-replay=>1, page=>$page+1),
                           -accesskey => "n", -title => "Alt-n"}, "next")
                : " &sdot; next";

        return $backward . $forward;
}
3739
3740## ......................................................................
3741## functions printing or outputting HTML: div
3742
# Print the "header" div: a single link to the given action.  $hash and
# $hash_base become link parameters when true; the link text is $title,
# or the action name when no title is given.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (
                'action' => $action,
                ($hash      ? ('hash'      => $hash)      : ()),
                ($hash_base ? ('hash_base' => $hash_base) : ()),
        );
        my $label = $title ? $title : $action;

        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
3756
# Print what format_local_time() returns for the given date fields.
sub print_local_time {
        my @date_fields = @_;
        print format_local_time(@date_fields);
}
3760
# Format the local time of a date as " (HH:MM TZ)".  Takes the date as
# key/value pairs and reads 'hour_local', 'minute_local' and 'tz_local'.
# Times before 06:00 are wrapped in a span of class "atnight".
sub format_local_time {
        my %date = @_;

        my $format = ($date{'hour_local'} < 6)
                ? " (<span class=\"atnight\">%02d:%02d</span> %s)"
                : " (%02d:%02d %s)";

        return '' . sprintf($format,
                $date{'hour_local'}, $date{'minute_local'}, $date{'tz_local'});
}
3774
# Print the author name and author date of commit $co in long form.
# Options: -tag => name of the enclosing HTML element (default 'div'),
#          -localtime => true to append the author's local time.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
        my $author_link = format_search_author($author, "author", esc_html($author));

        print "<$tag class=\"author_date\">" . $author_link . " [$ad{'rfc2822'}";
        if ($opts{-localtime}) {
                print_local_time(%ad);
        }
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);
        print "]" . $avatar . "</$tag>\n";
}
3790
# Print table rows with the full author and/or committer information, in
# the layout used by the 'commit' view (& similar).
# Arguments: the commit hash reference, then the roles to print
# ('author', 'committer'); an empty list means both, in that order.
# Every role produces two rows: name, e-mail and avatar, then the date.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') if !@people;

        for my $who (@people) {
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});
                my ($name, $email) = ($co->{"${who}_name"}, $co->{"${who}_email"});

                my $name_link  = format_search_author($name, $who,
                                         esc_html($name));
                my $email_link = format_search_author($email, $who,
                                         esc_html("<" . $email . ">"));
                my $avatar     = git_get_avatar($email, -size => 'double');

                print "<tr><td>$who</td><td>" .
                      $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td> $wd{'rfc2822'}";
                print_local_time(%wd);
                print "</td>" .
                      "</tr>\n";
        }
}
3818
# Print the "page_path" breadcrumb: a link to the tree root labelled with the
# project name, followed by one link per directory component of $name and
# finally the last path component.
#
# Parameters:
#   $name - path of the object being shown; nothing beyond the root link is
#           printed when it is undefined
#   $type - 'blob' links the last component to the "blob_plain" action,
#           'tree' links it to the "tree" action; anything else (or undef)
#           prints the last component as plain escaped text
#   $hb   - value passed as hash_base to every generated link
#
# Uses the globals $cgi and $project.
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # compare against '' rather than testing truthiness, so that
                        # a leading directory called "0" still gets its separator
                        $fullname .= ($fullname eq '' ? '' : '/') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # the links below are built from the $name argument (not from the
                # global $file_name), so they always agree with the title and label
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
3856
# Print a commit message as HTML, one "<br/>"-terminated line per log line.
#
# Parameters:
#   $log  - arrayref of log lines; NOTE: it is modified in place (the title
#           and leading empty lines are shifted off)
#   %opts - optional settings:
#             -remove_title     => drop the first line of the log
#             -remove_signoff   => do not print signoff-like lines
#                                  (Signed-off-by / Acked-by / Cc)
#             -final_empty_line => make sure the output ends with an empty line
#
# Runs of empty lines are collapsed into one, and empty lines that directly
# follow a printed signoff line are dropped.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # last printed line was a signoff line
        my $empty = 0;   # last printed line was an empty line
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        # a removed signoff line produces no output, so it must not
                        # disturb the empty-line bookkeeping either
                        next if $opts{'-remove_signoff'};

                        $signoff = 1;
                        $empty = 0;
                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        # only real content ends the "after signoff" state; resetting
                        # it earlier would make the check above a no-op
                        $empty = 0;
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
3905
# Return what a symbolic link points to, i.e. the whole content of the blob
# $hash as printed by "cat-file blob".  Returns nothing (undef in scalar
# context) when the command cannot be started or closing the pipe fails.
sub git_get_link_target {
        my ($hash) = @_;

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;

        # slurp the complete output in a single read
        my $link_target = do { local $/; <$fd> };

        close $fd
                or return;

        return $link_target;
}
3923
# Given a link target and the directory (basedir) the link lives in, return
# the target as a path relative to the top directory (top tree).
#
# Parameters:
#   $link_target - content of the symbolic link
#   $basedir     - directory containing the link; empty or undefined for the
#                  top (root) tree
#
# Returns the normalized path ('//', '/./' and '/../' removed), or nothing
# (undef in scalar context) when the link cannot be normalized: absolute
# targets, and targets that lead outside the top directory.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # compare against '' so that a directory named "0" is not mistaken
        # for the top tree
        my $path = (defined $basedir && $basedir ne '')
                 ? $basedir . '/' . $link_target
                 : $link_target;

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' (but keep components such as "0", which
                # are false in boolean context yet perfectly valid names)
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        # link leads outside repository (outside top dir)
                        return unless @path_parts;
                        pop @path_parts;
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
3963
# Print the table cells for one tree entry (a row of git_tree); the enclosing
# <tr> element is left to the caller.
#
# Parameters:
#   $t          - hashref describing the entry; the 'mode', 'type', 'hash',
#                 'name' and (if present) 'size' keys are read
#   $basedir    - string prepended verbatim to the entry name to build the
#                 file_name link parameter
#   $hash_base  - value passed as hash_base to the links; "history" links are
#                 only printed when it is defined
#   $have_blame - if true, blobs get an additional "blame" link
#
# The cells are, in order: mode, (optional) size, name, action links.
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        # hash_base is handed to href() through this hash only when defined
        my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
        my $type = $t->{'type'};

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n" if exists $t->{'size'};

        if ($type eq "blob") {
                my $path = "$basedir$t->{'name'}";
                my $hash = $t->{'hash'};

                # name cell; symbolic links additionally show their target
                print "<td class=\"list\">" .
                        $cgi->a({-href => href(action=>"blob", hash=>$hash,
                                               file_name=>$path, %base_key),
                                -class => "list"}, esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        my $link_target = git_get_link_target($hash);
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                # the target is only made clickable when it could be
                                # normalized to a path inside the tree
                                print " -> " .
                                      (defined $norm_target
                                        ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                 file_name=>$norm_target),
                                                   -title => $norm_target}, esc_path($link_target))
                                        : esc_path($link_target));
                        }
                }
                print "</td>\n";

                # action links cell
                print "<td class=\"link\">";
                print $cgi->a({-href => href(action=>"blob", hash=>$hash,
                                             file_name=>$path, %base_key)},
                              "blob");
                print " | " .
                      $cgi->a({-href => href(action=>"blame", hash=>$hash,
                                             file_name=>$path, %base_key)},
                              "blame")
                        if $have_blame;
                print " | " .
                      $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                             hash=>$hash, file_name=>$path)},
                              "history")
                        if defined $hash_base;
                print " | " .
                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                               file_name=>$path)},
                                "raw");
                print "</td>\n";

        } elsif ($type eq "tree") {
                my $path = "$basedir$t->{'name'}";
                my $hash = $t->{'hash'};

                print "<td class=\"list\">";
                print $cgi->a({-href => href(action=>"tree", hash=>$hash,
                                             file_name=>$path,
                                             %base_key)},
                              esc_path($t->{'name'}));
                print "</td>\n";

                print "<td class=\"link\">";
                print $cgi->a({-href => href(action=>"tree", hash=>$hash,
                                             file_name=>$path,
                                             %base_key)},
                              "tree");
                print " | " .
                      $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                             file_name=>$path)},
                              "history")
                        if defined $hash_base;
                print "</td>\n";

        } else {
                # any other object type (this includes 'commit' entries, i.e.
                # submodules): only a history link can be offered
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";
                print "<td class=\"link\">";
                if (defined $hash_base) {
                        my $path = "$basedir$t->{'name'}";
                        print $cgi->a({-href => href(action=>"history",
                                                     hash_base=>$hash_base,
                                                     file_name=>$path)},
                                      "history");
                }
                print "</td>\n";
        }
}
4056
4057## ......................................................................
4058## functions printing large fragments of HTML
4059
# Fill in the pre-image file names of a merge (combined) diff entry.
#
# Parameters:
#   $diff    - hashref of a parsed combined difftree line; 'nparents',
#              'status' and 'from_id' are read, 'from_file' is (re)created
#   @parents - ids of the parent commits, in the same order as the per-parent
#              arrays in $diff
#
# After the call $diff->{'from_file'} has one slot per parent; a slot is only
# filled (via git_get_path_by_hash) when the status for that parent is
# 'R' or 'C', all other slots stay undefined.  Returns $diff.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $last = $diff->{'nparents'} - 1;
        my $from_file = $diff->{'from_file'} = [ ];
        # pre-size the list to one slot per parent
        $from_file->[$last] = undef;

        foreach my $i (0 .. $last) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4076
# Tell whether a parsed raw difftree line describes a file deletion, i.e.
# whether its 'to_id' is the all-zero object id (forty '0' characters).
sub is_deleted {
        my ($diffinfo) = @_;

        my $null_id = '0' x 40;
        return $diffinfo->{'to_id'} eq $null_id;
}
4083
# Tell whether a patch belongs to the [previous] raw difftree line, which is
# the case when both describe the same resulting file name.
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# False whenever either argument is undefined.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_given = defined $diffinfo && defined $patchinfo;

        return $both_given
                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4094
4095
# Print the list of files changed by a commit ("difftree") as an HTML table
# of class "diff_tree", one row per changed file.
#
# Parameters:
#   $difftree - arrayref of raw difftree lines; every element is handed to
#               parsed_difftree_line()
#   $hash     - id of the commit whose changes are listed; used as hash_base
#               for links to the resulting files
#   @parents  - ids of the parent commit(s); with more than one parent the
#               table gets the additional class "combined"
#
# Reads the global $action: in the 'commitdiff' view each row links to the
# matching "#patchN" anchor, otherwise modified files get a "diff" link.
# The "blame" links depend on gitweb_check_feature('blame').
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1; # toggles between "dark" and "light" rows
        my $patchno = 0;   # number of the "#patchN" anchor for the current row
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => "#patch$patchno"}, "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent; meanwhile collect whether the file has
                        # any history and whether it survives in the result
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # an all-zero mode means "no such side"; the variables for that
                # side are then left undefined
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        # test the source mode itself: the destination mode may be
                        # undefined here, or belong to a different file type
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => "#patch$patchno"}, "patch");
                                print " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file only exists in the parent, so links use $parent
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => "#patch$patchno"}, "patch");
                                print " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => "#patch$patchno"}, "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => "#patch$patchno"}, "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # the resulting file lives in the commit itself, so its blob
                        # link uses $hash as hash_base, like the link in the first cell
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4398
# Print a whole patchset as HTML, reading "git diff" patch output from $fd.
#
# Parameters:
#   $fd           - filehandle to read the patch text from; everything before
#                   the first line starting with "diff " is skipped
#   $difftree     - array ref; its elements are handed one at a time to
#                   parsed_difftree_line() to describe the file a patch is for
#   $hash         - not read by this sub (kept so callers need not change)
#   @hash_parents - parents of the commit; more than one switches on the
#                   combined-diff handling
#
# All output is print-ed to the currently selected filehandle; there is no
# meaningful return value.
sub git_patchset_body {
        my ($fd, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;      # index into @$difftree of the current raw line
        my $patch_number = 0;   # number of patch <div>s emitted so far
        my $patch_line;
        my $diffinfo;
        my $to_name;
        my (%from, %to);

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # input ended inside the extended header; "last" skips the
                        # continue block, so close the patch <div> here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                # The input may end right after the "---" line; use an empty
                # "+++" line then instead of chomp-ing (and passing on) undef.
                $patch_line = '' unless defined $patch_line;
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        print format_diff_line($patch_line, \%from, \%to);
                }

        } continue {
                # runs on "next PATCH" and when the body falls off its end
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
4549
4550# . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4551
# Collects the per-project details shown in the project list (age,
# description, owner, forks, ctags) for every entry of @$projlist and
# returns the entries that could be filled in.  A project for which
# git_get_last_activity() returns an empty list is left out of the result.
# NOTE: the project hashes are updated in place, but @$projlist itself
# keeps all of its entries.
sub fill_project_list_info {
        my ($projlist, $check_forks) = @_;

        my $show_ctags = gitweb_check_feature('ctags');
        my @filled;

        foreach my $pr (@$projlist) {
                my @last_activity = git_get_last_activity($pr->{'path'});
                next unless @last_activity;
                @{$pr}{'age', 'age_string'} = @last_activity;

                # description: only looked up when the entry has none yet
                unless (defined $pr->{'descr'}) {
                        my $long = git_get_project_description($pr->{'path'}) || "";
                        $long = to_utf8($long);
                        $pr->{'descr_long'} = $long;
                        $pr->{'descr'} = chop_str($long, $projects_list_description_width, 5);
                }

                # owner: same, with "" when the lookup gives nothing
                unless (defined $pr->{'owner'}) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }

                # forks: "foo.git" counts as having forks when a directory "foo"
                # exists next to it under $projectroot
                if ($check_forks) {
                        my $forks_dir = $pr->{'path'};
                        my $has_forks = ($forks_dir =~ s/\.git$//)
                                     && ($forks_dir !~ /\/$/)
                                     && (-d "$projectroot/$forks_dir");
                        $pr->{'forks'} = $has_forks ? "-d $projectroot/$forks_dir" : 0;
                }

                if ($show_ctags) {
                        $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
                }

                push @filled, $pr;
        }

        return @filled;
}
4592
# Prints the 'sort by' <th> element built by format_sort_th(); the
# arguments are passed through unchanged (name, current order, header).
sub print_sort_th {
        my @th_args = @_;
        print format_sort_th(@th_args);
}
4598
# Returns the <th> cell for a sortable column.
#   $name   - order name this column sorts by
#   $order  - order currently in effect
#   $header - text shown in the cell; defaults to ucfirst($name)
# The cell is plain text when the list is already sorted by $name,
# otherwise the text links to a replay of the current request with
# order=$name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # already sorted by this column: nothing to link to
        return "<th>$header</th>\n" if $order eq $name;

        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
4615
# Prints the table of projects used by the project list and forks views.
#
# Parameters:
#   $projlist  - array ref of project hashes; run through
#                fill_project_list_info() first
#   $order     - column to sort by ('project', 'descr', 'owner' or 'age');
#                $default_projects_order is used when it is false.  An order
#                with no entry in %order_info (e.g. 'none') leaves the list
#                in the order fill_project_list_info() returned it.
#   $from, $to - index range (after sorting) of the rows to print; defaults
#                to the whole list
#   $extra     - if defined, HTML for one more row at the end of the table
#   $no_header - when true, the row of column headers is not printed
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;

        my $check_forks = gitweb_check_feature('forks');
        my @projects = fill_project_list_info($projlist, $check_forks);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );
        # Only sort when the order is one we know a key for; otherwise the
        # comparison would run on an undefined hash key.
        my $oi = defined $order ? $order_info{$order} : undef;
        if (defined $oi) {
                my $sort_key = $oi->{'key'};
                if ($oi->{'type'} eq 'str') {
                        @projects = sort { $a->{$sort_key} cmp $b->{$sort_key} } @projects;
                } else {
                        @projects = sort { $a->{$sort_key} <=> $b->{$sort_key} } @projects;
                }
        }

        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my %ctags;
                foreach my $p (@projects) {
                        foreach my $ct (keys %{$p->{'ctags'}}) {
                                $ctags{$ct} += $p->{'ctags'}->{$ct};
                        }
                }
                my $cloud = git_populate_project_tagcloud(\%ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        # $searchtext is raw user input, so it must not be used as a pattern
        # directly.  Match with $search_regexp, the pattern
        # git_search_grep_body() uses (presumably already quoted when regexp
        # search is off -- confirm where it is set), and quote the text
        # ourselves should that pattern not be available.
        my $search_re;
        if ($searchtext) {
                $search_re = defined $search_regexp ? $search_regexp
                                                    : quotemeta($searchtext);
        }

        my $alternate = 1;
        my $tagfilter = $cgi->param('by_tag');
        for (my $i = $from; $i <= $to; $i++) {
                my $pr = $projects[$i];

                next if $tagfilter and $show_ctags and not grep { lc $_ eq lc $tagfilter } keys %{$pr->{'ctags'}};
                next if defined $search_re and not $pr->{'path'} =~ /$search_re/
                        and not $pr->{'descr_long'} =~ /$search_re/;
                # Weed out forks or non-matching entries of search
                if ($check_forks) {
                        my $forkbase = $project; $forkbase ||= ''; $forkbase =~ s#\.git$#/#;
                        $forkbase="^$forkbase" if $forkbase;
                        next if not $searchtext and not $tagfilter and $show_ctags
                                and $pr->{'path'} =~ m#$forkbase.*/.*#; # regexp-safe
                }

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                # NOTE(review): 'forks' holds "-d <dir>" as set by
                                # fill_project_list_info(), so this comment shows a
                                # path under $projectroot to the client
                                print "<!-- $pr->{'forks'} -->\n";
                                print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "+");
                        }
                        print "</td>\n";
                }
                print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                        -class => "list"}, esc_html($pr->{'path'})) . "</td>\n" .
                      "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                        -class => "list", -title => $pr->{'descr_long'}},
                                        esc_html($pr->{'descr'})) . "</td>\n" .
                      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
                print "<td class=\"". age_class($pr->{'age'}) . "\">" .
                      (defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits") . "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary")}, "summary")   . " | " .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"shortlog")}, "shortlog") . " | " .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"log")}, "log") . " | " .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"tree")}, "tree") .
                      ($pr->{'forks'} ? " | " . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks") : '') .
                      "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4722
# Prints the body of the "log" view: for each commit a header, a bar of
# links, the authorship line and the full commit message.
#
# Parameters:
#   $commitlist - array ref of commit hashes
#   $from, $to  - first and last index into @$commitlist to show; $from
#                 defaults to 0 and $to is capped at the last index
#   $refs       - handed to format_ref_marker()
#   $extra      - when true, HTML printed in a "page_nav" div after the commits
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from, like the other *_body subs in this file do
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                # NOTE(review): %ad is never read below; the call looks
                # removable if parse_date() has no side effects -- confirm
                my %ad = parse_date($co{'author_epoch'});
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
4762
# Prints the "shortlog" table: one row per commit with its date, author,
# subject and a cell of navigation links.
#   $commitlist - array ref of commit hashes
#   $from, $to  - index range to print ($from defaults to 0, $to is capped
#                 at the last index)
#   $refs       - handed to format_ref_marker()
#   $extra      - if defined, HTML put into a last row spanning 4 columns
sub git_shortlog_body {
        # relies on the global $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 if !defined $from;
        if (!defined $to || $#{$commitlist} < $to) {
                $to = $#{$commitlist};
        }

        print "<table class=\"shortlog\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate dark / light, starting dark
                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
                my $commitdiff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
                print "</td>\n<td class=\"link\">$commit_link | $commitdiff_link | $tree_link";

                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links if defined $snapshot_links;

                print "</td>\n</tr>\n";
        }

        print "<tr>\n<td colspan=\"4\">$extra</td>\n</tr>\n" if defined $extra;
        print "</table>\n";
}
4806
# Prints the "history" table for one path: a row per commit with date,
# author, subject and links to that commit's version of the path.
#   $commitlist - array ref of commit hashes; empty hashes are skipped
#   $from, $to  - index range to print ($from defaults to 0, $to is capped
#                 at the last index)
#   $refs       - handed to format_ref_marker()
#   $extra      - if defined, HTML put into a last row spanning 4 columns
#   $file_name  - path the history is about
#   $file_hash  - hash of the current version; used for "diff to current"
#   $ftype      - used both as action name and link text ('blob' also
#                 enables the "diff to current" link)
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        $from = 0 if !defined $from;
        if (!defined $to || $to > $#{$commitlist}) {
                $to = $#{$commitlist};
        }

        print "<table class=\"history\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate dark / light, starting dark
                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                # shortlog uses format_author_html('td', \%co, 10) here
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $view_link =
                        $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
                my $commitdiff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                print "</td>\n<td class=\"link\">$view_link | $commitdiff_link";

                if ($ftype eq 'blob') {
                        # offer a diff only when this commit's blob differs from the current one
                        my $blob_parent = git_get_hash_by_path($commit, $file_name);
                        if (defined $file_hash && defined $blob_parent &&
                            $file_hash ne $blob_parent) {
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$file_hash, hash_parent=>$blob_parent,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n</tr>\n";
        }

        print "<tr>\n<td colspan=\"4\">$extra</td>\n</tr>\n" if defined $extra;
        print "</table>\n";
}
4866
# Prints the "tags" table: a row per tag with age, name, subject, a link
# to the tag object itself (for annotated tags) and links to what the tag
# points at.
#   $taglist   - array ref of tag hashes
#   $from, $to - index range to print ($from defaults to 0, $to is capped
#                at the last index)
#   $extra     - if defined, HTML put into a last row spanning 5 columns
sub git_tags_body {
        # relies on the global $project
        my ($taglist, $from, $to, $extra) = @_;

        $from = 0 if !defined $from;
        if (!defined $to || $#{$taglist} < $to) {
                $to = $#{$taglist};
        }

        print "<table class=\"tags\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my $entry = $taglist->[$idx];
                my %tag = %$entry;

                my $comment = $tag{'subject'};
                my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

                # rows alternate dark / light, starting dark
                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                my $age_cell = defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n"
                                                   : "<td></td>\n";
                print $age_cell;

                # tag name, linking to the object the tag refers to
                print "<td>" .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                               -class => "list name"}, esc_html($tag{'name'})) .
                      "</td>\n<td>";
                if (defined $comment) {
                        print format_subject_html($comment, $comment_short,
                                                  href(action=>"tag", hash=>$tag{'id'}));
                }
                print "</td>\n<td class=\"selflink\">";

                # only tag objects get a link to their own "tag" view
                if ($tag{'type'} eq "tag") {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                } else {
                        print "&nbsp;";
                }

                my $target_link =
                        $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
                print "</td>\n<td class=\"link\"> | $target_link";

                if ($tag{'reftype'} eq "commit") {
                        my $shortlog_link =
                                $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
                        my $log_link =
                                $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                        print " | $shortlog_link | $log_link";
                } elsif ($tag{'reftype'} eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n</tr>";
        }

        print "<tr>\n<td colspan=\"5\">$extra</td>\n</tr>\n" if defined $extra;
        print "</table>\n";
}
4929
# Prints the "heads" table: a row per head with its age, its name (marked
# when its id equals $head) and shortlog / log / tree links.
#   $headlist  - array ref of head hashes
#   $head      - id compared against each entry's 'id' to mark the current head
#   $from, $to - index range to print ($from defaults to 0, $to is capped
#                at the last index)
#   $extra     - if defined, HTML put into a last row spanning 3 columns
sub git_heads_body {
        # relies on the global $project
        my ($headlist, $head, $from, $to, $extra) = @_;

        $from = 0 if !defined $from;
        if (!defined $to || $#{$headlist} < $to) {
                $to = $#{$headlist};
        }

        print "<table class=\"heads\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my $entry = $headlist->[$idx];
                my %ref = %$entry;
                my $is_current = $ref{'id'} eq $head;

                # rows alternate dark / light, starting dark
                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                my $name_cell_open = $is_current ? "<td class=\"current_head\">" : "<td>";
                my $name_link =
                        $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                                 -class => "list name"},esc_html($ref{'name'}));
                my $shortlog_link =
                        $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog");
                my $log_link =
                        $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'name'})}, "tree");

                print "<td><i>$ref{'age'}</i></td>\n" .
                      $name_cell_open . $name_link . "</td>\n" .
                      "<td class=\"link\">$shortlog_link | $log_link | $tree_link</td>\n" .
                      "</tr>";
        }

        print "<tr>\n<td colspan=\"3\">$extra</td>\n</tr>\n" if defined $extra;
        print "</table>\n";
}
4967
# Prints the table of commit-search results: a row per commit with date,
# author, linked subject, every line of the commit message that matches
# $search_regexp (with the match highlighted) and navigation links.
#   $commitlist - array ref of commit hashes; empty hashes are skipped
#   $from, $to  - index range to print ($from defaults to 0, $to is capped
#                 at the last index)
#   $extra      - if defined, HTML put into a last row spanning 3 columns
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;

        $from = 0 if !defined $from;
        if (!defined $to || $#{$commitlist} < $to) {
                $to = $#{$commitlist};
        }

        print "<table class=\"commit_search\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;
                my $commit = $co{'id'};

                # rows alternate dark / light, starting dark
                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                my $comment = $co{'comment'};
                foreach my $line (@$comment) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($before, $hit, $after) = ($1, $2, $3);

                        # shorten the match first, then share what is left of an
                        # 80 column budget (at most 30 each) between both sides
                        $hit = chop_str($hit, 70, 5, 'center');
                        my $context_len = int((80 - length($hit))/2);
                        if ($context_len > 30) {
                                $context_len = 30;
                        }
                        $before = chop_str($before, $context_len, 10, 'left');
                        $after  = chop_str($after,  $context_len, 10, 'right');

                        $before = esc_html($before);
                        $hit    = esc_html($hit);
                        $after  = esc_html($after);

                        print "$before<span class=\"match\">$hit</span>$after<br />";
                }

                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit");
                my $commitdiff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                print "</td>\n<td class=\"link\">$commit_link | $commitdiff_link | $tree_link";
                print "</td>\n</tr>\n";
        }

        print "<tr>\n<td colspan=\"3\">$extra</td>\n</tr>\n" if defined $extra;
        print "</table>\n";
}
5027
5028## ======================================================================
5029## ======================================================================
5030## actions
5031
# "project_list" action: prints the page listing all projects, with the
# optional $home_text include and the project search form above the table.
# Dies with 400 when the 'order' parameter is not one of the known orders
# and with 404 when git_get_projects_list() returns nothing.
sub git_project_list {
        my $order = $input_params{'order'};
        # anchored: the whole value has to be one of the known orders, not
        # merely contain one
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        print $cgi->startform(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
5057
# "forks" action: prints the page listing what git_get_projects_list()
# returns for the current $project.
# Dies with 400 when the 'order' parameter is not one of the known orders
# and with 404 when the list is empty.
sub git_forks {
        my $order = $input_params{'order'};
        # anchored: the whole value has to be one of the known orders, not
        # merely contain one
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
5075
# "project_index" action: prints a text/plain index with one
# "<path> <owner>" line per project returned by git_get_projects_list().
# Both fields are percent-encoded, with '/' kept as is and ' ' written
# as '+'.
sub git_project_index {
        my @projects = git_get_projects_list($project);

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                if (!exists $pr->{'owner'}) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}");
                }

                my ($path, $owner) = ($pr->{'path'}, $pr->{'owner'});
                # An owner may be undefined here; print an empty field then
                # (fill_project_list_info() likewise defaults a missing owner
                # to "").
                $owner = '' unless defined $owner;

                # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
                for my $field ($path, $owner) {
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$path $owner\n";
        }
}
5099
# Action: render the summary page of the current $project.
#
# Prints a metadata table (description, owner, last change, clone URLs and,
# when the 'ctags' feature is on, the content-tag cloud), the README.html
# (unless $prevent_xss is set), and abbreviated shortlog / tags / heads /
# forks sections.  Each abbreviated section shows at most 16 entries followed
# by a "..." link when more are available.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
        my $head = $co{'id'};

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my @forklist;
        my $check_forks = gitweb_check_feature('forks');

        if ($check_forks) {
                @forklist = git_get_projects_list($project);
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td><td>$cd{'rfc2822'}</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my $url_tag = "URL";
        my @url_list = git_get_project_url_list($project);
        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
        foreach my $git_url (@url_list) {
                next unless $git_url;
                # The URL is plain text (it may contain '&', '<', ...), so it
                # is escaped like the description and owner cells above.
                print "<tr class=\"metadata_url\"><td>$url_tag</td><td>" .
                      esc_html($git_url) . "</td></tr>\n";
                # only the first URL row carries the "URL" label
                $url_tag = "";
        }

        # Tag cloud
        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my $ctags = git_get_project_ctags($project);
                my $cloud = git_populate_project_tagcloud($ctags);
                print "<tr id=\"metadata_ctags\"><td>Content tags:<br />";
                print "</td>\n<td>" unless %$ctags;
                # the project name goes into an attribute value, hence esc_attr
                print "<form action=\"$show_ctags\" method=\"post\"><input type=\"hidden\" name=\"p\" value=\"" .
                      esc_attr($project) .
                      "\" />Add: <input type=\"text\" name=\"t\" size=\"8\" /></form>";
                print "</td>\n<td>" if %$ctags;
                print git_show_project_tagcloud($cloud, 48);
                print "</td></tr>";
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file("$projectroot/$project/README.html");
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist = $head ? parse_commits($head, 17) : ();
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $#commitlist <=  15 ? undef :
                                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $#taglist <=  15 ? undef :
                              $cgi->a({-href => href(action=>"tags")}, "..."));
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $#headlist <= 15 ? undef :
                               $cgi->a({-href => href(action=>"heads")}, "..."));
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $#forklist <= 15 ? undef :
                                      $cgi->a({-href => href(action=>"forks")}, "..."),
                                      'no_header');
        }

        git_footer_html();
}
5200
# Action: render the page for the tag object named by $hash.
#
# Dies with a 404 error when parse_tag() yields nothing for $hash.
sub git_tag {
        # Parse and validate the tag before anything is printed, so that the
        # error page is not emitted after the regular page header has
        # already gone out.
        my %tag = parse_tag($hash);

        if (! %tag) {
                die_error(404, "Unknown tag object");
        }

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);

        git_print_header_div('commit', esc_html($tag{'name'}), $hash);
        # object header: tagged object id and type, both linking to the
        # action named after the object type
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                               $tag{'object'}) . "</td>\n" .
              "<td class=\"link\">" . $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                                              $tag{'type'}) . "</td>\n" .
              "</tr>\n";
        if (defined($tag{'author'})) {
                git_print_authorship_rows(\%tag, 'author');
        }
        print "</table>\n\n" .
              "</div>\n";
        # tag message, one escaped line per <br/>
        print "<div class=\"page_body\">";
        my $comment = $tag{'comment'};
        foreach my $line (@$comment) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
5235
# Shared implementation of the blame actions.
#
# The optional first argument selects the output format:
#   'porcelain'   (default) - complete HTML blame page built from
#                             "git blame -p" output
#   'incremental'           - HTML page holding only the file contents
#                             (from "git cat-file blob"), plus progress
#                             placeholders
#   'data'                  - text/plain stream of "git blame --incremental"
#                             output, terminated by an "END" line
# A 'porcelain' request with a true 'js' CGI parameter is switched to
# 'incremental'.
#
# Dies with 403 when the 'blame' feature is disabled, 400/404 on a missing
# file name, commit or blob, and 500 when the git command cannot be started.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact string comparison; also covers the case where no
                # type could be determined at all
                if (!defined $ftype || $ftype ne 'blob') {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                print while <$fd>;
                close $fd
                        or print "ERROR $!\n";

                print 'END';
                # optional timing info: elapsed time and number of git commands
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              Time::HiRes::tv_interval($t0, [Time::HiRes::gettimeofday()]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        # row classes alternate between consecutive groups of lines
        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit and line-number links are left empty here
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        # per-commit "<key> <value>" lines follow the header,
                        # up to the TAB-prefixed line holding the file contents
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        # first value seen for a key wins
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a header carrying <lines in group> starts a new group
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell per group, spanning all its rows
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line-number link blames the parent commit when
                        # one is known, otherwise the blamed commit itself
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
5465
# Action: blame view in the default format of git_blame_common().
sub git_blame {
        return git_blame_common();
}
5469
# Action: blame view in the 'incremental' format of git_blame_common().
sub git_blame_incremental {
        return git_blame_common('incremental');
}
5473
# Action: blame output in the 'data' format of git_blame_common().
sub git_blame_data {
        return git_blame_common('data');
}
5477
# Action: render the page listing the tags of the current $project.
sub git_tags {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('', '', $head_hash, undef, $head_hash);
        git_print_header_div('summary', $project);

        # the table is printed only when there is at least one tag
        my @tags = git_get_tags_list();
        git_tags_body(\@tags) if @tags;

        git_footer_html();
}
5490
# Action: render the page listing the heads of the current $project.
sub git_heads {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('', '', $head_hash, undef, $head_hash);
        git_print_header_div('summary', $project);

        # the table is printed only when there is at least one head
        my @heads = git_get_heads_list();
        git_heads_body(\@heads, $head_hash) if @heads;

        git_footer_html();
}
5503
# Action: send the raw contents of a blob.
#
# The optional first argument is a content type, handed on to
# blob_contenttype().  The blob is taken from $hash, or looked up from
# $file_name in $hash_base (or in the project's head when no base is given).
#
# Dies with 400 when neither a hash nor a file name is available, 404 when
# the file cannot be found, and 500 when git-cat-file cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name is placed inside a quoted string in an HTTP header below:
        # neutralise control characters (the same substitution snapshot_name()
        # applies) and backslash-escape the characters that would otherwise
        # end or corrupt the quoted string.
        $save_as =~ s/[[:cntrl:]]/?/g;
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))$!;

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp the blob and pass it through unmodified
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
5556
# Action: render a blob as an HTML page.
#
# The blob is taken from $hash, or looked up from $file_name in $hash_base
# (or in the project's head when no base is given).  Images of a few known
# types are shown through an <img> tag pointing at the blob_plain action;
# other content that is neither text/* nor one of those images, and that
# tests as binary, is handed over to git_blob_plain().  Everything else is
# printed line by line with line-number anchors, optionally run through the
# highlighter.
#
# Dies with 400 when neither a hash nor a file name is available, 404 when
# the file cannot be found, and 500 when git-cat-file cannot be started.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: empty navigation, blob id as title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                print qq! src="! .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        } else {
                # The link back to this very page is identical for every
                # line, so it is built once rather than once per line.
                my $self_link = esc_attr(href(-replay => 1));
                my $nr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # highlighter output is printed as is; plain text is escaped
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, $self_link, $nr, $nr, $syntax ? $line : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
5648
# Action: render the listing of a tree object.
#
# The tree is taken from $hash, or looked up from $file_name in $hash_base
# (defaulting to "HEAD"), or is $hash_base itself when neither is given.
#
# Dies with 404 when no tree can be determined or reading it fails, and with
# 500 when git-ls-tree cannot be started.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # ls-tree -z separates entries with NUL
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # base is not a parsable commit: forget it, so that the links
                # printed below do not refer to it
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        # rows alternate between the "dark" and "light" classes, dark first
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                print '<tr class="' . ($alternate ? 'dark' : 'light') . "\">\n";
                $alternate ^= 1;

                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                # An empty parent means the top-level tree.  Compare against
                # the empty string rather than testing truth, so that a
                # parent directory literally named "0" is still linked to.
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                print '<tr class="' . ($alternate ? 'dark' : 'light') . "\">\n";
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
5758
# Build the "<project>-<version>" name used for a snapshot of $hash in
# $project.
#
# In list context the name is returned twice (the caller in this file
# assigns the pair to a name and a prefix); in scalar context it is
# returned once.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        (my $base = to_utf8($project)) =~ s,([^/])/*\.git$,$1,;
        $base = basename($base);
        # sanitize name
        $base =~ s/[[:cntrl:]]/?/g;

        my $version;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash, but only when it is a prefix of the
                # full object name and longer than 7 characters
                my $full_hash = git_get_full_hash($project, $hash);
                my $shorten = ($full_hash =~ /^$hash/ && length($hash) > 7);
                $version = $shorten ? git_get_short_hash($project, $hash) : $hash;
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $version = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                my $label = ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!) ? $1 : $hash;
                $version = $label . '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $version =~ s!/!.!g;

        # name = project-version_string
        my $snapshot = "$base-$version";

        return wantarray ? ($snapshot, $snapshot) : $snapshot;
}
5795
# Action handler: send a snapshot archive of the tree-ish named by $hash.
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  It is validated against
# %known_snapshot_formats and @snapshot_fmts before "git archive" is run,
# optionally piped through the format's 'compressor' command.
#
# Problems are reported through die_error():
#   403 - snapshots disabled, or the format is disabled / not offered
#   400 - malformed or unknown format, or the object is a blob
#   404 - the object does not exist
#   500 - the archive command could not be started
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # "^{}" peels tags, so a tag pointing at a commit or tree is accepted
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the command before emitting any header, so that a failure to
        # launch it is still reported with an error status instead of being
        # appended to a response that already said "200 OK".
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # escape characters that are special inside a quoted-string
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # Copy the archive in fixed-size chunks rather than reading all of it
        # into memory first; snapshots can be arbitrarily large.
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
5843
# Shared implementation of the log-like views (called by git_log and
# git_history in this file).
#
# Parameters:
#   $fmt_name  - name of the view; passed to format_paging_nav() and
#                git_print_page_nav()
#   $body_subr - code reference that prints the commit list; it is called as
#                $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                             $file_name, $file_hash, $ftype)
#   $base      - revision to list from; defaults to the project's HEAD
#   $parent    - optional; when defined only "$parent..$base" is listed
#   $file_name - optional path that limits the listing (history view)
#   $file_hash - optional object id of $file_name; looked up when missing
#
# Paging uses the global $page (set to 0 when undefined).  parse_commits() is
# asked for 101 entries at offset 100 * $page (presumably count and skip); a
# 101st entry signals that a next page exists.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # List assignment, exactly as in git_commitdiff: this takes the first
        # value of the feature rather than whatever a scalar-context call
        # would yield if gitweb_get_feature returns a list.
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # a negative limit means "unlimited"
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project);
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        # only the first 100 entries (indices 0..99) belong to this page
        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
5917
# Action handler for the 'log' view: delegates to git_log_generic() with
# git_log_body as the body printer, listing from $hash and, when
# $hash_parent is defined, limited to "$hash_parent..$hash".
sub git_log {
        my @generic_args = ('log', \&git_log_body, $hash, $hash_parent);
        return git_log_generic(@generic_args);
}
5922
# Action handler for the 'commit' view.
#
# Displays a single commit ($hash, falling back to $hash_base and then to
# "HEAD"): a navigation bar with parent links, the authorship rows, links to
# the tree and to each parent, the log message, and the list of changed
# files as reported by "git diff-tree".
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
                or die_error(404, "Unknown commit object");

        my $first_parent = $co{'parent'};
        my $parent_ids   = $co{'parents'};      # array reference

        # abbreviated-hash link to the 'commit' view of the given commit
        my $short_commit_link = sub {
                my ($id) = @_;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # the navigation bar has to be built before any parameter munging
        my $formats_nav;
        if (!defined $first_parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parent_ids == 1) {
                # single parent commit
                $formats_nav = '(parent: ' . $short_commit_link->($first_parent) . ')';
        } else {
                # merge commit
                my @parent_links = map { $short_commit_link->($_) } @$parent_ids;
                $formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parent_ids <= 1) {
                my $patch_link =
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
                $formats_nav .= " | " . $patch_link;
        }

        # what to diff against: merges use the combined format (-c), a
        # parentless commit is diffed with --root, anything else against
        # its only parent
        my $diff_against;
        if (@$parent_ids > 1) {
                $diff_against = '-c';
        } elsif (defined $first_parent) {
                $diff_against = $first_parent;
        } else {
                $diff_against = "--root";
        }
        open my $diff_fh, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts, $diff_against, $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        chomp(my @difftree = <$diff_fh>);
        close $diff_fh or die_error(404, "Reading git-diff-tree failed");

        # a page addressed by a full 40-digit hash (not a symbolic name)
        # can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref_marker = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title_html = esc_html($co{'title'}) . $ref_marker;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title_html, $hash);
        } else {
                git_print_header_div('tree', $title_html, $co{'tree'}, $hash);
        }

        # object header table: authorship, commit id, tree, parents
        print qq{<div class="title_text">\n} .
              qq{<table class="object_header">\n};
        git_print_authorship_rows(\%co);
        print qq{<tr><td>commit</td><td class="sha1">$co{'id'}</td></tr>\n};

        my @tree_target = (action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
        print qq{<tr><td>tree</td><td class="sha1">} .
              $cgi->a({-href => href(@tree_target), class => "list"}, $co{'tree'}) .
              qq{</td><td class="link">} .
              $cgi->a({-href => href(@tree_target)}, "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td></tr>\n";

        for my $parent_id (@$parent_ids) {
                my $id_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$parent_id),
                                 class => "list"}, $parent_id);
                my $commit_view =
                        $cgi->a({-href => href(action=>"commit", hash=>$parent_id)},
                                "commit");
                my $diff_view =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash,
                                               hash_parent=>$parent_id)},
                                "diff");
                print qq{<tr><td>parent</td><td class="sha1">$id_link</td>} .
                      qq{<td class="link">$commit_view | $diff_view</td></tr>\n};
        }
        print qq{</table></div>\n};

        # commit message
        print qq{<div class="page_body">\n};
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parent_ids);

        git_footer_html();
}
6036
# Action handler for the 'object' view: work out the type of the requested
# object and redirect (302) to the view named after that type.
#
# The object is identified either by
#   - $hash or $hash_base alone, or
#   - $hash_base together with $file_name (a path inside that revision).
# Any other combination is rejected with a 400 error.
sub git_object {
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                close $fd
                        or die_error(404, "Object does not exist");
                # nothing is read when cat-file produced no output; check
                # before chomp to avoid operating on an undefined value
                defined $type
                        or die_error(404, "Object does not exist");
                chomp $type;

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
6083
# Action handler for the 'blobdiff' view: show the diff of a single file
# between $hash_parent_base and $hash_base.
#
# Parameter:
#   $format - 'html' (default) or 'plain'; anything else is a 400 error
#
# The file is selected either by $file_name (with optional $file_parent for
# the pre-image path) or, when no name is given, by a full 40-digit $hash
# that is matched against the post-image ids in the raw diff-tree output.
# Requests lacking $hash_base / $hash_parent_base (the legacy URI style) are
# rejected with a 404 error.
sub git_blobdiff {
        my $format = shift || 'html';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /^[0-9a-fA-F]{40}$/) {
                        # try to find filename from $hash; the check above is
                        # anchored so that only a complete object id is ever
                        # interpolated into the pattern below

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status code, like every other die_error() call here
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # escape characters that are special inside a quoted-string,
                # as git_snapshot does for its file name
                my $patch_filename = "$file_name.patch";
                $patch_filename =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_filename . '"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # Rewrite the patch header (everything up to the "+++" line)
                # so that object ids used as file names are replaced by the
                # real paths; the ids are quoted so they match literally.
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
6215
# Action handler for the 'blobdiff_plain' view: the same diff as
# git_blobdiff(), requested in its 'plain' output format.
sub git_blobdiff_plain {
        my $output_format = 'plain';
        return git_blobdiff($output_format);
}
6219
# Action handler for the 'commitdiff' family of views.
#
# Named parameters (passed as a flat key/value list):
#   -format - 'html' (default), 'plain' or 'patch'; anything else is a 400
#             error
#   -single - only used with 'patch' and no $hash_parent: emit exactly one
#             patch instead of up to the 'patches' feature limit
#
# The commit is $hash (falling back to $hash_base, then "HEAD"); the other
# side of the diff is $hash_parent when given.  The 'patch' format is
# refused with a 403 error when the 'patches' feature is off.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of them
                        for my $i (0 .. $#{$co{'parents'}}) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$hash_parent)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$co{'parent'})},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$_)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                # NOTE(review): for a merge requested without hash_parent,
                # $hash_parent was set to '--cc' above, so the range below
                # becomes "--cc..$hash" -- confirm whether that is intended.
                my @commit_spec = ();
                if ($hash_parent) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";
                # escape characters that are special inside a quoted-string,
                # as git_snapshot does for its file name
                $filename =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";
                # same quoted-string escaping as in the 'plain' branch
                $filename =~ s/(["\\])/\\$1/g;

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # for combined diffs (and when no parent was given) the body
                # helpers get the full list of parents instead of one commit
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
6444
# Action handler for the 'commitdiff_plain' view: git_commitdiff() in its
# 'plain' output format.
sub git_commitdiff_plain {
        my @diff_args = (-format => 'plain');
        return git_commitdiff(@diff_args);
}
6448
6449# format-patch-style patches
# Action handler for the 'patch' view: git_commitdiff() in 'patch' format
# with the -single flag set.
sub git_patch {
        my @diff_args = (-format => 'patch', -single => 1);
        return git_commitdiff(@diff_args);
}
6453
# Action handler for the 'patches' view: git_commitdiff() in 'patch' format,
# without the -single flag.
sub git_patches {
        my @diff_args = (-format => 'patch');
        return git_commitdiff(@diff_args);
}
6457
# Action handler for the 'history' view: delegates to git_log_generic() with
# git_history_body as the body printer, listing from $hash_base (optionally
# limited by $hash_parent_base) for the path $file_name, whose object id is
# passed as $hash.
sub git_history {
        my @generic_args = (
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
        return git_log_generic(@generic_args);
}
6463
# Search the project for $searchtext and print the result page.
#
# The kind of search is selected by $searchtype (defaults to 'commit'):
#   commit, author, committer - commits matching the text, found through
#                               parse_commits() and shown 100 per page
#   pickaxe                   - output of "git log -S<text>": the commits
#                               found, each with the files it touched
#   grep                      - output of "git grep" run on the tree of
#                               commit $hash; the listing is cut off after
#                               roughly 1000 matches
#
# Works on the request globals ($searchtext, $searchtype, $search_use_regexp,
# $search_regexp, $hash, $page, $project); $hash defaults to the head of
# $project and $page to 0.
#
# Ends the request through die_error() when the 'search' feature (or the
# 'pickaxe' / 'grep' feature needed by the chosen search type) is disabled
# (403), when $searchtext is undefined (400), or when $hash does not parse
# as a commit (404).
sub git_search {
        gitweb_check_feature('search') or die_error(403, "Search is disabled");
        if (!defined $searchtext) {
                die_error(400, "Text field is empty");
        }
        if (!defined $hash) {
                $hash = git_get_head_hash($project);
        }
        my %co = parse_commit($hash);
        if (!%co) {
                die_error(404, "Unknown commit object");
        }
        if (!defined $page) {
                $page = 0;
        }

        $searchtype ||= 'commit';
        if ($searchtype eq 'pickaxe') {
                # pickaxe may take all resources of your box and run for several minutes
                # with every query - so decide by yourself how public you make this feature
                gitweb_check_feature('pickaxe')
                    or die_error(403, "Pickaxe is disabled");
        }
        if ($searchtype eq 'grep') {
                gitweb_check_feature('grep')
                    or die_error(403, "Grep is disabled");
        }

        git_header_html();

        if ($searchtype eq 'commit' or $searchtype eq 'author' or $searchtype eq 'committer') {
                my $greptype;
                if ($searchtype eq 'commit') {
                        $greptype = "--grep=";
                } elsif ($searchtype eq 'author') {
                        $greptype = "--author=";
                } elsif ($searchtype eq 'committer') {
                        $greptype = "--committer=";
                }
                $greptype .= $searchtext;
                # ask for one commit more than a page holds (101), so that we
                # know whether there is a next page to link to
                my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                               $greptype, '--regexp-ignore-case',
                                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

                my $paging_nav = '';
                if ($page > 0) {
                        $paging_nav .=
                                $cgi->a({-href => href(action=>"search", hash=>$hash,
                                                       searchtext=>$searchtext,
                                                       searchtype=>$searchtype)},
                                        "first");
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                } else {
                        $paging_nav .= "first";
                        $paging_nav .= " &sdot; prev";
                }
                my $next_link = '';
                if ($#commitlist >= 100) {
                        $next_link =
                                $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                         -accesskey => "n", -title => "Alt-n"}, "next");
                        $paging_nav .= " &sdot; $next_link";
                } else {
                        $paging_nav .= " &sdot; next";
                }

                git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);
                if ($page == 0 && !@commitlist) {
                        print "<p>No match.</p>\n";
                } else {
                        git_search_grep_body(\@commitlist, 0, 99, $next_link);
                }
        }

        if ($searchtype eq 'pickaxe') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                # Closes the table row of the commit currently held in %co:
                # ends the cell with the file list and adds the cell with the
                # "commit | tree" links.  Does nothing while %co is empty,
                # i.e. before the first commit has been seen.
                my $finish_commit_row = sub {
                        return unless %co;
                        print "</td>\n" .
                              "<td class=\"link\">" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                              " | " .
                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                        print "</td>\n" .
                              "</tr>\n";
                };

                print "<table class=\"pickaxe search\">\n";
                my $alternate = 1;
                local $/ = "\n";
                open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                        '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                        ($search_use_regexp ? '--pickaxe-regex' : ());
                # from here on %co holds the commit whose row is being printed
                undef %co;
                my @files;
                while (my $line = <$fd>) {
                        chomp $line;
                        next unless $line;

                        my %set = parse_difftree_raw_line($line);
                        if (defined $set{'commit'}) {
                                # a new commit starts: finish previous one first
                                $finish_commit_row->();

                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                %co = parse_commit($set{'commit'});
                                my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                                      "<td><i>$author</i></td>\n" .
                                      "<td>" .
                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                              -class => "list subject"},
                                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        } elsif (defined $set{'to_id'}) {
                                # an all-zero id: nothing to link to on the "to" side
                                next if ($set{'to_id'} =~ m/^0{40}$/);

                                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                              -class => "list"},
                                              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                                      "<br/>\n";
                        }
                }
                close $fd;

                # finish last commit
                $finish_commit_row->();

                print "</table>\n";
        }

        if ($searchtype eq 'grep') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"grep_search\">\n";
                my $alternate = 1;
                my $matches = 0;
                local $/ = "\n";
                open my $fd, "-|", git_cmd(), 'grep', '-n',
                        $search_use_regexp ? ('-E', '-i') : '-F',
                        $searchtext, $co{'tree'};
                my $lastfile = '';
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($file, $lno, $ltext, $binary);
                        last if ($matches++ > 1000);
                        if ($line =~ /^Binary file (.+) matches$/) {
                                $file = $1;
                                $binary = 1;
                        } else {
                                # first colon-separated field is skipped
                                (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
                        }
                        if ($file ne $lastfile) {
                                # matches are grouped per file: one table row each
                                $lastfile and print "</td></tr>\n";
                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                # link to the file as of the commit that was searched
                                print "<td class=\"list\">".
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file"),
                                                -class => "list"}, esc_path($file));
                                print "</td><td>\n";
                                $lastfile = $file;
                        }
                        if ($binary) {
                                print "<div class=\"binary\">Binary file</div>\n";
                        } else {
                                $ltext = untabify($ltext);
                                # wrap the matched part of the line in a "match" span
                                if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                        $ltext = esc_html($1, -nbsp=>1);
                                        $ltext .= '<span class="match">';
                                        $ltext .= esc_html($2, -nbsp=>1);
                                        $ltext .= '</span>';
                                        $ltext .= esc_html($3, -nbsp=>1);
                                } else {
                                        $ltext = esc_html($ltext, -nbsp=>1);
                                }
                                print "<div class=\"pre\">" .
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file").'#l'.$lno,
                                                -class => "linenr"}, sprintf('%4i', $lno))
                                        . ' ' .  $ltext . "</div>\n";
                        }
                }
                if ($lastfile) {
                        print "</td></tr>\n";
                        if ($matches > 1000) {
                                print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                        }
                } else {
                        print "<div class=\"diff nodifferences\">No matches found</div>\n";
                }
                close $fd;

                print "</table>\n";
        }
        git_footer_html();
}
6680
# Print the help page for the search form: a description of how the pattern
# is interpreted, followed by one entry per search type.  The 'grep' and
# 'pickaxe' entries are printed only if the respective feature is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # pattern semantics and the 'commit' search
        print <<EOT;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
EOT

        my $grep_enabled = gitweb_check_feature('grep');
        print <<EOT if $grep_enabled;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
EOT

        # 'author' and 'committer' searches
        print <<EOT;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
EOT

        my $pickaxe_enabled = gitweb_check_feature('pickaxe');
        print <<EOT if $pickaxe_enabled;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
EOT

        print "</dl>\n";
        git_footer_html();
}
6724
# Show the 'shortlog' view: git_log_generic() does the work, printing the
# list body with git_shortlog_body() for the revisions given by the request
# globals $hash and $hash_parent.
sub git_shortlog {
        my @revisions = ($hash, $hash_parent);
        return git_log_generic('shortlog', \&git_shortlog_body, @revisions);
}
6729
6730## ......................................................................
6731## feeds (RSS, Atom; OPML)
6732
# Print a web feed of recent commits.
#
# Parameter: the feed format, 'rss' or 'atom' (default 'atom'); any other
# value ends the request with die_error(400).
#
# The commits come from parse_commits() for $hash (or 'HEAD'), limited to
# $file_name if that is set.  Each feed entry carries the commit message
# and the list of changed files with links to the respective gitweb views.
#
# The HTTP header carries Last-Modified taken from the newest commit.  A
# request whose If-Modified-Since is not older than that commit is answered
# with "304 Not Modified" and no body (this needs HTTP::Date or
# Time::ParseDate to parse the date); a HEAD request gets the header only.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                %latest_date   = parse_date($latest_epoch);
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # use whichever date parsing module is installed;
                        # without one $since stays undefined and the full
                        # feed is sent
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title is built from the site name and request parameters and
        # goes into XML element content below, so it has to be escaped
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (defined $descr) {
                $descr = esc_html($descr);
        } else {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                # the guard has to test the variable that gets printed
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for (my $i = 0; $i <= $#commitlist; $i++) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show the first 20 and, after those,
                # keep going only while commits are more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'});

                # get list of changed files; a commit for which this fails
                # is left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                # entry body, same for both formats: the commit message,
                # then the list of changed files
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        $line = esc_html($line);
                        print "$line\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
6988
# Print the commit feed in RSS format; see git_feed().
sub git_rss {
        my $feed_format = 'rss';
        return git_feed($feed_format);
}
6992
# Print the commit feed in Atom format; see git_feed().
sub git_atom {
        my $feed_format = 'atom';
        return git_feed($feed_format);
}
6996
# Print an OPML document listing the RSS feed of every project returned by
# git_get_projects_list().  Projects for which no head commit can be found
# or parsed are left out.
#
# Note: sets the global $git_dir to each listed project in turn.
sub git_opml {
        my @list = git_get_projects_list();

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        # the site name goes into XML element content, so it must be escaped
        my $title = esc_html($site_name);
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;
                my $head = git_get_head_hash($proj{'path'});
                if (!defined $head) {
                        next;
                }
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                if (!%co) {
                        next;
                }

                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}