gitweb: Time::HiRes is in core for Perl 5.8
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8';
22
# time at which the script started, stored as the [seconds, microseconds]
# pair returned by Time::HiRes::gettimeofday()
our $t0 = [ gettimeofday() ];
# running count of git commands run so far (incremented by the code
# that invokes git)
our $number_of_git_cmds = 0;

BEGIN {
        # when running under mod_perl, ask CGI.pm to precompile its methods
        # at load time
        CGI->compile() if $ENV{'MOD_PERL'};
}

# gitweb version string; "++GIT_VERSION++" looks like a placeholder that
# is substituted when gitweb is built -- TODO confirm against the build
our $version = "++GIT_VERSION++";
31
our ($my_url, $my_uri, $base_url, $path_info, $home_link);
# Derive, from the current CGI request, the URLs gitweb uses to refer to
# itself.  Sets the globals $my_url (full URL), $my_uri (absolute path
# part), $base_url, $path_info and $home_link; takes no arguments.
sub evaluate_uri {
        our $cgi;

        our $my_url = $cgi->url();
        our $my_uri = $cgi->url(-absolute => 1);

        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
        # needed and used only for URLs with nonempty PATH_INFO.
        # It starts out as the (not yet stripped) script URL.
        our $base_url = $my_url;

        # When the script is used as DirectoryIndex, the URL does not contain
        # the name of the script file itself, and $cgi->url() fails to strip
        # PATH_INFO, so it has to be stripped here.  $path_info is global
        # because it is also used later on.
        #
        # In that setup $my_url is not the full script URL.  That is wanted
        # for generated links (they keep implying the script name), but it
        # means $my_url cannot serve as the base URL.  So whenever PATH_INFO
        # had to be stripped from both URLs, the base URL is rebuilt from
        # the server base and SCRIPT_NAME.
        our $path_info = $ENV{"PATH_INFO"};
        if ($path_info) {
                # $my_uri is only stripped if stripping $my_url succeeded
                my $stripped_both =
                        ($my_url =~ s,\Q$path_info\E$,,) &&
                        ($my_uri =~ s,\Q$path_info\E$,,);
                if ($stripped_both && defined $ENV{'SCRIPT_NAME'}) {
                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                }
        }

        # target of the home link on top of all pages
        our $home_link = $my_uri || "/";
}
67
# core git executable to use
# this can just be "git" if your webserver has a sensible PATH
our $GIT = "++GIT_BINDIR++/git";

# absolute filesystem path which will be prepended to the project path
#our $projectroot = "/pub/scm";
our $projectroot = "++GITWEB_PROJECTROOT++";

# filesystem traversal depth limit used when getting the project list;
# the number is relative to $projectroot
our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";

# label of the home link on top of all pages
our $home_link_str = "++GITWEB_HOME_LINK_STR++";

# name of your site or organization to appear in page titles;
# replace this with something more descriptive for clearer bookmarks.
# If the configured name is empty, this falls back to "<SERVER_NAME> Git",
# or to "Untitled Git" when SERVER_NAME is not set in the environment.
our $site_name = "++GITWEB_SITENAME++"
                 || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";

# filename of html text to include at top of each page
our $site_header = "++GITWEB_SITE_HEADER++";
# html text to include on the home page
our $home_text = "++GITWEB_HOMETEXT++";
# filename of html text to include at bottom of each page
our $site_footer = "++GITWEB_SITE_FOOTER++";

# URIs of stylesheets
our @stylesheets = ("++GITWEB_CSS++");
# URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
our $stylesheet = undef;
# URI of GIT logo (72x27 size)
our $logo = "++GITWEB_LOGO++";
# URI of GIT favicon, assumed to be image/png type
our $favicon = "++GITWEB_FAVICON++";
# URI of gitweb.js (JavaScript code for gitweb)
our $javascript = "++GITWEB_JS++";

# URI and label (title) of GIT logo link
#our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
#our $logo_label = "git documentation";
our $logo_url = "http://git-scm.com/";
our $logo_label = "git homepage";

# source of projects list
our $projects_list = "++GITWEB_LIST++";

# the width (in characters) of the projects list "Description" column
our $projects_list_description_width = 25;

# default order of projects list
# valid values are none, project, descr, owner, and age
our $default_projects_order = "project";

# show a repository only if this file exists in it
# (only effective if this variable evaluates to true)
our $export_ok = "++GITWEB_EXPORT_OK++";

# show a repository only if this subroutine returns true
# when given the path to the project, for example:
#    sub { return -e "$_[0]/git-daemon-export-ok"; }
our $export_auth_hook = undef;

# only allow viewing of repositories also shown on the overview page
our $strict_export = "++GITWEB_STRICT_EXPORT++";

# list of git base URLs used to build the URLs a project can be fetched
# from, i.e. the full URL is "$git_base_url/$project";
# an empty configured value yields an empty list
our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");

# default blob_plain mimetype and default charset for text/plain blob
our $default_blob_plain_mimetype = 'text/plain';
our $default_text_plain_charset  = undef;

# file to use for guessing MIME types before trying /etc/mime.types
# (relative to the current git repository)
our $mimetypes_file = undef;

# assume this charset if a line contains non-UTF-8 characters;
# it should be a valid encoding (see Encode::Supported(3pm) for the list)
# in which every byte sequence is valid, for example
# 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
# could even be 'utf-8' for the old behavior)
our $fallback_encoding = 'latin1';

# rename detection options for git-diff and git-diff-tree
# - default is '-M', with the cost proportional to
#   (number of removed files) * (number of new files).
# - more costly is '-C' (which implies '-M'), with the cost proportional to
#   (number of changed files + number of removed files) * (number of new files)
# - even more costly is '-C', '--find-copies-harder' with cost
#   (number of files in the original tree) * (number of new files)
# - one might want to include the '-B' option, e.g. '-B', '-M'
our @diff_opts = ('-M'); # taken from git_commit

# Disables features that would allow repository owners to inject script into
# the gitweb domain.
our $prevent_xss = 0;

# Path to the highlight executable to use (must be the one from
# http://www.andre-simon.de due to assumptions about parameters and output).
# Useful if highlight is not installed on your webserver's PATH.
# [Default: highlight]
our $highlight_bin = "++HIGHLIGHT_BIN++";
172
# information about snapshot formats that gitweb is capable of serving,
# keyed by the short format name used in configuration
our %known_snapshot_formats = (
        # name => {
        #       'display' => display name,
        #       'type' => mime type,
        #       'suffix' => filename suffix,
        #       'format' => --format for git-archive,
        #       'compressor' => [compressor command and arguments]
        #                       (array reference, optional)
        #       'disabled' => boolean (optional)}
        #
        'tgz' => {
                'display' => 'tar.gz',
                'type' => 'application/x-gzip',
                'suffix' => '.tar.gz',
                'format' => 'tar',
                'compressor' => ['gzip']},

        'tbz2' => {
                'display' => 'tar.bz2',
                'type' => 'application/x-bzip2',
                'suffix' => '.tar.bz2',
                'format' => 'tar',
                'compressor' => ['bzip2']},

        # xz is known but marked as disabled here
        'txz' => {
                'display' => 'tar.xz',
                'type' => 'application/x-xz',
                'suffix' => '.tar.xz',
                'format' => 'tar',
                'compressor' => ['xz'],
                'disabled' => 1},

        # zip has no 'compressor' entry
        'zip' => {
                'display' => 'zip',
                'type' => 'application/x-zip',
                'suffix' => '.zip',
                'format' => 'zip'},
);

# Aliases so that old gitweb.snapshot values in repository
# configuration are still understood.
our %known_snapshot_format_aliases = (
        'gzip'  => 'tgz',
        'bzip2' => 'tbz2',
        'xz'    => 'txz',

        # backward compatibility: legacy gitweb config values;
        # these map to undef, i.e. to no known snapshot format
        'x-gzip' => undef, 'gz' => undef,
        'x-bzip2' => undef, 'bz2' => undef,
        'x-zip' => undef, '' => undef,
);
225
# Pixel sizes for icons and avatars. If the default font sizes or line
# heights are changed, it may be appropriate to change these values too via
# $GITWEB_CONFIG.
our %avatar_size = (
        'default' => 16,
        'double'  => 32
);

# Used to set the maximum load that we will still respond to gitweb queries.
# If the server load exceeds this value then return a "503 server busy" error.
# If gitweb cannot determine the server load, it is taken to be 0.
# Leave it undefined (or set to 'undef') to turn off load checking.
our $maxload = 300;

# configuration for 'highlight' (http://www.andre-simon.de/)
# match by basename: file basename => name of syntax
our %highlight_basename = (
        #'Program' => 'py',
        #'Library' => 'py',
        'SConstruct' => 'py', # SCons equivalent of Makefile
        'Makefile' => 'make',
);
# match by extension: file extension => name of syntax
our %highlight_ext = (
        # main extensions, defining name of syntax (each maps to itself);
        # see files in /usr/share/highlight/langDefs/ directory
        map { $_ => $_ }
                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl),
        # alternate extensions, see /etc/highlight/filetypes.conf
        'h' => 'c',
        map { $_ => 'cpp' } qw(cxx c++ cc),
        map { $_ => 'php' } qw(php3 php4),
        map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
        'mak' => 'make',
        map { $_ => 'xml' } qw(xhtml html htm),
);
262
# Site-wide feature defaults are defined here; override them in
# $GITWEB_CONFIG as necessary.
our %feature = (
        # feature => {
        #       'sub' => feature-sub (subroutine),
        #       'override' => allow-override (boolean),
        #       'default' => [ default options...] (array reference)}
        #
        # if a feature is overridable (i.e. allow-override has a true value),
        # then feature-sub will be called with the default options as
        # parameters; the return value of feature-sub indicates whether to
        # enable the specified feature
        #
        # if there is no 'sub' key (no feature-sub), then the feature cannot
        # be overridden
        #
        # use gitweb_get_feature(<feature>) to retrieve the <feature> value
        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
        # is enabled

        # Enable the 'blame' blob view, showing the last commit that modified
        # each line in the file. This can be very CPU-intensive.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'blame'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'blame'}{'override'} = 1;
        # and in project config gitweb.blame = 0|1;
        'blame' => {
                'sub' => sub { feature_bool('blame', @_) },
                'override' => 0,
                'default' => [0]},

        # Enable the 'snapshot' link, providing a compressed archive of any
        # tree. This can potentially generate high traffic if you have large
        # projects.

        # Value is a list of formats defined in %known_snapshot_formats that
        # you wish to offer.
        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'snapshot'}{'default'} = [];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'snapshot'}{'override'} = 1;
        # and in project config, a comma-separated list of formats or "none"
        # to disable.  Example: gitweb.snapshot = tbz2,zip;
        'snapshot' => {
                'sub' => \&feature_snapshot,
                'override' => 0,
                'default' => ['tgz']},

        # Enable text search, which will list the commits which match author,
        # committer or commit text to a given string.  Enabled by default.
        # Project specific override is not supported.
        'search' => {
                'override' => 0,
                'default' => [1]},

        # Enable grep search, which will list the files in the currently
        # selected tree containing the given string. Enabled by default. This
        # can be potentially CPU-intensive, of course.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'grep'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'grep'}{'override'} = 1;
        # and in project config gitweb.grep = 0|1;
        'grep' => {
                'sub' => sub { feature_bool('grep', @_) },
                'override' => 0,
                'default' => [1]},

        # Enable the pickaxe search, which will list the commits that modified
        # a given string in a file. This can be a practical and much faster
        # alternative to 'blame', but is still potentially CPU-intensive.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'override'} = 1;
        # and in project config gitweb.pickaxe = 0|1;
        'pickaxe' => {
                'sub' => sub { feature_bool('pickaxe', @_) },
                'override' => 0,
                'default' => [1]},

        # Enable showing the size of blobs in a 'tree' view, in a separate
        # column, similar to what 'ls -l' does.  This costs a bit of IO.

        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'default'} = [0];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'override'} = 1;
        # and in project config gitweb.showsizes = 0|1;
        # (note: the project config key is 'showsizes', without the hyphen)
        'show-sizes' => {
                'sub' => sub { feature_bool('showsizes', @_) },
                'override' => 0,
                'default' => [1]},

        # Make gitweb use an alternative format of the URLs which can be
        # more readable and natural-looking: the project name is embedded
        # directly in the path and the query string contains other
        # auxiliary information. All gitweb installations recognize
        # URLs in either format; this configures in which format gitweb
        # generates links.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'pathinfo'}{'default'} = [1];
        # Project specific override is not supported.

        # Note that you will need to change the default location of CSS,
        # favicon, logo and possibly other files to an absolute URL. Also,
        # if gitweb.cgi serves as your indexfile, you will need to force
        # $my_uri to contain the script name in your $GITWEB_CONFIG.
        'pathinfo' => {
                'override' => 0,
                'default' => [0]},

        # Make gitweb consider projects in project root subdirectories
        # to be forks of existing projects. Given project $projname.git,
        # projects matching $projname/*.git will not be shown in the main
        # projects list; instead a '+' mark will be added to $projname
        # there and a 'forks' view will be enabled for the project, listing
        # all the forks. If the project list is taken from a file, forks have
        # to be listed after the main project.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'forks'}{'default'} = [1];
        # Project specific override is not supported.
        'forks' => {
                'override' => 0,
                'default' => [0]},

        # Insert custom links into the action bar of all project pages.
        # This mainly enables you to link to third-party scripts integrating
        # into gitweb; e.g. git-browser for graphical history representation
        # or a custom web-based repository administration interface.

        # The 'default' value consists of a list of triplets in the form
        # (label, link, position) where position is the label after which
        # to insert the link and link is a format string where %n expands
        # to the project name, %f to the project path within the filesystem,
        # %h to the current hash (h gitweb parameter) and %b to the current
        # hash base (hb gitweb parameter); %% expands to %.

        # To enable system wide have in $GITWEB_CONFIG e.g.
        # $feature{'actions'}{'default'} = [('graphiclog',
        #       '/git-browser/by-commit.html?r=%n', 'summary')];
        # Project specific override is not supported.
        'actions' => {
                'override' => 0,
                'default' => []},

        # Allow gitweb to scan project content tags described in ctags/
        # of the project repository, and display the popular Web 2.0-ish
        # "tag cloud" near the project list. Note that this is something
        # COMPLETELY different from the normal Git tags.

        # gitweb by itself can show existing tags, but it does not handle
        # tagging itself; you need an external application for that.
        # For an example script, check Girocco's cgi/tagproj.cgi.
        # You may want to install the HTML::TagCloud Perl module to get
        # a pretty tag cloud instead of just a list of tags.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'ctags'}{'default'} = ['path_to_tag_script'];
        # Project specific override is not supported.
        'ctags' => {
                'override' => 0,
                'default' => [0]},

        # The maximum number of patches in a patchset generated in patch
        # view. Set this to 0 or undef to disable patch view, or to a
        # negative number to remove any limit.

        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'patches'}{'default'} = [0];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'patches'}{'override'} = 1;
        # and in project config gitweb.patches = 0|n;
        # where n is the maximum number of patches allowed in a patchset.
        'patches' => {
                'sub' => \&feature_patches,
                'override' => 0,
                'default' => [16]},

        # Avatar support. When this feature is enabled, views such as
        # shortlog or commit will display an avatar associated with
        # the email of the committer(s) and/or author(s).

        # Currently available providers are gravatar and picon.
        # If an unknown provider is specified, the feature is disabled.

        # Gravatar depends on Digest::MD5.
        # Picon currently relies on the indiana.edu database.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'avatar'}{'default'} = ['<provider>'];
        # where <provider> is either gravatar or picon.
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'avatar'}{'override'} = 1;
        # and in project config gitweb.avatar = <provider>;
        'avatar' => {
                'sub' => \&feature_avatar,
                'override' => 0,
                'default' => ['']},

        # Enable displaying how much time and how many git commands
        # it took to generate and display the page.  Disabled by default.
        # Project specific override is not supported.
        'timed' => {
                'override' => 0,
                'default' => [0]},

        # Enable turning some links into links to actions which require
        # JavaScript to run (like 'blame_incremental').  Not enabled by
        # default.  Project specific override is currently not supported.
        'javascript-actions' => {
                'override' => 0,
                'default' => [0]},

        # Syntax highlighting support. This is based on Daniel Svensson's
        # and Sham Chukoury's work in gitweb-xmms2.git.
        # It requires the 'highlight' program to be present in $PATH,
        # and therefore is disabled by default.

        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'highlight'}{'default'} = [1];

        'highlight' => {
                'sub' => sub { feature_bool('highlight', @_) },
                'override' => 0,
                'default' => [0]},
);
495
# Return the value (a list) of the feature called $name.
#
# Returns nothing for a name that is not a key of %feature.  The site-wide
# defaults are returned unless the feature allows overriding AND a project
# is selected ($git_dir is defined); in that case the feature's 'sub' is
# called with the defaults and its result is returned.  A feature marked
# overridable but lacking a 'sub' produces a warning and the defaults.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $spec     = $feature{$name};
        my @defaults = @{ $spec->{'default'} };

        # project specific override is possible only if we have project
        our $git_dir; # global variable, declared later
        return @defaults
                unless $spec->{'override'} && defined $git_dir;

        my $feature_sub = $spec->{'sub'};
        unless (defined $feature_sub) {
                warn "feature $name is not overridable";
                return @defaults;
        }
        return $feature_sub->(@defaults);
}
514
# Convenience wrapper returning only the first element of a feature's
# value, for features that are simple on/off (or single-valued) settings.
# It lets you write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# rather than
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
        my @values = gitweb_get_feature(@_);
        # an empty feature value yields an empty list in list context
        # (undef in scalar context), just like a slice of an empty list
        return @values ? $values[0] : ();
}
529
530
# Feature-sub for boolean features: look up the project config key $key
# as a boolean and translate it to (1) or (0).  The remaining arguments are
# the site-wide defaults; the first of them is returned when the project
# does not set the key.
sub feature_bool {
        my $key = shift;
        my ($project_setting) = git_get_project_config($key, '--bool');

        # not configured for this project: keep the site-wide default
        return ($_[0]) unless defined $project_setting;

        return (1) if $project_setting eq 'true';
        return (0) if $project_setting eq 'false';
}
543
# Feature-sub for 'snapshot': the arguments are the site-wide default
# formats.  A true project config value 'snapshot' replaces them: "none"
# means no formats at all, anything else is split on commas and/or
# whitespace into a list of format names.
sub feature_snapshot {
        my @site_formats = @_;

        my ($configured) = git_get_project_config('snapshot');

        # no (or false) project setting: the site-wide list stands
        return @site_formats unless $configured;

        my @project_formats;
        @project_formats = split /\s*[,\s]\s*/, $configured
                unless $configured eq 'none';

        return @project_formats;
}
555
# Feature-sub for 'patches': return the project config value 'patches'
# (read with '--int') when the lookup yields anything, otherwise the first
# of the site-wide defaults passed as arguments.
sub feature_patches {
        my ($site_default) = @_;
        my @project_limit = (git_get_project_config('patches', '--int'));

        return @project_limit ? @project_limit : ($site_default);
}
565
# Feature-sub for 'avatar': return the project config value 'avatar' when
# the lookup yields anything, otherwise the site-wide defaults passed as
# arguments.
sub feature_avatar {
        my @project_provider = (git_get_project_config('avatar'));

        if (@project_provider) {
                return @project_provider;
        }
        return @_;
}
571
# Return true if directory $dir has a usable HEAD.
#
# Checking the HEAD file with -e alone is fragile if the repository was
# initialized a long time ago (i.e. HEAD is a symlink) and was pack-ref'ed
# and then pruned: the symlink then dangles.  Such a dangling symlink is
# still accepted as long as it points into refs/heads/.
sub check_head_link {
        my ($dir) = @_;
        my $head_path = "$dir/HEAD";

        # usual case: HEAD exists (for a symlink: its target exists)
        my $head_exists = -e $head_path;
        return $head_exists if $head_exists;

        # otherwise accept only a symlink whose target names a branch
        return (-l $head_path && readlink($head_path) =~ /^refs\/heads\//);
}
581
# Return true if the repository in directory $dir may be shown, i.e. if
# all of the following hold:
#  - it has a usable HEAD (see check_head_link),
#  - $export_ok is unset, or the file "$dir/$export_ok" exists,
#  - $export_auth_hook is unset, or the hook returns true for $dir.
# The checks run in this order and stop at the first one that fails.
sub check_export_ok {
        my ($dir) = @_;

        # each guard hands back the failing check's own false value
        my $has_head = check_head_link($dir);
        return $has_head unless $has_head;

        my $marker_ok = (!$export_ok || -e "$dir/$export_ok");
        return $marker_ok unless $marker_ok;

        return (!$export_auth_hook || $export_auth_hook->($dir));
}
588
# Normalize a list of snapshot format names.
#
# Alternate names are translated through %known_snapshot_format_aliases
# for backward compatibility, then everything that is not a key of
# %known_snapshot_formats, or is marked 'disabled' there, is dropped.
# Returns the list of remaining format names, in their original order.
sub filter_snapshot_fmts {
        # undefined names cannot match anything; dropping them up front
        # avoids "uninitialized value" warnings in the hash lookups below
        my @fmts = grep { defined } @_;

        @fmts = map {
                exists $known_snapshot_format_aliases{$_} ?
                       $known_snapshot_format_aliases{$_} : $_} @fmts;
        # legacy aliases map to undef, so test definedness before using
        # the name as a hash key
        @fmts = grep {
                defined $_ &&
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}} @fmts;

        return @fmts;
}
601
our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);
# Locate and execute the gitweb configuration file.
#
# The per-instance file ($ENV{'GITWEB_CONFIG'}, or the built-in default) is
# preferred; the system-wide file ($ENV{'GITWEB_CONFIG_SYSTEM'}, or the
# built-in default) is used only when the former does not exist.  At most
# one file is executed.  Dies if executing the chosen file left an error
# in $@.
sub evaluate_gitweb_config {
        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";

        for my $config_file ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                next unless -e $config_file;

                do $config_file;
                # die if there are errors parsing config file
                die $@ if $@;

                # only the first existing file is used
                last;
        }
}
615
# Get loadavg of system, to compare against $maxload.
# Currently it requires '/proc/loadavg' to be present to get loadavg;
# if it is not present (or cannot be opened, or is empty) it returns 0,
# which means no load checking.
sub get_loadavg {
        if( -e '/proc/loadavg' ){
                open my $fd, '<', '/proc/loadavg'
                        or return 0;
                my $line = <$fd>;
                close $fd;

                # nothing could be read: treat the load as unknown rather
                # than splitting an undefined value
                return 0 unless defined $line;

                # The first three columns measure CPU and IO utilization of the last one,
                # five, and 10 minute periods.  The fourth column shows the number of
                # currently running processes and the total number of processes in the m/n
                # format.  The last column displays the last process ID used.
                my @load = split(/\s+/, $line);
                return $load[0] || 0;
        }
        # additional checks for load average should go here for things that don't export
        # /proc/loadavg

        return 0;
}
637
# version of the core git binary
our $git_version;
# Run "$GIT --version" and store the reported version in $git_version
# ("unknown" if the output does not contain "git version ...").
# Counts as one git command in $number_of_git_cmds.
sub evaluate_git_version {
        my $version_output = qx("$GIT" --version);

        our $git_version = "unknown";
        if ($version_output =~ m/git version (.*)$/) {
                $git_version = $1;
        }
        $number_of_git_cmds++;
}
644
# Refuse the request with a 503 error when load checking is enabled
# ($maxload is defined) and the current load average exceeds $maxload.
sub check_loadavg {
        die_error(503, "The load average on the server is too high")
                if defined $maxload && get_loadavg() > $maxload;
}
650
# ======================================================================
# input validation and dispatch

# input parameters can be collected from a variety of sources (presently, CGI
# and PATH_INFO), so we define an %input_params hash that collects them all
# together during validation: this allows subsequent uses (e.g. href()) to be
# agnostic of the parameter origin

our %input_params = ();

# input parameters are stored with the long parameter name as key. This will
# also be used in the href subroutine to convert parameters to their CGI
# equivalent, and since the href() usage is the most frequent one, we store
# the name -> CGI key mapping here, instead of the reverse.
#
# XXX: Warning: If you touch this, check whether the search form needs
# updating, too.

# kept as an ordered list (long name => CGI key pairs) in addition to the
# hash built from it below
our @cgi_param_mapping = (
        project => "p",
        action => "a",
        file_name => "f",
        file_parent => "fp",
        hash => "h",
        hash_parent => "hp",
        hash_base => "hb",
        hash_parent_base => "hpb",
        page => "pg",
        order => "o",
        searchtext => "s",
        searchtype => "st",
        snapshot_format => "sf",
        extra_options => "opt",
        search_use_regexp => "sr",
        # this must be the last entry (for manipulation from JavaScript)
        javascript => "js"
);
# the same mapping as a hash, for lookup by long parameter name
our %cgi_param_mapping = @cgi_param_mapping;

# we will also need to know the possible actions, for validation;
# maps each action name to the subroutine handling it
our %actions = (
        "blame" => \&git_blame,
        "blame_incremental" => \&git_blame_incremental,
        "blame_data" => \&git_blame_data,
        "blobdiff" => \&git_blobdiff,
        "blobdiff_plain" => \&git_blobdiff_plain,
        "blob" => \&git_blob,
        "blob_plain" => \&git_blob_plain,
        "commitdiff" => \&git_commitdiff,
        "commitdiff_plain" => \&git_commitdiff_plain,
        "commit" => \&git_commit,
        "forks" => \&git_forks,
        "heads" => \&git_heads,
        "history" => \&git_history,
        "log" => \&git_log,
        "patch" => \&git_patch,
        "patches" => \&git_patches,
        "rss" => \&git_rss,
        "atom" => \&git_atom,
        "search" => \&git_search,
        "search_help" => \&git_search_help,
        "shortlog" => \&git_shortlog,
        "summary" => \&git_summary,
        "tag" => \&git_tag,
        "tags" => \&git_tags,
        "tree" => \&git_tree,
        "snapshot" => \&git_snapshot,
        "object" => \&git_object,
        # those below don't need $project
        "opml" => \&git_opml,
        "project_list" => \&git_project_list,
        "project_index" => \&git_project_index,
);

# finally, we have the hash of allowed extra_options for the commands that
# allow them: option => list of actions accepting that option
our %allowed_options = (
        "--no-merges" => [ qw(rss atom log shortlog history) ],
);
730
# fill %input_params with the CGI parameters. All values except for 'opt'
# should be single values, but opt can be an array. We should probably
# build an array of parameters that can be multi-valued, but since for the time
# being it's only this one, we just single it out.
#
# Every long name in %cgi_param_mapping gets an entry in %input_params:
# an array reference for 'opt', and a scalar (undef when the parameter is
# absent) for everything else.
sub evaluate_query_params {
        our $cgi;

        # Calling param() in list context is deprecated in newer CGI.pm
        # releases and triggers a warning there; multi_param() is the
        # replacement, but older releases do not have it.
        my $multi_param = $cgi->can('multi_param') ? 'multi_param' : 'param';

        # keys() rather than each(): no iterator state is left behind on
        # the shared global hash
        for my $name (keys %cgi_param_mapping) {
                my $symbol = $cgi_param_mapping{$name};
                if ($symbol eq 'opt') {
                        $input_params{$name} = [ $cgi->$multi_param($symbol) ];
                } else {
                        # scalar assignment: param() is called in scalar context
                        $input_params{$name} = $cgi->param($symbol);
                }
        }
}
746
# now read PATH_INFO and update the parameter list for missing parameters
#
# Works on the global $path_info (which is modified in place) and on
# %input_params.  Nothing is done when the project was already given, and
# only the project is filled in when an action was given in the query
# string.  Otherwise PATH_INFO is taken apart as
#   $project[/$action][/[$parent_ref[:$parent_path]..]$ref[:$path]]
# and each piece is stored in %input_params unless that entry is already
# set.  For the snapshot action a trailing format suffix is additionally
# split off the hash (see below).
sub evaluate_path_info {
        return if defined $input_params{'project'};
        return if !$path_info;
        $path_info =~ s,^/+,,;
        return if !$path_info;

        # find which part of PATH_INFO is project: drop trailing path
        # components until what is left passes check_head_link()
        my $project = $path_info;
        $project =~ s,/+$,,;
        while ($project && !check_head_link("$projectroot/$project")) {
                $project =~ s,/*[^/]*$,,;
        }
        return unless $project;
        $input_params{'project'} = $project;

        # do not change any parameters if an action is given using the query string
        return if $input_params{'action'};
        $path_info =~ s,^\Q$project\E/*,,;

        # next, check if we have an action
        my $action = $path_info;
        $action =~ s,/.*$,,;
        if (exists $actions{$action}) {
                # the action name is data, not a pattern, so quote it
                $path_info =~ s,^\Q$action\E/*,,;
                $input_params{'action'} = $action;
        }

        # list of actions that want hash_base instead of hash, but can have no
        # pathname (f) parameter
        my @wants_base = (
                'tree',
                'history',
        );
        # true if the action currently selected is one of @wants_base;
        # an unset action never is (and must not be compared as a string)
        my $action_wants_base = sub {
                my $current = $input_params{'action'};
                return defined $current &&
                        scalar(grep { $_ eq $current } @wants_base);
        };

        # we want to catch, among others
        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
        my ($parentrefname, $parentpathname, $refname, $pathname) =
                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

        # first, analyze the 'current' part
        if (defined $pathname) {
                # we got "branch:filename" or "branch:dir/"
                # we could use git_get_type(branch:pathname), but:
                # - it needs $git_dir
                # - it does a git() call
                # - the convention of terminating directories with a slash
                #   makes it superfluous
                # - embedding the action in the PATH_INFO would make it even
                #   more superfluous
                $pathname =~ s,^/+,,;
                if (!$pathname || substr($pathname, -1) eq "/") {
                        $input_params{'action'} ||= "tree";
                        $pathname =~ s,/$,,;
                } else {
                        # the default action depends on whether we had parent info
                        # or not
                        if ($parentrefname) {
                                $input_params{'action'} ||= "blobdiff_plain";
                        } else {
                                $input_params{'action'} ||= "blob_plain";
                        }
                }
                $input_params{'hash_base'} ||= $refname;
                $input_params{'file_name'} ||= $pathname;
        } elsif (defined $refname) {
                # we got "branch". In this case we have to choose if we have to
                # set hash or hash_base.
                #
                # Most of the actions without a pathname only want hash to be
                # set, except for the ones specified in @wants_base that want
                # hash_base instead. It should also be noted that hand-crafted
                # links having 'history' as an action and no pathname or hash
                # set will fail, but that happens regardless of PATH_INFO.
                if (defined $parentrefname) {
                        # if there is parent let the default be 'shortlog' action
                        # (for http://git.example.com/repo.git/A..B links); if there
                        # is no parent, dispatch will detect type of object and set
                        # action appropriately if required (if action is not set)
                        $input_params{'action'} ||= "shortlog";
                }
                if ($action_wants_base->()) {
                        $input_params{'hash_base'} ||= $refname;
                } else {
                        $input_params{'hash'} ||= $refname;
                }
        }

        # next, handle the 'parent' part, if present
        if (defined $parentrefname) {
                # a missing pathspec defaults to the 'current' filename, allowing e.g.
                # someproject/blobdiff/oldrev..newrev:/filename
                if ($parentpathname) {
                        $parentpathname =~ s,^/+,,;
                        $parentpathname =~ s,/$,,;
                        $input_params{'file_parent'} ||= $parentpathname;
                } else {
                        $input_params{'file_parent'} ||= $input_params{'file_name'};
                }
                # we assume that hash_parent_base is wanted if a path was specified,
                # or if the action wants hash_base instead of hash
                if (defined $input_params{'file_parent'} || $action_wants_base->()) {
                        $input_params{'hash_parent_base'} ||= $parentrefname;
                } else {
                        $input_params{'hash_parent'} ||= $parentrefname;
                }
        }

        # for the snapshot action, we allow URLs in the form
        # $project/snapshot/$hash.ext
        # where .ext determines the snapshot and gets removed from the
        # passed $refname to provide the $hash.
        #
        # To be able to tell that $refname includes the format extension, we
        # require the following two conditions to be satisfied:
        # - the hash input parameter MUST have been set from the $refname part
        #   of the URL (i.e. they must be equal)
        # - the snapshot format MUST NOT have been defined already (e.g. from
        #   CGI parameter sf)
        # It's also useless to try any matching unless $refname has a dot,
        # so we check for that too
        if (defined $input_params{'action'} &&
                $input_params{'action'} eq 'snapshot' &&
                defined $refname && index($refname, '.') != -1 &&
                defined $input_params{'hash'} &&
                $refname eq $input_params{'hash'} &&
                !defined $input_params{'snapshot_format'}) {
                # We loop over the known snapshot formats, checking for
                # extensions. Allowed extensions are both the defined suffix
                # (which includes the initial dot already) and the snapshot
                # format key itself, with a prepended dot.
                #
                # The loop is left early on the first match, so iterate over
                # keys() rather than each(): an abandoned each() would leave
                # the hash iterator half-way for the next request served by
                # the same (FastCGI, mod_perl) process.
                foreach my $fmt (keys %known_snapshot_formats) {
                        my $opt = $known_snapshot_formats{$fmt};
                        my $hash = $refname;
                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
                                next;
                        }
                        my $sfx = $1;
                        # a valid suffix was found, so set the snapshot format
                        # and reset the hash parameter
                        $input_params{'snapshot_format'} = $fmt;
                        $input_params{'hash'} = $hash;
                        # we also set the format suffix to the one requested
                        # in the URL: this way a request for e.g. .tgz returns
                        # a .tgz instead of a .tar.gz
                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
                        last;
                }
        }
}
897
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp);
# Copy the request parameters from %input_params into the package
# variables declared above, validating each of them on the way.  An
# invalid value is reported through die_error(): 400 for malformed
# parameters, 404 for a project that does not validate, 403 for a search
# text shorter than two characters.
sub evaluate_and_validate_params {
        our $action = $input_params{'action'};
        if (defined $action && !validate_action($action)) {
                die_error(400, "Invalid action parameter");
        }

        # parameters which are pathnames
        our $project = $input_params{'project'};
        if (defined $project && !validate_project($project)) {
                # forget the bogus name before the error is reported
                undef $project;
                die_error(404, "No such project");
        }

        our $file_name = $input_params{'file_name'};
        if (defined $file_name && !validate_pathname($file_name)) {
                die_error(400, "Invalid file parameter");
        }

        our $file_parent = $input_params{'file_parent'};
        if (defined $file_parent && !validate_pathname($file_parent)) {
                die_error(400, "Invalid file parent parameter");
        }

        # parameters which are refnames
        our $hash = $input_params{'hash'};
        if (defined $hash && !validate_refname($hash)) {
                die_error(400, "Invalid hash parameter");
        }

        our $hash_parent = $input_params{'hash_parent'};
        if (defined $hash_parent && !validate_refname($hash_parent)) {
                die_error(400, "Invalid hash parent parameter");
        }

        our $hash_base = $input_params{'hash_base'};
        if (defined $hash_base && !validate_refname($hash_base)) {
                die_error(400, "Invalid hash base parameter");
        }

        # 'extra_options' is expected to hold an array reference (possibly
        # an empty one); fall back to an empty list if it was never set
        # instead of dying on the dereference
        our @extra_options = @{ $input_params{'extra_options'} || [] };
        foreach my $opt (@extra_options) {
                if (not exists $allowed_options{$opt}) {
                        die_error(400, "Invalid option parameter");
                }
                # an option is only valid together with one of its allowed
                # actions; compare as plain strings, and treat a missing
                # action as "not allowed" rather than interpolating undef
                # into a regexp
                if (!defined $action ||
                    !grep { $_ eq $action } @{$allowed_options{$opt}}) {
                        die_error(400, "Invalid option parameter for this action");
                }
        }

        our $hash_parent_base = $input_params{'hash_parent_base'};
        if (defined $hash_parent_base && !validate_refname($hash_parent_base)) {
                die_error(400, "Invalid hash parent base parameter");
        }

        # other parameters
        our $page = $input_params{'page'};
        if (defined $page && $page =~ m/[^0-9]/) {
                die_error(400, "Invalid page parameter");
        }

        our $searchtype = $input_params{'searchtype'};
        if (defined $searchtype && $searchtype =~ m/[^a-z]/) {
                die_error(400, "Invalid searchtype parameter");
        }

        our $search_use_regexp = $input_params{'search_use_regexp'};

        our $searchtext = $input_params{'searchtext'};
        our $search_regexp;
        if (defined $searchtext) {
                if (length($searchtext) < 2) {
                        die_error(403, "At least two characters are required for search parameter");
                }
                # the text is used verbatim as a pattern only when regexp
                # search was requested, otherwise it is quoted
                $search_regexp = $search_use_regexp ? $searchtext : quotemeta $searchtext;
        }
}
1000
# path to the current git repository
our $git_dir;
# Point $git_dir at the selected project below $projectroot; it is left
# untouched when no project is selected.
sub evaluate_git_dir {
        if ($project) {
                our $git_dir = join('/', $projectroot, $project);
        }
}
1006
our (@snapshot_fmts, $git_avatar);
# Read the 'snapshot' and 'avatar' features and store the usable part of
# them in @snapshot_fmts and $git_avatar.
sub configure_gitweb_features {
        # list of supported snapshot formats
        our @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # are available; in every other case $git_avatar is reset to the
        # empty string.
        our ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'gravatar') {
                # gravatar needs Digest::MD5
                my $have_md5 = eval { require Digest::MD5; 1; };
                $git_avatar = '' if !$have_md5;
        } elsif ($git_avatar ne 'picon') {
                # picon has no dependencies; anything else is unknown
                $git_avatar = '';
        }
}
1026
# Error handler installed through CGI::Carp::set_message(): a plain
# 'die <message>' ends up here and is shown as Internal Server Error.
sub handle_errors_html {
        my ($msg) = @_; # it is already HTML escaped

        # Switch back to a plain message first: should die_error itself
        # fail, this keeps handle_errors_html from being entered again
        # (which would loop forever).
        set_message("Error occured when inside die_error:\n$msg");

        # The handler set via CGI::Carp::set_message runs _after_ the HTTP
        # headers were written, so die_error must neither print them nor
        # try to jump out of the error handler.
        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1041
# dispatch
#
# Pick a default for $action when the request did not name one, check
# that the action is known and has the project it needs, then call its
# handler from %actions.
sub dispatch {
        unless (defined $action) {
                # the kind of object asked for decides the default action;
                # with no object at all show the project or the project list
                $action =
                          defined $hash
                                ? git_get_type($hash)
                        : (defined $hash_base && defined $file_name)
                                ? git_get_type("$hash_base:$file_name")
                        : defined $project
                                ? 'summary'
                                : 'project_list';
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # every action but these three operates on a project
        my $needs_project = $action !~ m/^(?:opml|project_list|project_index)$/;
        die_error(400, "Project needed")
                if $needs_project && !$project;

        $actions{$action}->();
}
1064
# Restart the per-request bookkeeping: the start time (only if timing is
# in use, i.e. $t0 is defined) and the count of git commands run.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        if (defined $t0) {
                $t0 = [ gettimeofday() ];
        }
        $number_of_git_cmds = 0;
}
1070
# Serve one request: reset the timer, evaluate configuration and request
# parameters in order, then hand over to dispatch().
sub run_request {
        reset_timer();

        evaluate_uri();
        evaluate_gitweb_config();
        check_loadavg();

        # the gitweb config file evaluated above might have set
        # $projectroot and $projects_list; default the latter to the former
        $projects_list = $projectroot unless $projects_list;

        # request parameters: query string first, PATH_INFO fills the gaps
        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1090
# State of the request loop in run(): the current CGI object, the class
# used to create it, optional hooks, and the test that ends the loop
# (by default after the very first request).
our $cgi;
our $CGI = 'CGI';
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $is_last_request = sub { return 1 };
# Switch the request loop to FastCGI: requests are created by CGI::Fast
# and the loop ends once more than 100 of them have been counted.
sub configure_as_fcgi {
        require CGI::Fast;
        our ($CGI, $is_last_request);
        $CGI = 'CGI::Fast';

        # let each child service 100 requests
        my $served = 0;
        $is_last_request = sub {
                $served++;
                return $served > 100;
        };
}
# Work out how gitweb was started.  A script name ending in .fcgi turns
# on FastCGI mode; command line arguments, if there are any, are parsed
# for --fastcgi and --nproc.
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # --nproc=N: have FCGI::ProcManager handle N processes through the
        # request loop hooks; silently ignored if the module is missing
        my $use_proc_manager = sub {
                my ($arg, $val) = @_;
                return unless eval { require FCGI::ProcManager; 1; };

                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $val,
                });
                our ($pre_listen_hook, $pre_dispatch_hook, $post_dispatch_hook);
                $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1125
# Main loop: set things up once, then create and serve request objects
# until either no new one can be created or $is_last_request says stop.
# Each of the optional hooks is called only if it has been set.
sub run {
        evaluate_argv();
        evaluate_git_version();

        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }

                if ($is_last_request->()) {
                        last REQUEST;
                }
        }

 DONE_GITWEB:
        1;
}
1149
run();

# A pure CGI script serving a single request simply exits here.  If the
# script was wrapped in a subroutine processing requests (e.g. mod_perl
# with ModPerl::Registry, or PSGI with Plack::App::WrapCGI) there is a
# caller, and control has to be handed back to it instead.
exit unless defined caller;
return;
1160
1161 ## ======================================================================
1162 ## action links
1163
# Build a gitweb URL from name => value pairs.
#
# Parameter names are the ones listed in @cgi_param_mapping ('project',
# 'action', 'hash', ...); a value may be an array reference for a
# parameter that is to be repeated.  'project' defaults to the current
# $project.  Returns the URL as a string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take over every parameter of the current request that the
                # caller did not mention
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_url($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot
                # (the action is optional, so check that it is set before
                # comparing it)
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_url($params{'action'}) unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_url($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing '..' could not be told
                                                # apart from the separator, so such a name
                                                # stays a regular parameter
                                                $href .= ":/".esc_url($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_url($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_url($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_url($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_url($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly; @cgi_param_mapping is a flat
        # list of (name, symbol) pairs, walked in its own order
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        return $href;
}
1281
1282
1283 ## ======================================================================
1284 ## validation, quoting/unquoting and escaping
1285
# Return the given action name if it is a key of %actions, undef
# otherwise (also for an empty or missing name).
sub validate_action {
        my ($input) = @_;
        return undef unless $input;
        return exists $actions{$input} ? $input : undef;
}
1291
# Return the given project name if it is acceptable, undef otherwise.
# Acceptable means: a valid pathname, naming a directory below
# $projectroot that passes check_export_ok() and, with $strict_export
# set, also appears in the project list.
sub validate_project {
        my ($input) = @_;
        return undef unless $input;

        return undef unless validate_pathname($input);

        my $dir = "$projectroot/$input";
        return undef unless -d $dir;
        return undef unless check_export_ok($dir);
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1303
# Return the given pathname if it is safe to use, undef otherwise
# (also for an empty or missing pathname).
sub validate_pathname {
        my ($input) = @_;
        return undef unless $input;

        # A path element may be neither empty, '.' nor '..', whether it
        # sits at the beginning, at the end or between slashes; rejecting
        # empty elements rules out leading, trailing and doubled slashes.
        my $has_bad_element = $input =~ m!(^|/)(|\.|\.\.)(/|$)!;
        # no null characters
        my $has_nul = $input =~ m!\0!;

        return undef if $has_bad_element || $has_nul;
        return $input;
}
1319
# Return the given ref name if it is acceptable, undef otherwise (also
# for an empty or missing name).
sub validate_refname {
        my ($input) = @_;
        return undef unless $input;

        # textual hashes are O.K.
        return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

        # it must be correct pathname
        my $refname = validate_pathname($input);
        return undef unless $refname;

        # restrictions on ref name according to git-check-ref-format
        return undef if $refname =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

        return $refname;
}
1336
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Returns undef for undef.  A string that already is in Perl's internal
# form (utf8 flag set) is returned unchanged, so calling this twice on
# the same text is harmless.  Octets that are not well-formed UTF-8 are
# decoded using $fallback_encoding.
sub to_utf8 {
        my $str = shift;
        return undef unless defined $str;

        # utf8::decode() converts in place and returns false if the octets
        # are not well-formed UTF-8, which is what selects the fallback.
        # (utf8::valid() cannot be used for this: it only checks the
        # internal consistency of the string and is true for any octets.)
        if (utf8::is_utf8($str) || utf8::decode($str)) {
                return $str;
        } else {
                return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
        }
}
1350
# Escape a value for use as a CGI parameter.  The slash is deliberately
# left alone, correct or not, because quoted slashes look too horrible
# in bookmarks; spaces become '+'.  Returns undef for undef.
sub esc_param {
        my ($str) = @_;
        return undef unless defined $str;

        $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1360
# Escape a string for use in a URL.  Since it is applied to whole URLs,
# the characters that structure a URL (such as '?', '&', '=' and ';')
# have to be left unquoted; spaces become '+'.  Returns undef for undef.
sub esc_url {
        my ($str) = @_;
        return undef unless defined $str;

        $str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1369
# Prepare text for inclusion in HTML: convert it with to_utf8(), escape
# HTML special characters, and show control characters other than tab
# in the visible form produced by quot_cec().  With -nbsp => 1 spaces
# are turned into &nbsp;.  Returns undef for undef.
sub esc_html {
        my ($str, %opts) = @_;
        return undef unless defined $str;

        my $text = to_utf8($str);
        $text = $cgi->escapeHTML($text);
        $text =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        # tabs are passed through untouched
        $text =~ s|([[:cntrl:]])|(($1 eq "\t") ? $1 : quot_cec($1))|eg;
        return $text;
}
1385
# Prepare a filename for inclusion in HTML: convert it with to_utf8(),
# escape HTML special characters, and show every control character
# (tab included) in the visible form produced by quot_cec().  With
# -nbsp => 1 spaces are turned into &nbsp;.  Returns undef for undef.
sub esc_path {
        my ($str, %opts) = @_;
        return undef unless defined $str;

        my $text = to_utf8($str);
        $text = $cgi->escapeHTML($text);
        $text =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $text =~ s|([[:cntrl:]])|quot_cec($1)|eg;
        return $text;
}
1401
# Make control characters "printable", using character escape codes (CEC)
#
# Takes a single control character and returns its C-like escape code
# (such as '\n'); characters without one are shown as a backslash
# followed by their code as two hex digits.  The result is wrapped in
# <span class="cntrl">, unless -nohtml => 1 is given.
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # zero-pad the hex code: a plain %2x would pad with a space and
        # turn e.g. chr(1) into backslash, space, "1"
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1426
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR)
#
# Takes a single control character and returns a decimal character
# reference to its picture in the Unicode Control Pictures block,
# wrapped in <span class="cntrl"> unless -nohtml => 1 is given.
sub quot_upr {
        my $cntrl = shift;
        my %opts = @_;

        # The pictures for the C0 controls are at U+2400 + code.  DEL
        # (0x7f) does not follow that rule: its picture is U+2421, while
        # U+2400 + 0x7f lies outside the Control Pictures block.
        my $code = ord($cntrl);
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1440
# git may return quoted and escaped filenames
#
# A name wrapped in double quotes has the quotes removed and its
# backslash escapes expanded; any other string is returned as it is.
sub unquote {
        my ($str) = @_;

        # expand what follows a single backslash
        sub unq {
                my ($seq) = @_;
                my %es = ( # character escape codes, aka escape sequences
                        't' => "\t",   # tab            (HT, TAB)
                        'n' => "\n",   # newline        (NL)
                        'r' => "\r",   # return         (CR)
                        'f' => "\f",   # form feed      (FF)
                        'b' => "\b",   # backspace      (BS)
                        'a' => "\a",   # alarm (bell)   (BEL)
                        'e' => "\e",   # escape         (ESC)
                        'v' => "\013", # vertical tab   (VT)
                );

                # octal char sequence
                return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;
                # C escape sequence, aka character escape code
                return $es{$seq} if exists $es{$seq};
                # quoted ordinary character
                return $seq;
        }

        # nothing to do unless the whole string is in double quotes
        return $str unless $str =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}
1476
# escape tabs (convert tabs to spaces)
#
# Each tab is replaced by as many spaces as it takes to reach the next
# multiple of 8 columns.
sub untabify {
        my ($line) = @_;

        my $pos;
        while (($pos = index($line, "\t")) != -1) {
                # between 1 and 8 spaces, depending on the column of the tab
                my $width = 8 - ($pos % 8);
                substr($line, $pos, 1, ' ' x $width);
        }

        return $line;
}
1490
# Count the entries returned by git_get_projects_list() whose 'path'
# equals the given project; the result is 0 (false) if there is none or
# if the list is empty.
sub project_in_list {
        my ($project) = @_;

        my @projects = git_get_projects_list();
        return 0 unless @projects;

        my $matches = grep { $_->{'path'} eq $project } @projects;
        return $matches;
}
1496
1497 ## ----------------------------------------------------------------------
1498 ## HTML aware string manipulation
1499
# Shorten a string to about $len characters, marking the removed part
# with an ellipsis.  The cut is moved by up to $add_len (default 10)
# word characters so that a word is not split if it fits; $where says
# which part is removed: the 'left' one, the 'center', or (the default)
# the 'right' one.  A string that would not become shorter once the
# ellipsis is added is returned as a whole.
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # return early if chopping wouldn't make string shorter; the
        # filler is " ... " (5 chars) in the middle, 4 chars at either end
        my $in_center  = ($where eq 'center');
        my $filler_len = $in_center ? 5 : 4;
        return $str if ($len + $filler_len >= length($str));

        # when chopping in the middle, distribute $len into left and right part
        $len = int($len/2) if $in_center;

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                $str =~ m/^(.*?)($begre)$/;
                my ($lead, $body) = ($1, $2);
                $lead = " ..." if length($lead) > 4;
                return "$lead$body";
        }

        if ($in_center) {
                # keep the head, then chop the remainder from its left
                $str =~ m/^($endre)(.*)$/;
                my ($left, $rest) = ($1, $2);
                $rest =~ m/^(.*?)($begre)$/;
                my ($mid, $right) = ($1, $2);
                $mid = " ... " if length($mid) > 5;
                return "$left$mid$right";
        }

        # 'right': keep the head, replace a long enough tail
        $str =~ m/^($endre)(.*)$/;
        my ($body, $tail) = ($1, $2);
        $tail = "... " if length($tail) > 4;
        return "$body$tail";
}
1559
# Same arguments as chop_str.  The result is HTML-escaped; if chop_str
# actually changed the string, the escaped text is additionally wrapped
# in a <span> whose title attribute carries the full string (with
# control characters replaced by '?').
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);

	# unchanged by chop_str: plain escaped text, no tooltip
	return esc_html($chopped) if $chopped eq $str;

	(my $title = $str) =~ s/[[:cntrl:]]/?/g;
	return $cgi->span({-title=>$title}, esc_html($chopped));
}
1574
1575 ## ----------------------------------------------------------------------
1576 ## functions returning short strings
1577
# CSS class for given age value (in seconds):
#   undefined age      -> "noage"
#   less than 2 hours  -> "age0"
#   less than 2 days   -> "age1"
#   anything older     -> "age2"
sub age_class {
	my $age = shift;

	return "noage" unless defined $age;
	return "age0"  if $age < 60*60*2;
	return "age1"  if $age < 60*60*24*2;
	return "age2";
}
1592
# convert age in seconds to "nn units ago" string
#
# The largest unit of which the age exceeds two is used (years, months,
# weeks, days, hours, min, sec); ages of two seconds or less give
# " right now" (with the leading space).
sub age_string {
	my $age = shift;

	# [ exclusive lower bound in seconds, divisors applied in order, unit ]
	my @scales = (
		[ 60*60*24*365*2,      [ 60, 60, 24, 365    ], "years"  ],
		[ 60*60*24*(365/12)*2, [ 60, 60, 24, 365/12 ], "months" ],
		[ 60*60*24*7*2,        [ 60, 60, 24, 7      ], "weeks"  ],
		[ 60*60*24*2,          [ 60, 60, 24         ], "days"   ],
		[ 60*60*2,             [ 60, 60             ], "hours"  ],
		[ 60*2,                [ 60                 ], "min"    ],
		[ 2,                   [                    ], "sec"    ],
	);

	foreach my $scale (@scales) {
		my ($bound, $divisors, $unit) = @$scale;
		next unless $age > $bound;

		# divide step by step and truncate only the final quotient
		my $count = $age;
		$count /= $_ foreach @$divisors;
		return int($count) . " $unit ago";
	}

	return " right now";
}
1624
# file type bits not provided by Fcntl, written as octal literals;
# S_IFGITLINK is the type tested by S_ISGITLINK
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1629
# true if the file type bits of (numeric) $mode are S_IFGITLINK,
# i.e. the entry is a submodule/subproject (a commit object reference)
sub S_ISGITLINK {
	my ($mode) = @_;

	my $type_bits = ($mode & S_IFMT);
	return ($type_bits == S_IFGITLINK);
}
1636
# convert file mode in octal to symbolic file mode string
# (argument is a string of octal digits, result looks like 'ls -l' output;
# unrecognized types give '----------')
sub mode_str {
	my $mode = oct shift;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# regular file: git cares only about the executable bit
	return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1658
# convert file mode in octal to file type string
# ("submodule", "directory", "symlink", "file" or "unknown");
# an argument that is not a string of octal digits is returned as is
sub file_type {
	my $mode = shift;

	return $mode if $mode !~ m/^[0-7]+$/;
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT);
	return "symlink"   if S_ISLNK($mode);
	return "file"      if S_ISREG($mode);
	return "unknown";
}
1681
# convert file mode in octal to file type description string;
# like file_type, but a regular file with the user-executable bit set
# is reported as "executable".  An argument that is not a string of
# octal digits is returned as is.
sub file_type_long {
	my $mode = shift;

	return $mode if $mode !~ m/^[0-7]+$/;
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT);
	return "symlink"   if S_ISLNK($mode);
	return "unknown"   unless S_ISREG($mode);

	return ($mode & S_IXUSR) ? "executable" : "file";
}
1708
1709
1710 ## ----------------------------------------------------------------------
1711 ## functions returning short HTML fragments, or transforming HTML fragments
1712 ## which don't belong to other sections
1713
# format line of commit message: the line is HTML-escaped (with -nbsp),
# then every standalone run of 8 to 40 hex digits is turned into a link
# to the "object" action for that id.
sub format_log_line_html {
	my $html = esc_html(shift, -nbsp=>1);

	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{
		my $id = $1;
		$cgi->a({-href => href(action=>"object", hash=>$id),
		         -class => "text"}, $id);
	}eg;

	return $html;
}
1726
# format marker of refs pointing to given object
#
# $refs maps object ids to array refs of ref names (e.g. "tags/v2.6.11",
# "heads/next", with a "^{}" suffix marking an indirect ref); $id is the
# object id to look up.  Returns ' <span class="refs">...</span>' holding
# one linked marker per ref, or "" if no ref points to $id.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	if (defined $refs->{$id}) {
		foreach my $stored_ref (@{$refs->{$id}}) {
			# Work on a copy: the loop variable aliases the element of
			# the caller's array, so stripping the suffix in place would
			# change $refs and a later call for the same $id would no
			# longer see the ref as indirect.
			my $ref = $stored_ref;

			# this code exploits the fact that non-lightweight tags are the
			# only indirect objects, and that they are the only objects for which
			# we want to use tag instead of shortlog as action
			my ($type, $name);
			my $indirect = ($ref =~ s/\^\{\}$//);
			# e.g. tags/v2.6.11 or heads/next
			if ($ref =~ m!^(.*?)s?/(.*)$!) {
				$type = $1;
				$name = $2;
			} else {
				$type = "ref";
				$name = $ref;
			}

			my $class = $type;
			$class .= " indirect" if $indirect;

			my $dest_action = "shortlog";

			if ($indirect) {
				$dest_action = "tag" unless $action eq "tag";
			} elsif ($action =~ /^(history|(short)?log)$/) {
				$dest_action = $action;
			}

			my $dest = "";
			$dest .= "refs/" unless $ref =~ m!^refs/!;
			$dest .= $ref;

			# Ref names may contain characters that are special in HTML,
			# so the link text is escaped explicitly and the attributes
			# are handed to CGI, which escapes attribute values.
			my $link = $cgi->a({
				-href => href(
					action=>$dest_action,
					hash=>$dest
				)}, esc_html($name));

			$markers .= ' ' .
				$cgi->span({-class => $class, -title => $ref}, $link);
		}
	}

	if ($markers) {
		return ' <span class="refs">'. $markers . '</span>';
	} else {
		return "";
	}
}
1786
# format, perhaps shortened and with markers, title line
#
# Returns a link to $href with class "list subject" followed by $extra
# (empty if not given).  If $short is shorter than $long, the link text is
# $short and the full $long text (control characters replaced by '?')
# goes into the title attribute; otherwise the link text is $long.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr = (-href => $href, -class => "list subject");
	my $text = $long;

	if (length($short) < length($long)) {
		$text = $short;
		$long =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($long);
	}

	return $cgi->a(\%attr, esc_html($text)) . $extra;
}
1802
1803 # Rather than recomputing the url for an email multiple times, we cache it
1804 # after the first hit. This gives a visible benefit in views where the avatar
1805 # for the same email is used repeatedly (e.g. shortlog).
1806 # The cache is shared by all avatar engines (currently gravatar and picon), which
1807 # are free to use it as preferred. Since only one avatar engine is used for any
1808 # given page, there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first; the complete URL is kept in %avatar_cache
# under the lowercased address and reused on later calls.
sub picon_url {
	my $email = lc shift;

	$avatar_cache{$email} ||= do {
		my ($user, $domain) = split('@', $email);
		"http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
		"$domain/$user/" .
		"users+domains+unknown/up/single";
	};

	return $avatar_cache{$email};
}
1824
# Compute the gravatar url for a given email, if it's not in the cache already.
# Only the part of the URL before the size (the part containing the MD5
# of the lowercased email) is stored in %avatar_cache; $size is appended
# on every call, so one cache entry serves all sizes.
sub gravatar_url {
	my ($email, $size) = @_;
	$email = lc $email;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
			Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
1837
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
#
# Options (passed as key => value pairs after $email):
#   -size       - key into %avatar_size; a missing or unknown key selects
#                 the 'default' entry
#   -pad_before - if true, put "&nbsp;" before the image
#   -pad_after  - if true, put "&nbsp;" after the image
#
# Returns the <img> element (with padding), or "" when $git_avatar names
# no known provider.
sub git_get_avatar {
	my ($email, %opts) = @_;
	my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
	my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
	$opts{-size} ||= 'default';
	my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};
	my $url = "";
	if ($git_avatar eq 'gravatar') {
		$url = gravatar_url($email, $size);
	} elsif ($git_avatar eq 'picon') {
		$url = picon_url($email);
	}
	# Other providers can be added by extending the if chain, defining $url
	# as needed. If no variant puts something in $url, we assume avatars
	# are completely disabled/unavailable.
	return "" unless $url;

	# The URL may embed parts of the email address verbatim (picon), so
	# it is escaped before being placed inside the attribute value.
	return $pre_white .
	       "<img width=\"$size\" " .
	            "class=\"avatar\" " .
	            "src=\"" . $cgi->escapeHTML($url) . "\" " .
	            "alt=\"\" " .
	       "/>" . $post_white;
}
1866
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype selects the search ('author' or 'committer') and the verb
# used in the link title.  If the 'search' feature is not enabled,
# $displaytext is returned unchanged.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	my $have_search = gitweb_check_feature('search');
	return $displaytext unless $have_search;

	my $performed =
		$searchtype eq 'author'    ? "authored"  :
		$searchtype eq 'committer' ? "committed" :
		                             "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype), class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
1889
# format the author name of the given commit with the given tag
# ($tag is the HTML element name, $co the commit hash with 'author_name'
# and 'author_email'); remaining arguments are passed on to
# chop_and_escape_str to chop and escape the name (see chop_str).
# The avatar and the name are wrapped in an author-search link.
sub format_author_html {
	my ($tag, $co, @chop_opts) = @_;

	my $author = chop_and_escape_str($co->{'author_name'}, @chop_opts);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $link   = format_search_author($co->{'author_name'}, "author",
	                                  $avatar . $author);

	return "<$tag class=\"author\">" . $link . "</$tag>";
}
1903
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# The file names in $line are dropped and rebuilt from $from / $to
# ('file' is shown, and linked when 'href' is set).  A true
# $diffinfo->{'nparents'} marks a combined diff, which shows only the
# "to" file; an ordinary diff shows "a/<from> b/<to>".
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# escaped path with the given prefix, as a link if the side has an href
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = $prefix . esc_path($side->{'file'});
		return $text unless $side->{'href'};
		return $cgi->a({-href => $side->{'href'}, -class => "path"}, $text);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff; file was deleted if there is no href
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff; no 'from' href: file was added,
		# no 'to' href: file was deleted
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
1939
# format extended diff header line, before patch itself
#
# $line is one extended header line; $diffinfo supplies 'nparents',
# 'from_id' and 'to_id'; $from and $to supply 'href' and 'file' (for a
# combined diff, $from->{'href'} and $diffinfo->{'from_id'} are arrays
# with one element per parent).  Paths of copy/rename lines and the
# hashes of "index" lines are turned into links, a trailing six-digit
# mode gets a file type description appended.
# Returns the formatted line followed by "<br/>\n".
sub format_extended_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
		                 esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                 esc_path($to->{'file'}));
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		$line = 'index ';
		for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
			if ($from->{'href'}[$i]) {
				$line .= $cgi->a({-href=>$from->{'href'}[$i],
				                  -class=>"hash"},
				                 substr($diffinfo->{'from_id'}[$i],0,7));
			} else {
				# no link for this parent: show an all-zero id
				$line .= '0' x 7;
			}
			# separator
			$line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
		}
		$line .= '..';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                 substr($diffinfo->{'to_id'},0,7));
		} else {
			$line .= '0' x 7;
		}

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff
		# (the dots are escaped so that only a literal ".." separator
		# between the two hashes is accepted)
		my ($from_link, $to_link);
		if ($from->{'href'}) {
			$from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			                     substr($diffinfo->{'from_id'},0,7));
		} else {
			$from_link = '0' x 7;
		}
		if ($to->{'href'}) {
			$to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                   substr($diffinfo->{'to_id'},0,7));
		} else {
			$to_link = '0' x 7;
		}
		# swap the full ids for the (linked) abbreviated ones, keeping
		# whatever follows them on the line
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2005
# format from-file/to-file diff header
#
# $from_line / $to_line are the "--- ..." and "+++ ..." lines of the patch.
# For an ordinary diff one "from_file" div is produced; for a combined
# diff (true $diffinfo->{'nparents'}) there is one "from_file" div per
# parent, using @parents as the parents' base hashes.  A single "to_file"
# div always follows.  Lines not naming an a/ or b/ path (such as
# /dev/null) are passed through without extra formatting.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my $result = '';

	# escaped file name of one side, linked when the side has an href
	my $linked_path = sub {
		my ($side) = @_;
		return $side->{'href'}
			? $cgi->a({-href=>$side->{'href'}, -class=>"path"},
			          esc_path($side->{'file'}))
			: esc_path($side->{'file'});
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit)
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $line = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				# "<n>/<path>": <n> links to the blobdiff against
				# parent number n, <path> to the parent's version
				my $parent_no = $cgi->a(
					{-href=>href(action=>"blobdiff",
					             hash_parent=>$diffinfo->{'from_id'}[$i],
					             hash_parent_base=>$parents[$i],
					             file_parent=>$from->{'file'}[$i],
					             hash=>$diffinfo->{'to_id'},
					             hash_base=>$hash,
					             file_name=>$to->{'file'}),
					 -class=>"path",
					 -title=>"diff" . ($i+1)},
					$i+1);
				my $parent_path = $cgi->a(
					{-href=>$from->{'href'}[$i], -class=>"path"},
					esc_path($from->{'file'}[$i]));
				$line = '--- ' . $parent_no . '/' . $parent_path;
			}
			$result .= qq!<div class="diff from_file">$line</div>\n!;
		}
	} else {
		# ordinary (single parent) diff
		my $line = $from_line;
		if ($line =~ m!^--- "?a/!) {
			$line = '--- a/' . $linked_path->($from);
		}
		$result .= qq!<div class="diff from_file">$line</div>\n!;
	}

	my $line = $to_line;
	if ($line =~ m!^\+\+\+ "?b/!) {
		$line = '+++ b/' . $linked_path->($to);
	}
	$result .= qq!<div class="diff to_file">$line</div>\n!;

	return $result;
}
2071
# create note for patch simplified by combined diff:
# a "diff --cc <file>" header div (the file name links to its blob
# unless is_deleted($diffinfo) is true) followed by a "Simple merge" div
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $file = is_deleted($diffinfo)
		? esc_path($diffinfo->{'to_file'})
		: $cgi->a({-href => href(action=>"blob",
		                         hash_base=>$hash,
		                         hash=>$diffinfo->{'to_id'},
		                         file_name=>$diffinfo->{'to_file'}),
		           -class => "path"},
		          esc_path($diffinfo->{'to_file'}));

	return join('',
		'<div class="diff header">', 'diff --cc ', $file, "</div>\n",
		'<div class="diff nodifferences">', 'Simple merge', "</div>\n");
}
2096
# format patch (diff) line (not to be used for diff headers)
#
# The line is wrapped in <div class="diff ..."> with an extra class for
# added, removed, chunk header and "incomplete" (backslash) lines, and
# tabs are expanded.  When $from and $to are given, the line ranges of
# chunk headers ("@@ ... @@", or "@@@ ... @@@" for combined diffs) are
# linked to the matching line ("#l<n>") of the respective file version.
# A combined diff is recognized by $from->{'href'} being an array ref.
sub format_diff_line {
	my ($line, $from, $to) = @_;
	my $diff_class = "";

	chomp $line;

	if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
		# combined diff: one marker column per parent
		my $markers = substr($line, 0, scalar @{$from->{'href'}});
		$diff_class =
			$line    =~ m/^\@{3}/ ? " chunk_header" :
			$line    =~ m/^\\/    ? " incomplete"   :
			$markers =~ tr/+/+/   ? " add"          :
			$markers =~ tr/-/-/   ? " rem"          :
			                        "";
	} else {
		# assume ordinary diff: first character decides
		my %class_for = (
			'+'  => " add",
			'-'  => " rem",
			'@'  => " chunk_header",
			"\\" => " incomplete",
		);
		my $first = substr($line, 0, 1);
		$diff_class = $class_for{$first} if exists $class_for{$first};
	}

	$line = untabify($line);
	my $div_open = "<div class=\"diff$diff_class\">";

	if ($from && $to && $line =~ m/^\@{2} /) {
		# ordinary chunk header: "@@ -<start>[,<n>] +<start>[,<n>] @@<section>"
		my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
			$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

		$from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
		                      -class=>"list"}, $from_text)
			if $from->{'href'};
		$to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
		                      -class=>"list"}, $to_text)
			if $to->{'href'};

		my $html = '<span class="chunk_info">@@ ' . $from_text . ' ' .
		           $to_text . ' @@</span>' .
		           '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
		return $div_open . $html . "</div>\n";
	}

	if ($from && $to && $line =~ m/^\@{3}/) {
		# combined chunk header: one range per parent, the result's last
		my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

		my @range_text = split(' ', $ranges);
		my @range_start;
		foreach my $text (@range_text) {
			# skip the leading sign; 0 if no start number follows it
			my ($start) = (split(',', substr($text, 1)), 0);
			push @range_start, $start;
		}
		my $to_text  = pop @range_text;
		my $to_start = pop @range_start;

		my $html = "<span class=\"chunk_info\">$prefix ";
		foreach my $i (0 .. $#range_text) {
			$html .= $from->{'href'}[$i]
				? $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
				           -class=>"list"}, $range_text[$i])
				: $range_text[$i];
			$html .= " ";
		}
		$html .= $to->{'href'}
			? $cgi->a({-href=>"$to->{'href'}#l$to_start",
			           -class=>"list"}, $to_text)
			: $to_text;
		$html .= " $prefix</span>" .
		         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
		return $div_open . $html . "</div>\n";
	}

	return $div_open . esc_html($line, -nbsp=>1) . "</div>\n";
}
2185
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# Which form is produced depends on the number of entries in @snapshot_fmts.
sub format_snapshot_links {
	my ($hash) = @_;
	my $num_fmts = @snapshot_fmts;

	# no formats available
	return undef unless $num_fmts;

	if ($num_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		# i.e. "_snapshot_"
		my ($fmt) = @snapshot_fmts;
		return $cgi->a({
			-href => href(
				action=>"snapshot",
				hash=>$hash,
				snapshot_format=>$fmt
			),
			-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
		}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	# e.g. "snapshot (_tar.gz_ _zip_)"
	my @links;
	foreach my $fmt (@snapshot_fmts) {
		push @links, $cgi->a({
			-href => href(
				action=>"snapshot",
				hash=>$hash,
				snapshot_format=>$fmt
			)
		}, $known_snapshot_formats{$fmt}{'display'});
	}
	return "snapshot (" . join(' ', @links) . ")";
}
2220
2221 ## ......................................................................
2222 ## functions returning values to be passed, perhaps after some
2223 ## transformation, to other functions; e.g. returning arguments to href()
2224
# returns hash to be passed to href to generate gitweb URL
# in -title key it returns description of link
#
# $format (default 'Atom') is lowercased to give the 'action'.  Returns
# nothing when no project is selected or the current action is one of
# tags, heads, forks, tag, search.
sub get_feed_info {
	my $format = shift || 'Atom';
	my %res = (action => lc($format));

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branches refs uses 'refs/heads/' prefix (fullname) to differentiate
	# from tag links; this also makes possible to detect branch links
	# ($hash_base is consulted before $hash)
	my $branch;
	foreach my $candidate ($hash_base, $hash) {
		next unless defined $candidate;
		if ($candidate =~ m!^refs/heads/(.*)$!) {
			$branch = $1;
			last;
		}
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} elsif (defined $branch) {
		$type = "log of $branch";
	} else {
		$type = 'log';
	}

	$res{-title}      = $type;
	$res{'hash'}      = (defined $branch ? "refs/heads/$branch" : undef);
	$res{'file_name'} = $file_name;

	return %res;
}
2260
2261 ## ----------------------------------------------------------------------
2262 ## git utility subroutines, invoking git commands
2263
# Returns, as a list, the git executable followed by the --git-dir
# option for the currently selected repository.  Every call is counted
# in $number_of_git_cmds.
sub git_cmd {
        $number_of_git_cmds += 1;
        return ($GIT, "--git-dir=$git_dir");
}
2269
# Shell-quote every argument and join the results with single spaces.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Prefer list-form invocation over this function whenever possible.
sub quote_command {
        my @quoted;
        foreach my $arg (@_) {
                # work on a copy so the caller's values stay untouched
                my $word = $arg;
                $word =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$word'";
        }
        return join(' ', @quoted);
}
2278
# Resolve HEAD of the given project via git_get_full_hash().
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2283
# Thin wrapper: passes (project, revision) straight to git_get_hash()
# without any extra rev-parse options.
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2287
# Same as git_get_full_hash(), but appends '--short=7' to the options
# handed to git_get_hash().
sub git_get_short_hash {
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2291
# Run "git rev-parse --verify -q [options] <hash>" inside the given
# project and return the first output line (chomped), or undef when the
# command cannot be started or prints nothing.
#
# $git_dir is pointed at the project for the duration of the call and is
# put back afterwards only if it had a defined value before.
sub git_get_hash {
        my ($project, $hash, @options) = @_;
        my $saved_git_dir = $git_dir;
        my $retval;

        $git_dir = "$projectroot/$project";
        # git_cmd() reads $git_dir, so build the command after switching
        my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @cmd) {
                $retval = <$fd>;
                chomp $retval if defined $retval;
                close $fd;
        }
        $git_dir = $saved_git_dir if defined $saved_git_dir;

        return $retval;
}
2308
# Ask "git cat-file -t" for the type of the given object.  Returns the
# type string without its trailing newline, or nothing when the command
# cannot be started or close() reports a failure.
sub git_get_type {
        my ($hash) = @_;

        my @cmd = (git_cmd(), "cat-file", '-t', $hash);
        my $fd;
        unless (open $fd, "-|", @cmd) {
                return;
        }
        my $type = <$fd>;
        unless (close $fd) {
                return;
        }
        chomp $type;
        return $type;
}
2319
# repository configuration
# $config_file: path of the config file whose parsed contents currently
#               sit in %config; git_get_project_config() compares it with
#               "$git_dir/config" to decide whether to re-read
# %config:      cached result of git_parse_project_config()
our $config_file = '';
our %config;
2323
# Add $value under $key in the hash referenced by $hash.
# The first value for a key is stored as a plain scalar; a second value
# turns the slot into an anonymous array [ <first>, <second> ], and any
# further values are appended to that array.
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                if (ref $hash->{$key}) {
                        # already a list of values
                        push @{$hash->{$key}}, $value;
                } else {
                        # promote the single stored value to a list
                        $hash->{$key} = [ $hash->{$key}, $value ];
                }
        } else {
                $hash->{$key} = $value;
        }
}
2337
# Return a hash of the git project configuration, as reported by
# "git config -z -l" for the current $git_dir.
#
# $section_regexp (optional) limits the result to keys of matching
# sections, e.g. 'gitweb'; it is used as a regular expression fragment.
# Keys that occur several times are collected by hash_set_multi().
# A key listed without a value is stored with an undefined value.
# Returns an empty list if the git command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  (The previous inline
        # match used the /o modifier, which compiles the pattern only the
        # first time it is reached in the whole process, so a later call
        # with a different section would silently reuse the old filter.)
        my $section_filter = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # records in '-z' output are NUL-terminated
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline
                my ($key, $value) = split(/\n/, $keyval, 2);

                hash_set_multi(\%config, $key, $value)
                        if (!defined $section_filter || $key =~ $section_filter);
        }
        close $fh;

        return %config;
}
2360
# Interpret a config value as a boolean.
# An undefined value (key present without '= value') is true, as are a
# string of digits that Perl considers true and the words 'true' / 'yes'
# in any letter case.  Everything else is false; nothing is an error.
sub config_to_bool {
        my $val = shift;

        # section.key (no value at all)
        return 1 unless defined $val;

        # ignore surrounding whitespace
        for ($val) {
                s/^\s+//;
                s/\s+$//;
        }

        # section.key = 1
        return $val if ($val =~ /^\d+$/ && $val);
        # section.key = true
        return $val =~ /^(?:true|yes)$/i;
}
2376
# Convert a config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (any letter case) causes
# the value to be multiplied by 1024, 1048576, or 1073741824.
#
# A value that does not end in such a suffix is returned unchanged apart
# from the stripped surrounding whitespace.  An undefined value (key set
# without '= value') is returned as undef without touching it, so no
# "uninitialized value" warnings are emitted.
sub config_to_int {
        my $val = shift;

        return $val unless defined $val;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
                my %multiplier = (
                        'k' => 1024,
                        'm' => 1048576,
                        'g' => 1073741824,
                );
                # a bare unit ("k") has always evaluated to 0; spell that
                # out instead of multiplying an empty string
                $num = 0 if $num eq '';
                return $num * $multiplier{lc($unit)};
        }
        return $val;
}
2396
# Normalise a config value to an array reference:
# a reference is returned as it is, a defined scalar is wrapped into a
# one-element array, and an undefined value yields an empty array.
sub config_to_multi {
        my $val = shift;

        return $val if ref($val);
        return [] unless defined($val);
        return [ $val ];
}
2403
# Look up a 'gitweb.<key>' variable in the configuration of the current
# repository ($git_dir).
#
# $key  - variable name, with or without the 'gitweb.' prefix; names
#         containing non-word characters are rejected
# $type - optional 'bool' or 'int' (a leading '--' is accepted); any
#         other type is ignored and the raw value is returned
#
# Returns nothing if $git_dir is unset, the key is unusable, or the
# variable does not exist.  For 'bool' the result is the string 'true'
# or 'false'; for 'int' it is whatever config_to_int() produces.
# The parsed 'gitweb' section is cached in %config and re-read only when
# $config_file differs from "$git_dir/config".
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check: only 'bool' and 'int' survive
        if (defined $type) {
                $type =~ s/^--//;
                unless ($type eq 'bool' || $type eq 'int') {
                        $type = undef;
                }
        }

        # (re)load the cache if it belongs to another repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        return unless exists $config{$full_key};

        # ensure given type
        return $config{$full_key} unless defined $type;
        if ($type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return config_to_bool($config{$full_key}) ? 'true' : 'false';
        }
        if ($type eq 'int') {
                return config_to_int($config{$full_key});
        }
        return $config{$full_key};
}
2442
# Get the object id of the entry at $path in tree-ish $base.
#
# $base - tree-ish handed to "git ls-tree"
# $path - path inside that tree; trailing slashes are ignored
# $type - optional object type ('blob', 'tree', ...) the entry must have
#
# Returns the 40-hex object id, or undef when no path is given, nothing
# exists at that path, the output cannot be parsed, close() fails, or
# the entry is not of the requested type.
# Calls die_error(500, ...) if git-ls-tree cannot be started.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift;
        my $type = shift;

        # test for "no path" explicitly: a plain truth test would also
        # reject a file that is literally named "0"
        return undef unless (defined $path && $path ne '');

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Take the captures from the match itself; reading $2/$3 after an
        # unchecked match would return leftovers of some earlier match
        # whenever this line does not have the expected shape.
        my ($entry_type, $entry_id) =
                ($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/)
                or return undef;

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_id;
}
2469
# Get the path of the entry with object id $hash inside tree-ish $base.
# Used to get the 'from' filename for combined diff (merge commit) for
# renames.
#
# Returns the first matching path found in "git ls-tree -r -t -z"
# output, undef if there is none or the command cannot be started, and
# nothing if either argument is missing.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # '-z' output: entries are NUL-terminated and paths are verbatim
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;

        my $found;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # \Q..\E keeps $hash from being read as a pattern; /s and \z
                # let a path that contains newlines match in full.
                if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
                        $found = $1;
                        last;
                }
        }
        close $fd;
        return $found;
}
2493
2494 ## ......................................................................
2495 ## git utility functions, directly accessing git repository
2496
# Return the description of the project at $path (relative to
# $projectroot): the first line of its 'description' file, or, when that
# file cannot be opened, the 'description' config variable.
# Side effect: points $git_dir at the project.
sub git_get_project_description {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/description") {
                return git_get_project_config('description');
        }
        my $descr = <$fd>;
        close $fd;

        # an empty file yields undef, which is returned as it is
        chomp $descr if defined $descr;
        return $descr;
}
2510
# Read the content tags of the project at $path (relative to
# $projectroot).  Every plain file in its 'ctags' directory is one tag:
# the file name is the tag and the first line of the file its value.
#
# Returns a hash reference { tag => value }; it is empty when the
# directory cannot be opened.  An empty tag file gives an undefined
# value.  Side effect: points $git_dir at the project.
sub git_get_project_ctags {
        my $path = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$path";
        opendir my $dh, "$git_dir/ctags"
                or return $ctags;
        foreach my $tagfile (grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh)) {
                open my $ct, '<', $tagfile or next;
                my $val = <$ct>;
                # an empty file yields undef; don't chomp that
                chomp $val if defined $val;
                close $ct;

                # the tag is the file name without its directory
                (my $ctag = $tagfile) =~ s#.*/##;
                $ctags->{$ctag} = $val;
        }
        closedir $dh;
        return $ctags;
}
2529
# Turn a { tag => count } hash reference into data for a tag cloud.
#
# Tags that differ only in letter case are merged: their counts are
# added up and the spelling with the highest individual count is kept
# as 'topname'.  If HTML::TagCloud can be loaded, an object of that
# class is returned (one entry per merged tag, linking to
# "$home_link?by_tag=<lowercased tag>"); otherwise a reference to the
# merged hash { lc_tag => { count, topcount, topname } } is returned.
sub git_populate_project_tagcloud {
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $merged = ($ctags_lc{lc $tag} ||= {});

                $merged->{count} += $weight;
                if (not $merged->{topcount}
                    or $merged->{topcount} < $weight) {
                        $merged->{topcount} = $weight;
                        $merged->{topname} = $tag;
                }
        }

        # without the module, hand back the merged data itself
        unless (eval { require HTML::TagCloud; 1; }) {
                return \%ctags_lc;
        }

        my $cloud = HTML::TagCloud->new;
        foreach my $key (sort keys %ctags_lc) {
                # Pad the title with spaces so that the cloud looks
                # less crammed.
                my $title = $ctags_lc{$key}->{topname};
                $title =~ s/ /&nbsp;/g;
                $title =~ s/^/&nbsp;/g;
                $title =~ s/$/&nbsp;/g;
                $cloud->add($title, $home_link."?by_tag=".$key, $ctags_lc{$key}->{count});
        }
        return $cloud;
}
2561
# Render the tag cloud produced by git_populate_project_tagcloud().
#
# $cloud - either an HTML::TagCloud object or the plain merged hash
#          { lc_tag => { count => ..., topname => ... } }
# $count - maximum number of tags to show
#
# Returns HTML: the object's html_and_css() output, or, for the plain
# hash, a centered paragraph of comma separated links taken from the
# first $count tags in ascending order of their count.
# (The debugging line that printed ref($cloud) to STDERR on every call
# has been removed.)
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;

        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                my @tags = sort { $cloud->{$a}->{count} <=> $cloud->{$b}->{count} } keys %$cloud;
                return '<p align="center">' . join (', ', map {
                        "<a href=\"$home_link?by_tag=$_\">$cloud->{$_}->{topname}</a>"
                } splice(@tags, 0, $count)) . '</p>';
        }
}
2574
# Return the clone URLs of the project at $path (relative to
# $projectroot): the lines of its 'cloneurl' file, or, when that file
# cannot be opened, the value(s) of the 'url' config variable.
# Gives a list in list context and an array reference otherwise.
# Side effect: points $git_dir at the project.
sub git_get_project_url_list {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        if (open my $fd, '<', "$git_dir/cloneurl") {
                my @git_project_url_list = <$fd>;
                close $fd;
                chomp @git_project_url_list;
                return wantarray ? @git_project_url_list : \@git_project_url_list;
        }

        # no cloneurl file: fall back to the repository configuration
        return wantarray ?
                @{ config_to_multi(git_get_project_config('url')) } :
                   config_to_multi(git_get_project_config('url'));
}
2588
# Collect the projects to show, as a list of hash references with a
# 'path' key (and an 'owner' key when read from an index file).
#
# $filter (optional) is a project path, with or without '.git'; when
# given, only projects below it ("<filter>/....git", i.e. its forks in
# the index-file case) are returned.
#
# $projects_list may be a directory, which is scanned with File::Find,
# or a file with one url-encoded "<path> <owner>" entry per line.
# Only paths accepted by check_export_ok() are listed.  Returns nothing
# if the index file cannot be opened.
sub git_get_projects_list {
        my ($filter) = @_;
        my @list;

        $filter ||= '';
        $filter =~ s/\.git$//;

        my $check_forks = gitweb_check_feature('forks');

        # true if $candidate has the form "<$parent>/<anything>.git"
        my $is_fork_of = sub {
                my ($candidate, $parent) = @_;
                return 0 if (substr($candidate, 0, length($parent)) ne $parent);
                return 0 if (substr($candidate, length($parent)) !~ /^\/.*\.git$/);
                return 1;
        };

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                $dir .= "/$filter" if $filter;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);

                my $wanted = sub {
                        # global variables
                        our $project_maxdepth;
                        our $projectroot;
                        # skip project-list toplevel, if we get it.
                        return if (m!^[/.]$!);
                        # only directories can be git repositories
                        return unless (-d $_);
                        # don't traverse too deep (Find is super slow on os x)
                        if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                $File::Find::prune = 1;
                                return;
                        }

                        my $subdir = substr($File::Find::name, $pfxlen + 1);
                        # we check related file in $projectroot
                        my $path = ($filter ? "$filter/" : '') . $subdir;
                        if (check_export_ok("$projectroot/$path")) {
                                push @list, { path => $path };
                                # a repository was found: do not descend into it
                                $File::Find::prune = 1;
                        }
                };

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => $wanted,
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                my %paths;
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        next PROJECT if (!defined $path);

                        if ($filter ne '') {
                                # looking for forks of $filter only
                                next PROJECT unless $is_fork_of->($path, $filter);
                        } elsif ($check_forks) {
                                # a fork of an already listed project is
                                # not included in the list
                                foreach my $known (keys %paths) {
                                        next PROJECT if $is_fork_of->($path, $known);
                                }
                        }

                        if (check_export_ok("$projectroot/$path")) {
                                push @list, {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                # remember it, so that later entries can be
                                # recognised as its forks
                                (my $forks_path = $path) =~ s/\.git$//;
                                $paths{$forks_path}++;
                        }
                }
                close $fd;
        }
        return @list;
}
2691
# Cache of project owners read from the $projects_list index file:
# { <project path> => <owner> }.  Undefined until the first call of
# git_get_project_list_from_file().
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from $projects_list, if that is a plain
# file.  Does nothing when the cache has already been initialised.
# A file that cannot be opened, and blank lines inside it, are skipped;
# the cache is then simply left without the corresponding entries.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # the file may have vanished or be unreadable despite the
                # -f test; don't read from an unopened handle in that case
                open(my $fd, '<', $projects_list)
                        or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # blank line: no project name to file the owner under
                        next unless defined $pr;
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
}
2714
# Return the owner of the given project, taken from the first source
# that provides a defined value:
#   1. the projects index file (via $gitweb_project_owner),
#   2. the 'owner' variable of the repository configuration,
#   3. get_file_owner() on the repository directory.
# Returns undef for an empty project name.
# Side effect: points $git_dir at the project.
sub git_get_project_owner {
        my ($project) = @_;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # load the index file on first use
        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if exists $gitweb_project_owner->{$project};
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
2738
# Find out when the project at $path (relative to $projectroot) was
# last committed to, judging by the newest committer date among
# refs/heads.
#
# Returns ($age_in_seconds, age_string($age)); (undef, undef) when
# for-each-ref printed no usable committer line; nothing when the
# command cannot be started or close() reports a failure.
# Side effect: points $git_dir at the project.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        my $fd;
        open($fd, "-|", @cmd) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the committer line ends in "<epoch> <timezone>"
        my ($timestamp) = defined $most_recent
                ? ($most_recent =~ / (\d+) [-+][01]\d\d\d$/)
                : ();
        return (undef, undef) unless defined $timestamp;

        my $age = time() - $timestamp;
        return ($age, age_string($age));
}
2759
# Map object ids to the refs pointing at them, using
# "git show-ref --dereference".
#
# $type (optional), e.g. 'heads' or 'tags', restricts the listing to
# refs/$type.  Returns a hash reference { <40-hex id> => [ <ref name
# without the 'refs/' prefix>, ... ] }, or nothing when the command
# cannot be started or close() reports a failure.
sub git_get_references {
        my $type = shift || "";
        my %refs;

        my @cmd = (git_cmd(), "show-ref", "--dereference");
        # use -- <pattern> if $type
        push @cmd, "--", "refs/$type" if $type;

        open my $fd, "-|", @cmd
                or return;

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        while (my $line = <$fd>) {
                chomp $line;
                next unless ($line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!);
                # the per-id array springs into existence on first push
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
2782
# Describe $hash relative to a tag, using "git name-rev --tags".
#
# Returns the part after 'tags/' of the name-rev output, or undef when
# no hash is given, git prints nothing, or the revision cannot be named
# after a tag.  Returns nothing if the command cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all; there is nothing to match against
        return undef unless defined $name_rev;

        # \Q..\E: $hash is data, not a pattern
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
2798
2799 ## ----------------------------------------------------------------------
2800 ## parse to hash functions
2801
# Break an epoch timestamp down into the pieces gitweb displays.
#
# $epoch - seconds since the epoch
# $tz    - timezone as "+hhmm" / "-hhmm" (default "-0000")
#
# Returns a hash (as a list) with these keys:
#   hour, minute, mday, day, month      - UTC components
#   rfc2822, mday-time, iso-8601        - UTC, formatted
#   hour_local, minute_local, tz_local  - time of day in timezone $tz
#   iso-tz                              - date and time in $tz, with $tz
# A timezone that is not of the form [+-]hhmm is treated as an offset
# of zero for the *_local values; 'tz_local' still reports it verbatim.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # Offset of $tz from UTC, in seconds.  Sign, hours and minutes are
        # handled separately: "int $h + $m/60" truncates the sum, which
        # loses the minutes of "+0530" and is off by an hour for "-0330".
        my $tz_offset = 0;
        if ($tz =~ m/^([+\-])([0-9][0-9])([0-9][0-9])$/) {
                my $sign = ($1 eq '-') ? -1 : 1;
                $tz_offset = $sign * (($2 * 60) + $3) * 60;
        }
        my $local = $epoch + $tz_offset;
        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
2833
# Parse the tag object $tag_id, as printed by "git cat-file tag".
#
# Returns a hash (as a list) with the keys 'id', 'object', 'type',
# 'name', 'author', 'author_epoch', 'author_tz', 'author_name',
# 'author_email' (only if the tagger has the "name <email>" form) and
# 'comment' (array reference with the message lines).
# Returns nothing if the command cannot be started, close() reports a
# failure, or the object has no 'tag' header.
sub parse_tag {
        my ($tag_id) = @_;
        my %tag;
        my @comment;

        my @cmd = (git_cmd(), "cat-file", "tag", $tag_id);
        open my $fd, "-|", @cmd or return;
        $tag{'id'} = $tag_id;

        # header lines, up to the empty line or the start of a signature
        while (my $line = <$fd>) {
                chomp $line;

                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next;
                }
                if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                        next;
                }
                if ($line =~ m/--BEGIN/) {
                        # this line already belongs to the message
                        push @comment, $line;
                        last;
                }
                last if ($line eq "");
        }

        # whatever is left is the message
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
2874
# Parse one commit record in the format printed by
# "git rev-list --header" (see parse_commit and parse_commits).
#
# $commit_text - the text of one record
# $withparents - if defined, the parents are taken only from the first
#                line of the record (rev-list --parents output) and the
#                'parent' header lines are ignored
#
# Returns a hash (as a list) with the keys 'id', 'tree', 'parents',
# 'parent', 'author*', 'committer*', 'title', 'title_short', 'comment',
# 'age', 'age_string', 'age_string_date' and 'age_string_age'.
# Returns nothing if the record is empty, does not start with a 40-hex
# object id, or has no 'tree' header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        # first line: commit id, optionally followed by the parent ids
        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # Header lines.  The lines come from split on newline, so they
        # cannot equal "\n"; the loop ends when shift yields a false
        # value, i.e. at the empty line that follows the headers.
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # The title is the first non-empty message line.  NOTE: $title is
        # an alias of the element of @commit_lines, so every substitution
        # below also changes that line as later stored in $co{'comment'}.
        foreach my $title (@commit_lines) {
                $title =~ s/^    //;
                if ($title ne "") {
                        $co{'title'} = chop_str($title, 80, 5);
                        # remove leading stuff of merges to make the interesting part visible
                        if (length($title) > 50) {
                                $title =~ s/^Automatic //;
                                $title =~ s/^merge (of|with) /Merge ... /i;
                                if (length($title) > 50) {
                                        $title =~ s/(http|rsync):\/\///;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/(master|www|rsync)\.//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/kernel.org:?//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/\/pub\/scm//;
                                }
                        }
                        $co{'title_short'} = chop_str($title, 50, 5);
                        last;
                }
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        # (in place, again through the loop alias; lines already stripped
        # by the title loop above no longer start with the four spaces)
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        # age is measured from the committer timestamp
        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # older than two weeks: the date goes into 'age_string_date' and
        # the relative age into 'age_string_age'; otherwise the other way
        # round
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
2972
# Fetch and parse a single commit.
#
# Runs "git rev-list --parents --header --max-count=1 <commit_id> --"
# and hands the output to parse_commit_text() in "with parents" mode.
# Returns the resulting hash (as a list); it is empty if nothing could
# be parsed.  Calls die_error(500, ...) if git-rev-list cannot be started.
sub parse_commit {
        my ($commit_id) = @_;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--parents",
                   "--header",
                   "--max-count=1",
                   $commit_id,
                   "--");
        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");
        # read in list context, exactly as the records arrive
        my @records = <$fd>;
        close $fd;

        my %co = parse_commit_text(@records, 1);
        return %co;
}
2991
# Fetch and parse a range of commits with "git rev-list --header".
#
# $commit_id - revision to start from
# $maxcount  - maximum number of commits (a false value means 1)
# $skip      - number of commits to skip first (default 0)
# $filename  - optional path limiter
# @args      - further options for rev-list, placed before the limits
#
# Returns the parsed commits as hash references, one per record (an
# empty hash for a record parse_commit_text() rejects): a list in list
# context, an array reference otherwise.
# Calls die_error(500, ...) if git-rev-list cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount ||= 1;
        $skip ||= 0;

        my @cmd = (git_cmd(), "rev-list",
                   "--header",
                   @args,
                   "--max-count=$maxcount",
                   "--skip=$skip",
                   @extra_options,
                   $commit_id,
                   "--");
        push @cmd, $filename if $filename;

        # records are NUL-terminated
        local $/ = "\0";

        open my $fd, "-|", @cmd
                or die_error(500, "Open git-rev-list failed");

        my @cos;
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3019
# Parse one line of git-diff-tree "raw" output into a hash.
#
# Three kinds of lines are recognised:
#   - ordinary diff line: from_mode, to_mode, from_id, to_id, status,
#     similarity, from_file, to_file (plus 'file' unless the status is
#     'R' or 'C')
#   - combined diff line (merge commit): nparents, from_mode and from_id
#     (array references, one entry per parent), to_mode, to_id, status
#     (array reference of letters), to_file
#   - bare 40-hex line: commit
# Anything else gives an empty hash.  Returns the hash as a list in
# list context and as a hash reference otherwise.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if (my @field = ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/)) {
                @res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'}
                        = @field[0 .. 5];
                my $names = $field[6];
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        # two tab separated names: source and destination
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $names);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif (my ($colons, $modes, $ids, $status, $file) =
               ($line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/)) {
                # the last mode and the last id belong to the result, the
                # ones before them to the parents
                my @mode_list = split(' ', $modes);
                my @id_list   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @mode_list;
                $res{'from_mode'} = \@mode_list;
                $res{'to_id'}     = pop @id_list;
                $res{'from_id'}   = \@id_list;
                $res{'status'}    = [ split('', $status) ];
                $res{'to_file'}   = unquote($file);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3058
# Wrapper returning parsed git-diff-tree "raw" information.
# The argument is either a raw line, which is run through
# parse_difftree_raw_line(), or an already parsed (or hand-built) hash
# reference, which is returned untouched.
sub parsed_difftree_line {
        my ($line_or_ref) = @_;

        # anything that is not a plain hash reference is treated as raw text
        return parse_difftree_raw_line($line_or_ref)
                unless ref($line_or_ref) eq "HASH";

        return $line_or_ref;
}
3071
# Parse one line of git-ls-tree output into a hash with the keys
# mode, type, hash, name and (with '-l') size.
#
# Arguments: the line, followed by options:
#   -l => true  the line comes from "ls-tree -l" and carries a size column
#   -z => true  the name is taken verbatim; otherwise it goes through
#               unquote()
#
# Returns the hash as a list in list context, a hash reference otherwise.
# When the line does not match the expected layout every value is undef.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        # The captures are taken from the match's return list rather than
        # from $1..$5: after a failed match those variables still hold the
        # values of some earlier, unrelated successful match.
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                @res{qw(mode type hash size name)} =
                        $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                @res{qw(mode type hash name)} =
                        $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;
        }

        # without -z the name may be quoted by git
        if (defined $res{'name'} && !$opts{'-z'}) {
                $res{'name'} = unquote($res{'name'});
        }

        return wantarray ? %res : \%res;
}
3107
# Fill in _two_ hashes, passed by reference as the 2nd and 3rd argument,
# describing the "from" and "to" side of a parsed difftree entry.
#
# Each hash receives 'file' and, where the file exists on that side,
# 'href' (a link to the blob view).  For a combined diff (the entry has
# 'nparents') the "from" values are array references with one element per
# parent, and the remaining arguments are the parent commit ids.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                unless (exists $diffinfo->{'from_file'}) {
                        fill_from_file_info($diffinfo, @parents);
                }
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the result name when this parent has none
                        $from->{'file'}[$i] =
                                defined $diffinfo->{'from_file'}[$i]
                                        ? $diffinfo->{'from_file'}[$i]
                                        : $diffinfo->{'to_file'};
                        if ($diffinfo->{'status'}[$i] eq "A") {
                                # new (added) file: nothing to link to in this parent
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        } else {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") {
                        # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                delete $to->{'href'};
        } else {
                # file exists in result
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3153
3154 ## ......................................................................
3155 ## parse to array of hashes functions
3156
# List branches (refs/heads), sorted by committer date, newest first.
#
# With a true $limit, at most $limit+1 refs are requested from
# git-for-each-ref.  Every entry is a hash reference with the keys
# fullname, name, id, title, epoch and age.
#
# Returns the list in list context, an array reference otherwise; returns
# nothing when git cannot be started.
sub git_get_heads_list {
        my $limit = shift;

        my @cmd = (git_cmd(), 'for-each-ref');
        push @cmd, '--count='.($limit+1) if $limit;
        push @cmd, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                'refs/heads';

        open my $fd, '-|', @cmd
                or return;

        my @headslist;
        while (my $line = <$fd>) {
                chomp $line;
                # "<ref info>\0<committer info>"
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $fullname, $title) = split(' ', $refinfo, 3);
                # only the timestamp of "<name> <epoch> <tz>" is needed
                my (undef, $epoch, undef) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $name = $fullname) =~ s!^refs/heads/!!;

                my %ref_item;
                $ref_item{'fullname'} = $fullname;
                $ref_item{'name'}     = $name;
                $ref_item{'id'}       = $hash;
                $ref_item{'title'}    = $title || '(no commit message)';
                $ref_item{'epoch'}    = $epoch;
                $ref_item{'age'}      = $epoch ? age_string(time - $epoch) : "unknown";

                push @headslist, \%ref_item;
        }
        close $fd;

        return \@headslist unless wantarray;
        return @headslist;
}
3193
# List tags (refs/tags), sorted by creator date, newest first.
#
# With a true $limit, at most $limit+1 refs are requested from
# git-for-each-ref.  Every entry is a hash reference with the keys
# fullname, type, id, name, reftype and refid; tag objects also get
# 'subject', and tag or commit objects get 'epoch' and 'age'.
#
# Returns the list in list context, an array reference otherwise; returns
# nothing when git cannot be started.
sub git_get_tags_list {
        my $limit = shift;

        my @cmd = (git_cmd(), 'for-each-ref');
        push @cmd, '--count='.($limit+1) if $limit;
        push @cmd, '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags';

        open my $fd, '-|', @cmd
                or return;

        my @tagslist;
        while (my $line = <$fd>) {
                chomp $line;
                # "<ref info>\0<creator info>"
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $fullname, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                # only the timestamp of "<name> <epoch> <tz>" is needed
                my (undef, $epoch, undef) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $name = $fullname) =~ s!^refs/tags/!!;

                my %ref_item;
                $ref_item{'fullname'} = $fullname;
                $ref_item{'type'}     = $type;
                $ref_item{'id'}       = $id;
                $ref_item{'name'}     = $name;

                if ($type eq "tag") {
                        # tag object: use the fields of the object it points to
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # the ref points at the object directly
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'}   = $epoch ? age_string(time - $epoch) : "unknown";
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return \@tagslist unless wantarray;
        return @tagslist;
}
3242
3243 ## ----------------------------------------------------------------------
3244 ## filesystem-related functions
3245
# Return the owner of $path as a displayable name: the GECOS field of the
# owning user's passwd entry, cut at the first ',' or ';' and passed
# through to_utf8().
#
# Returns undef when $path cannot be stat()ed, or when no GECOS field is
# available for the owning uid.
sub get_file_owner {
        my $path = shift;

        # stat() gives an empty list on failure.  Without this check the
        # undefined uid would be looked up as uid 0 and the superuser would
        # be reported as the owner of a nonexistent path.
        my @st = stat($path);
        return undef unless @st;
        my $st_uid = $st[4];

        # element 6 of the getpwuid() list is the GECOS field
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3258
# Print the contents of $filename to the currently selected output handle,
# passing every line through to_utf8().
# Callers are expected to have checked that the file exists; if it cannot
# be opened anyway, nothing is printed.
sub insert_file {
        my $filename = shift;

        # do not go on to read from a handle that failed to open
        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3267
3268 ## ......................................................................
3269 ## mimetype related functions
3270
# Look up the MIME type for $filename in the mime.types-style file
# $mimemap.
#
# Each non-comment line of that file is "<mimetype><TAB(s)><ext> <ext> ...".
# The extension is the part of $filename after its last dot, compared
# exactly as written.  When an extension is listed more than once, the
# last line naming it wins.
#
# Returns the MIME type, or undef when the map file is not readable, the
# filename has no extension, or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # Take the capture from the match's return list: after a failed
        # match $1 would still hold the value of an earlier, unrelated match.
        my ($ext) = $filename =~ /\.([^.]*)$/;
        return undef unless defined $ext;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # lexical loop variable, so that the caller's $_ is left alone
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, $exts) = split(/\t+/, $line);
                if (defined $exts) {
                        my @exts = split(/\s+/, $exts);
                        foreach my $listed (@exts) {
                                $mimemap{$listed} = $mimetype;
                        }
                }
        }
        close($mh);

        return $mimemap{$ext};
}
3293
# Guess the MIME type of $filename from its extension.
# The configured $mimetypes_file is consulted first (a relative path is
# taken relative to the current project directory), then /etc/mime.types.
# Returns undef when the filename contains no dot or no map knows it.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # an absolute path is used as is, anything else is
                # relative to the project
                my $file = ($mimetypes_file !~ m!^/!)
                        ? "$projectroot/$project/$mimetypes_file"
                        : $mimetypes_file;
                $mime = mimetype_guess_file($filename, $file);
        }
        unless ($mime) {
                $mime = mimetype_guess_file($filename, '/etc/mime.types');
        }
        return $mime;
}
3310
# Determine the MIME type of a blob from its file name and/or contents.
# A type guessed from the file name wins.  Failing that: without a file
# handle the configured default is returned; contents that pass the -T
# test are text/plain; otherwise a few image extensions are recognised and
# everything else is application/octet-stream.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;

        if ($filename) {
                return 'image/png'  if $filename =~ m/\.png$/i;
                return 'image/gif'  if $filename =~ m/\.gif$/i;
                return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        }
        return 'application/octet-stream';
}
3337
# Build the Content-Type value for a blob.
# Uses $type when it is given (and true), otherwise asks blob_mimetype().
# For text/plain the default charset is appended when one is configured.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless $type eq 'text/plain' && defined $default_text_plain_charset;

        return "$type; charset=$default_text_plain_charset";
}
3348
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Arguments: $highlight (highlighting enabled?), $mimetype (not used here)
# and $file_name.  The basename, with a trailing '.in' removed, is looked
# up in %highlight_basename first; after that the part following its last
# dot is looked up in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # Take the capture from the match's return list: for a name without
        # a dot the match fails, and $1 would still hold the value of an
        # earlier, unrelated match.
        my ($ext) = $basename =~ /\.([^.]*)$/;
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3365
# Run the syntax highlighter over the current blob ($hash) and return a
# file handle reading its output; when highlighting is off or no syntax is
# known, the file handle passed in is returned unchanged.
# The incoming handle is closed first, and git-cat-file is run again with
# its output piped through the highlighter.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        unless ($highlight && defined $syntax) {
                return $fd;
        }

        close $fd
                or die_error(404, "Reading blob failed");

        my $blob_cmd      = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $highlight_cmd = quote_command($highlight_bin);
        open $fd, $blob_cmd." | ".$highlight_cmd." --xhtml --fragment --syntax $syntax |"
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3380
3381 ## ======================================================================
3382 ## functions printing HTML: header, footer, error page
3383
# Compose the page title from the site name and, as far as they are
# defined, the current project, action and file name:
#   "<site> - <project>/<action> - <file>"
# For the "tree" action a trailing slash is appended to the file name
# unless it already ends with one.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        }

        return $title;
}
3401
# Print the HTTP response header and the opening part of an HTML page:
# XML prolog and DOCTYPE, the <head> element (title, optional <base>,
# stylesheets, feed links, favicon), the optional site header file, the
# "page_header" div with the breadcrumbs and, when a project is selected
# and the 'search' feature is enabled, the search form.
#
# Arguments:
#   $status   HTTP status line, "200 OK" when false
#   $expires  passed to the CGI header as -expires
#   %opts     -no_http_header => true suppresses the HTTP header
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type;
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        if (defined $cgi->http('HTTP_ACCEPT') &&
            $cgi->http('HTTP_ACCEPT') =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
            $cgi->Accept('application/xhtml+xml') != 0) {
                $content_type = 'application/xhtml+xml';
        } else {
                $content_type = 'text/html';
        }
        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                           -status=> $status, -expires => $expires)
                unless ($opts{'-no_http_header'});
        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        if ($ENV{'PATH_INFO'}) {
                print "<base href=\"".esc_url($base_url)."\" />\n";
        }
        # print out each stylesheet that exist, providing backwards capability
        # for those people who defined $stylesheet in a config file
        if (defined $stylesheet) {
                print '<link rel="stylesheet" type="text/css" href="'.$stylesheet.'"/>'."\n";
        } else {
                foreach my $stylesheet (@stylesheets) {
                        next unless $stylesheet;
                        print '<link rel="stylesheet" type="text/css" href="'.$stylesheet.'"/>'."\n";
                }
        }
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                # The list must be parenthesised: using a bare qw(...) as the
                # parentheses of foreach is a syntax error in current perls.
                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => "$project - $href_params{'-title'} - $format feed",
                                '-type' => "application/$type+xml"
                        );

                        # first the full feed ...
                        $href_params{'action'} = $type;
                        $link_attr{'-href'} = href(%href_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        # ... then the variant without merge commits
                        $href_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%href_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       $site_name, href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       $site_name, href(project=>undef, action=>"opml"));
        }
        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href="$favicon" type="image/png" />\n);
        }

        print "</head>\n" .
              "<body>\n";

        if (defined $site_header && -f $site_header) {
                insert_file($site_header);
        }

        print "<div class=\"page_header\">\n" .
              $cgi->a({-href => esc_url($logo_url),
                       -title => $logo_label},
                      qq(<img src="$logo" width="72" height="27" alt="git" class="logo"/>));
        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        print " / $action";
                }
                print "\n";
        }
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                if (!defined $searchtext) {
                        $searchtext = "";
                }
                # search from the most specific revision known for this page
                my $search_hash;
                if (defined $hash_base) {
                        $search_hash = $hash_base;
                } elsif (defined $hash) {
                        $search_hash = $hash;
                } else {
                        $search_hash = "HEAD";
                }
                # form target; this lexical hides the global $action from here on
                my $action = $my_uri;
                my $use_pathinfo = gitweb_check_feature('pathinfo');
                if ($use_pathinfo) {
                        $action .= "/".esc_url($project);
                }
                # without path_info the project travels as the hidden field "p"
                print $cgi->startform(-method => "get", -action => $action) .
                      "<div class=\"search\">\n" .
                      (!$use_pathinfo &&
                      $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
                      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
                      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
                      $cgi->popup_menu(-name => 'st', -default => 'commit',
                                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
                      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
                      " search:\n",
                      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
                      "<span title=\"Extended regular expression\">" .
                      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                     -checked => $search_use_regexp) .
                      "</span>" .
                      "</div>" .
                      $cgi->end_form() . "\n";
        }
}
3555
# Print the closing part of an HTML page: the "page_footer" div (project
# description and feed links, or the OPML/TXT project index links when no
# project is selected), optional timing information (when the 'timed'
# feature is enabled), the optional site footer file, the JavaScript
# hooks, and the closing </body> and </html> tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                if (defined $descr) {
                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
                }

                my %href_params = get_feed_info();
                if (!%href_params) {
                        # no feed information for this page: mark the links as generic
                        $feed_class .= ' generic';
                }
                $href_params{'-title'} ||= 'log';

                # The list must be parenthesised: using a bare qw(...) as the
                # parentheses of foreach is a syntax error in current perls.
                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        } else {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="$javascript"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                # incremental blame: start fetching the blame data
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } elsif (gitweb_check_feature('javascript-actions')) {
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = fixLinks;\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
3621
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# Prints a complete error page (header, message, footer) and then jumps to
# the DONE_GITWEB label, unless the option -error_handler is true.
# The status defaults to 500 and the message to "Internal Server Error";
# the message is HTML-escaped, the detailed description is printed as is.
# Options following the description are also passed on to git_header_html().
# A status code not listed above is sent as "500 Internal Server Error" in
# the HTTP header, while the page body still shows the code as given.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # An unmapped code must not reach git_header_html() as undef: there
        # it would be replaced by the default "200 OK", and the error page
        # would be delivered as a success.
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
3665
3666 ## ----------------------------------------------------------------------
3667 ## functions printing or outputting HTML: navigation
3668
# Print the "page_nav" div: the row of links to the standard views
# (summary, shortlog, log, commit, commitdiff, tree) plus any links
# configured through the 'actions' feature, followed by $extra.
#
# Arguments:
#   $current   name of the current view, printed as plain text, not a link
#   $suppress  name of a view to leave out
#   $head      hash for the commit/commitdiff links (and for shortlog/log
#              when the current view is one of the commit-related ones)
#   $treehead, $treebase  hash and hash_base for the tree link
#   $extra     additional HTML (pager or formats), empty by default
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                qw(summary shortlog log commit commitdiff tree);

        # parameters for href(), one set per view
        my %arg;
        $arg{$_} = {action=>$_} foreach @navs;

        if (defined $head) {
                my @views_with_head = qw(commit commitdiff);
                push @views_with_head, qw(shortlog log)
                        if $current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x;
                $arg{$_}{'hash'} = $head foreach @views_with_head;
        }

        if (defined $treehead) {
                $arg{'tree'}{'hash'} = $treehead;
        }
        if (defined $treebase) {
                $arg{'tree'}{'hash_base'} = $treebase;
        }

        # configured extra actions come as (label, link, position) triples
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (@actions) {
                my ($label, $link, $pos) = splice(@actions,0,3);
                # put the new label right after the view named by $pos
                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
                # expand the %-placeholders in the link
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @links;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @links, $nav;
                        next;
                }
                push @links,
                        $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @links);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
3718
# Return the HTML for the "first . prev . next" pager.
# "first" and "prev" are links only when $page is greater than 0, "next"
# only when $has_next_link is true; otherwise the plain word is shown.
# $action is accepted but not used.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my $backward;
        if ($page > 0) {
                $backward =
                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
                        " &sdot; " .
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        } else {
                $backward = "first &sdot; prev";
        }

        my $forward = $has_next_link
                ? $cgi->a({-href => href(-replay=>1, page=>$page+1),
                           -accesskey => "n", -title => "Alt-n"}, "next")
                : "next";

        return $backward . " &sdot; " . $forward;
}
3744
3745 ## ......................................................................
3746 ## functions printing or outputting HTML: div
3747
# Print the "header" div: a single link with class "title" pointing to
# $action (with $hash and $hash_base added when they are true).  The link
# text is $title, or $action when no title is given.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        $args{'hash'}      = $hash      if $hash;
        $args{'hash_base'} = $hash_base if $hash_base;

        my $label = $title ? $title : $action;

        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
3761
# Print the string produced by format_local_time() for the given
# parsed-date key/value list.
sub print_local_time {
        my $formatted = format_local_time(@_);
        print $formatted;
}
3765
# Format the local time of a parsed date as " (HH:MM TZ)".
# Takes a key/value list and reads 'hour_local', 'minute_local' and
# 'tz_local' from it.  When the local hour is before 6, the HH:MM part is
# wrapped in <span class="atnight">.
sub format_local_time {
        my %date = @_;

        my $hhmm = sprintf("%02d:%02d", $date{'hour_local'}, $date{'minute_local'});
        if ($date{'hour_local'} < 6) {
                $hhmm = "<span class=\"atnight\">" . $hhmm . "</span>";
        }

        return sprintf(" (%s %s)", $hhmm, $date{'tz_local'});
}
3779
# Print the author name and author date in long form, wrapped in one element.
#   $co   - commit hash ref; 'author_name', 'author_epoch', 'author_tz' and
#           'author_email' are read
#   %opts - -tag       => element name to wrap the output in (default 'div')
#           -localtime => if true, the local time is printed after the date
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
        my $author_link = format_search_author($author, "author", esc_html($author));

        print "<$tag class=\"author_date\">" . $author_link . " [$ad{'rfc2822'}";
        print_local_time(%ad) if ($opts{-localtime});

        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);
        print "]" . $avatar . "</$tag>\n";
}
3795
# Print table rows with the full author and/or committer information, in
# the layout used by the 'commit' view (and similar).
#   $co     - commit hash ref; "<who>_name", "<who>_email", "<who>_epoch"
#             and "<who>_tz" are read for every person listed
#   @people - who to print ('author', 'committer'); an empty list means both
# Each person takes two rows: name, e-mail and avatar (spanning both rows),
# then the date followed by the local time.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') unless @people;

        foreach my $who (@people) {
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link  = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');

                print "<tr><td>$who</td><td>" . $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" . $avatar . "</td></tr>\n" .
                      "<tr><td></td><td> $wd{'rfc2822'}";
                print_local_time(%wd);
                print "</td></tr>\n";
        }
}
3823
# Print the "page_path" breadcrumb: a link to the tree root, then one link
# per leading directory of $name, then the last path component.
#   $name - path of the object being shown; when undef only the root link
#           is printed
#   $type - 'blob': last component links to the blob_plain view;
#           'tree': last component links to the tree view, followed by " / ";
#           anything else (or undef): last component is printed as text
#   $hb   - hash_base passed to every generated link
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # compare with '' instead of testing truth, so that a
                        # leading directory called "0" still gets its separator
                        $fullname .= ($fullname ne '' ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # link the last component to the path we were given ($name),
                # not to whatever the global $file_name happens to hold
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
3861
# Print the lines of a commit message as HTML, one "<br/>"-terminated line
# each.
#   $log  - array ref of message lines; NOTE: it is modified in place (the
#           title, if requested, and leading empty lines are shifted off)
#   %opts - -remove_title     => drop the first line of the message
#           -remove_signoff   => do not print signoff-like lines
#           -final_empty_line => make sure the output ends with an empty line
# Runs of empty lines are collapsed into one, and empty lines directly
# following a signoff-like line are not printed.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # true while the preceding line(s) were signoff lines
        my $empty = 0;   # true if the last printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        # signoff lines are either highlighted or dropped
                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n"
                                unless $opts{'-remove_signoff'};
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                        # Only a non-empty line ends the "after signoff" state.
                        # Clearing the flag before the check above (as was done
                        # previously) meant it was never seen as set.
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
3910
# Return the link target (what the link points to) of the symlink blob
# $hash, i.e. the whole output of "cat-file blob" for it.  Returns nothing
# if the command cannot be started or if closing the pipe reports failure.
sub git_get_link_target {
        my ($hash) = @_;

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;
        # read link: slurp everything in one go
        my $link_target = do { local $/ = undef; <$fd> };
        close $fd
                or return;

        return $link_target;
}
3928
# Given a link target and the directory (basedir) the link is in, return
# the target of the link relative to the top directory (top tree).
#   $link_target - contents of the symlink
#   $basedir     - directory containing the link; undef or '' means the
#                  top (root) tree
# Returns nothing (undef in scalar context) if this is not possible:
# for absolute links and for links leading outside the top directory.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # test for emptiness explicitly, a directory may be called "0"
        my $path = (defined $basedir && $basedir ne '')
                ? $basedir . '/' . $link_target
                : $link_target; # we are in top (root) tree (dir)

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' (but keep components such as "0",
                # which are false in boolean context)
                next if ($part eq '' || $part eq '.');
                if ($part eq '..') {
                        # link leads outside repository (outside top dir)
                        return unless @path_parts;
                        pop @path_parts;
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
3968
# Print one tree entry (a row of git_tree), without the enclosing <tr>.
#   $t          - hash ref describing the entry; 'mode', 'type', 'hash' and
#                 'name' are read, plus 'size' when it exists
#   $basedir    - prepended verbatim to the entry name to form file_name
#   $hash_base  - when defined, it is added to the links and the "history"
#                 link is shown
#   $have_blame - when true, blobs get a "blame" link
# Cells printed: mode, optional size, name ("list") and action links
# ("link").  Entries that are neither 'blob' nor 'tree' (this includes
# 'commit', i.e. submodules) get a plain name and at most a history link.
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
        my $type = $t->{'type'};

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n" if exists $t->{'size'};

        if ($type eq "blob") {
                my $path = "$basedir$t->{'name'}";

                # name cell; for symbolic links the target is appended
                my $name_link = $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                                       file_name=>$path, %base_key),
                                         -class => "list"}, esc_path($t->{'name'}));
                print "<td class=\"list\">" . $name_link;
                if (S_ISLNK(oct $t->{'mode'})) {
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                # only targets that normalize to a path inside
                                # the tree are turned into links
                                my $shown = defined $norm_target
                                        ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                 file_name=>$norm_target),
                                                   -title => $norm_target}, esc_path($link_target))
                                        : esc_path($link_target);
                                print " -> " . $shown;
                        }
                }
                print "</td>\n";

                # action links, separated by " | "
                my @links = ($cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
                                                    file_name=>$path, %base_key)},
                                     "blob"));
                if ($have_blame) {
                        push @links, $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                            file_name=>$path, %base_key)},
                                             "blame");
                }
                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                            hash=>$t->{'hash'}, file_name=>$path)},
                                             "history");
                }
                push @links, $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                                    file_name=>$path)},
                                     "raw");
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } elsif ($type eq "tree") {
                my $path = "$basedir$t->{'name'}";

                print "<td class=\"list\">" .
                      $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                             file_name=>$path,
                                             %base_key)},
                              esc_path($t->{'name'})) .
                      "</td>\n";

                my @links = ($cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
                                                    file_name=>$path,
                                                    %base_key)},
                                     "tree"));
                if (defined $hash_base) {
                        push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                            file_name=>$path)},
                                             "history");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" . esc_path($t->{'name'}) . "</td>\n";

                my $history = '';
                if (defined $hash_base) {
                        $history = $cgi->a({-href => href(action=>"history",
                                                          hash_base=>$hash_base,
                                                          file_name=>"$basedir$t->{'name'}")},
                                           "history");
                }
                print "<td class=\"link\">" . $history . "</td>\n";
        }
}
4061
4062 ## ......................................................................
4063 ## functions printing large fragments of HTML
4064
# Fill in the pre-image file names for a merge (combined) diff entry.
#   $diff    - hash ref of a parsed combined diff line; 'nparents',
#              'status' (array ref) and 'from_id' (array ref) are read and
#              'from_file' is (re)created as an array ref
#   @parents - parent commit ids, in the same order as the status entries
# For every parent whose status is 'R' or 'C' the from_file entry is looked
# up with git_get_path_by_hash(); all other entries stay undefined.
# Returns $diff.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $last = $diff->{'nparents'} - 1;

        # start with one (undefined) slot per parent
        $diff->{'from_file'} = [ ];
        $diff->{'from_file'}[$last] = undef;

        foreach my $i (0 .. $last) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');
                $diff->{'from_file'}[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4081
# Is the given raw difftree line a file deletion?  True when the 'to_id'
# of $diffinfo consists of 40 zeros.
sub is_deleted {
        my ($diffinfo) = @_;
        my $null_id = '0' x 40;

        return $diffinfo->{'to_id'} eq $null_id;
}
4088
# Does the patch correspond to the [previous] difftree raw line?
#   $diffinfo  - hashref of parsed raw diff format
#   $patchinfo - hashref of parsed patch diff format
#                (the same keys as in $diffinfo)
# True only when both are defined and their 'to_file' values are equal.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_known = defined($diffinfo) && defined($patchinfo);
        return $both_known
                && $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4099
4100
4101 sub git_difftree_body {
4102         my ($difftree, $hash, @parents) = @_;
4103         my ($parent) = $parents[0];
4104         my $have_blame = gitweb_check_feature('blame');
4105         print "<div class=\"list_head\">\n";
4106         if ($#{$difftree} > 10) {
4107                 print(($#{$difftree} + 1) . " files changed:\n");
4108         }
4109         print "</div>\n";
4110
4111         print "<table class=\"" .
4112               (@parents > 1 ? "combined " : "") .
4113               "diff_tree\">\n";
4114
4115         # header only for combined diff in 'commitdiff' view
4116         my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
4117         if ($has_header) {
4118                 # table header
4119                 print "<thead><tr>\n" .
4120                        "<th></th><th></th>\n"; # filename, patchN link
4121                 for (my $i = 0; $i < @parents; $i++) {
4122                         my $par = $parents[$i];
4123                         print "<th>" .
4124                               $cgi->a({-href => href(action=>"commitdiff",
4125                                                      hash=>$hash, hash_parent=>$par),
4126                                        -title => 'commitdiff to parent number ' .
4127                                                   ($i+1) . ': ' . substr($par,0,7)},
4128                                       $i+1) .
4129                               "&nbsp;</th>\n";
4130                 }
4131                 print "</tr></thead>\n<tbody>\n";
4132         }
4133
4134         my $alternate = 1;
4135         my $patchno = 0;
4136         foreach my $line (@{$difftree}) {
4137                 my $diff = parsed_difftree_line($line);
4138
4139                 if ($alternate) {
4140                         print "<tr class=\"dark\">\n";
4141                 } else {
4142                         print "<tr class=\"light\">\n";
4143                 }
4144                 $alternate ^= 1;
4145
4146                 if (exists $diff->{'nparents'}) { # combined diff
4147
4148                         fill_from_file_info($diff, @parents)
4149                                 unless exists $diff->{'from_file'};
4150
4151                         if (!is_deleted($diff)) {
4152                                 # file exists in the result (child) commit
4153                                 print "<td>" .
4154                                       $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4155                                                              file_name=>$diff->{'to_file'},
4156                                                              hash_base=>$hash),
4157                                               -class => "list"}, esc_path($diff->{'to_file'})) .
4158                                       "</td>\n";
4159                         } else {
4160                                 print "<td>" .
4161                                       esc_path($diff->{'to_file'}) .
4162                                       "</td>\n";
4163                         }
4164
4165                         if ($action eq 'commitdiff') {
4166                                 # link to patch
4167                                 $patchno++;
4168                                 print "<td class=\"link\">" .
4169                                       $cgi->a({-href => "#patch$patchno"}, "patch") .
4170                                       " | " .
4171                                       "</td>\n";
4172                         }
4173
4174                         my $has_history = 0;
4175                         my $not_deleted = 0;
4176                         for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
4177                                 my $hash_parent = $parents[$i];
4178                                 my $from_hash = $diff->{'from_id'}[$i];
4179                                 my $from_path = $diff->{'from_file'}[$i];
4180                                 my $status = $diff->{'status'}[$i];
4181
4182                                 $has_history ||= ($status ne 'A');
4183                                 $not_deleted ||= ($status ne 'D');
4184
4185                                 if ($status eq 'A') {
4186                                         print "<td  class=\"link\" align=\"right\"> | </td>\n";
4187                                 } elsif ($status eq 'D') {
4188                                         print "<td class=\"link\">" .
4189                                               $cgi->a({-href => href(action=>"blob",
4190                                                                      hash_base=>$hash,
4191                                                                      hash=>$from_hash,
4192                                                                      file_name=>$from_path)},
4193                                                       "blob" . ($i+1)) .
4194                                               " | </td>\n";
4195                                 } else {
4196                                         if ($diff->{'to_id'} eq $from_hash) {
4197                                                 print "<td class=\"link nochange\">";
4198                                         } else {
4199                                                 print "<td class=\"link\">";
4200                                         }
4201                                         print $cgi->a({-href => href(action=>"blobdiff",
4202                                                                      hash=>$diff->{'to_id'},
4203                                                                      hash_parent=>$from_hash,
4204                                                                      hash_base=>$hash,
4205                                                                      hash_parent_base=>$hash_parent,
4206                                                                      file_name=>$diff->{'to_file'},
4207                                                                      file_parent=>$from_path)},
4208                                                       "diff" . ($i+1)) .
4209                                               " | </td>\n";
4210                                 }
4211                         }
4212
4213                         print "<td class=\"link\">";
4214                         if ($not_deleted) {
4215                                 print $cgi->a({-href => href(action=>"blob",
4216                                                              hash=>$diff->{'to_id'},
4217                                                              file_name=>$diff->{'to_file'},
4218                                                              hash_base=>$hash)},
4219                                               "blob");
4220                                 print " | " if ($has_history);
4221                         }
4222                         if ($has_history) {
4223                                 print $cgi->a({-href => href(action=>"history",
4224                                                              file_name=>$diff->{'to_file'},
4225                                                              hash_base=>$hash)},
4226                                               "history");
4227                         }
4228                         print "</td>\n";
4229
4230                         print "</tr>\n";
4231                         next; # instead of 'else' clause, to avoid extra indent
4232                 }
4233                 # else ordinary diff
4234
4235                 my ($to_mode_oct, $to_mode_str, $to_file_type);
4236                 my ($from_mode_oct, $from_mode_str, $from_file_type);
4237                 if ($diff->{'to_mode'} ne ('0' x 6)) {
4238                         $to_mode_oct = oct $diff->{'to_mode'};
4239                         if (S_ISREG($to_mode_oct)) { # only for regular file
4240                                 $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
4241                         }
4242                         $to_file_type = file_type($diff->{'to_mode'});
4243                 }
4244                 if ($diff->{'from_mode'} ne ('0' x 6)) {
4245                         $from_mode_oct = oct $diff->{'from_mode'};
4246                         if (S_ISREG($to_mode_oct)) { # only for regular file
4247                                 $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
4248                         }
4249                         $from_file_type = file_type($diff->{'from_mode'});
4250                 }
4251
4252                 if ($diff->{'status'} eq "A") { # created
4253                         my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
4254                         $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
4255                         $mode_chng   .= "]</span>";
4256                         print "<td>";
4257                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4258                                                      hash_base=>$hash, file_name=>$diff->{'file'}),
4259                                       -class => "list"}, esc_path($diff->{'file'}));
4260                         print "</td>\n";
4261                         print "<td>$mode_chng</td>\n";
4262                         print "<td class=\"link\">";
4263                         if ($action eq 'commitdiff') {
4264                                 # link to patch
4265                                 $patchno++;
4266                                 print $cgi->a({-href => "#patch$patchno"}, "patch");
4267                                 print " | ";
4268                         }
4269                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4270                                                      hash_base=>$hash, file_name=>$diff->{'file'})},
4271                                       "blob");
4272                         print "</td>\n";
4273
4274                 } elsif ($diff->{'status'} eq "D") { # deleted
4275                         my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
4276                         print "<td>";
4277                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4278                                                      hash_base=>$parent, file_name=>$diff->{'file'}),
4279                                        -class => "list"}, esc_path($diff->{'file'}));
4280                         print "</td>\n";
4281                         print "<td>$mode_chng</td>\n";
4282                         print "<td class=\"link\">";
4283                         if ($action eq 'commitdiff') {
4284                                 # link to patch
4285                                 $patchno++;
4286                                 print $cgi->a({-href => "#patch$patchno"}, "patch");
4287                                 print " | ";
4288                         }
4289                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4290                                                      hash_base=>$parent, file_name=>$diff->{'file'})},
4291                                       "blob") . " | ";
4292                         if ($have_blame) {
4293                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
4294                                                              file_name=>$diff->{'file'})},
4295                                               "blame") . " | ";
4296                         }
4297                         print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
4298                                                      file_name=>$diff->{'file'})},
4299                                       "history");
4300                         print "</td>\n";
4301
4302                 } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
4303                         my $mode_chnge = "";
4304                         if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4305                                 $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
4306                                 if ($from_file_type ne $to_file_type) {
4307                                         $mode_chnge .= " from $from_file_type to $to_file_type";
4308                                 }
4309                                 if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
4310                                         if ($from_mode_str && $to_mode_str) {
4311                                                 $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
4312                                         } elsif ($to_mode_str) {
4313                                                 $mode_chnge .= " mode: $to_mode_str";
4314                                         }
4315                                 }
4316                                 $mode_chnge .= "]</span>\n";
4317                         }
4318                         print "<td>";
4319                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4320                                                      hash_base=>$hash, file_name=>$diff->{'file'}),
4321                                       -class => "list"}, esc_path($diff->{'file'}));
4322                         print "</td>\n";
4323                         print "<td>$mode_chnge</td>\n";
4324                         print "<td class=\"link\">";
4325                         if ($action eq 'commitdiff') {
4326                                 # link to patch
4327                                 $patchno++;
4328                                 print $cgi->a({-href => "#patch$patchno"}, "patch") .
4329                                       " | ";
4330                         } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4331                                 # "commit" view and modified file (not onlu mode changed)
4332                                 print $cgi->a({-href => href(action=>"blobdiff",
4333                                                              hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4334                                                              hash_base=>$hash, hash_parent_base=>$parent,
4335                                                              file_name=>$diff->{'file'})},
4336                                               "diff") .
4337                                       " | ";
4338                         }
4339                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4340                                                      hash_base=>$hash, file_name=>$diff->{'file'})},
4341                                        "blob") . " | ";
4342                         if ($have_blame) {
4343                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4344                                                              file_name=>$diff->{'file'})},
4345                                               "blame") . " | ";
4346                         }
4347                         print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4348                                                      file_name=>$diff->{'file'})},
4349                                       "history");
4350                         print "</td>\n";
4351
4352                 } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
4353                         my %status_name = ('R' => 'moved', 'C' => 'copied');
4354                         my $nstatus = $status_name{$diff->{'status'}};
4355                         my $mode_chng = "";
4356                         if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4357                                 # mode also for directories, so we cannot use $to_mode_str
4358                                 $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
4359                         }
4360                         print "<td>" .
4361                               $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
4362                                                      hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
4363                                       -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
4364                               "<td><span class=\"file_status $nstatus\">[$nstatus from " .
4365                               $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
4366                                                      hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
4367                                       -class => "list"}, esc_path($diff->{'from_file'})) .
4368                               " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
4369                               "<td class=\"link\">";
4370                         if ($action eq 'commitdiff') {
4371                                 # link to patch
4372                                 $patchno++;
4373                                 print $cgi->a({-href => "#patch$patchno"}, "patch") .
4374                                       " | ";
4375                         } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4376                                 # "commit" view and modified file (not only pure rename or copy)
4377                                 print $cgi->a({-href => href(action=>"blobdiff",
4378                                                              hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4379                                                              hash_base=>$hash, hash_parent_base=>$parent,
4380                                                              file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
4381                                               "diff") .
4382                                       " | ";
4383                         }
4384                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4385                                                      hash_base=>$parent, file_name=>$diff->{'to_file'})},
4386                                       "blob") . " | ";
4387                         if ($have_blame) {
4388                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4389                                                              file_name=>$diff->{'to_file'})},
4390                                               "blame") . " | ";
4391                         }
4392                         print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4393                                                     file_name=>$diff->{'to_file'})},
4394                                       "history");
4395                         print "</td>\n";
4396
4397                 } # we should not encounter Unmerged (U) or Unknown (X) status
4398                 print "</tr>\n";
4399         }
4400         print "</tbody>" if $has_header;
4401         print "</table>\n";
4402 }
4403
# Print the patchset part of a diff view as HTML.
#
# Parameters:
#   $fd           - filehandle the patch text is read from, line by line
#   $difftree     - reference to array of raw difftree lines; the entry with
#                   index N gets the anchor id="patch<N+1>"
#   $hash         - not used by this subroutine itself
#   @hash_parents - parents; more than one selects combined diff handling
#
# Everything is written with print; there is no meaningful return value.
sub git_patchset_body {
        my ($fd, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;    # index of current entry in @$difftree
        my $patch_number = 0; # counts patches and simplified entries printed
        my $patch_line;       # current (chomp-ed) line read from $fd
        my $diffinfo;         # parsed difftree entry for the current patch
        my $to_name;          # file name taken from the "diff" header line
        my (%from, %to);      # filled in by parse_from_to_diffinfo()

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # 'last' does not run the 'continue' block below,
                        # so the patch div has to be closed here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                if (!defined $patch_line) {
                        # input ended right after the "--- " line: there is
                        # no "+++ " line to pair it with, so do not pass
                        # undef on to chomp and the header formatter; close
                        # the patch the same way as for EOF after the
                        # extended header
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        print format_diff_line($patch_line, \%from, \%to);
                }

        } continue {
                # runs on 'next PATCH' and on falling off the end of the
                # loop body, i.e. whenever one patch is finished
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
4554
4555 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4556
# Collects the data shown in the projects list (age, description, owner,
# forks marker and, with the 'ctags' feature, content tags) for every
# entry of @$projlist, and returns the list of entries that were filled in.
# Entries for which git_get_last_activity() returns an empty list are
# left out of the result.
# NOTE: the project hashes are updated in place, but no entry is removed
# from @$projlist itself
sub fill_project_list_info {
        my ($projlist, $check_forks) = @_;
        my @filled;

        my $want_ctags = gitweb_check_feature('ctags');
 PROJECT:
        foreach my $proj (@$projlist) {
                my $path = $proj->{'path'};

                my @activity = git_get_last_activity($path);
                next PROJECT unless @activity;
                ($proj->{'age'}, $proj->{'age_string'}) = @activity;

                # description: keep the full text and a shortened version
                unless (defined $proj->{'descr'}) {
                        my $long = git_get_project_description($path) || "";
                        $long = to_utf8($long);
                        $proj->{'descr_long'} = $long;
                        $proj->{'descr'} =
                                chop_str($long, $projects_list_description_width, 5);
                }

                unless (defined $proj->{'owner'}) {
                        $proj->{'owner'} = git_get_project_owner("$path") || "";
                }

                if ($check_forks) {
                        # "foo.git" is marked as having forks when a directory
                        # "foo" exists below $projectroot
                        my $stem = $path;
                        my $has_forks_dir = ($stem =~ s/\.git$//)
                                && ($stem !~ /\/$/)
                                && (-d "$projectroot/$stem");
                        $proj->{'forks'} = $has_forks_dir ? "-d $projectroot/$stem" : 0;
                }

                if ($want_ctags) {
                        $proj->{'ctags'} = git_get_project_ctags($path);
                }
                push @filled, $proj;
        }

        return @filled;
}
4597
# print the 'sort by' <th> element built by format_sort_th(); takes the
# same arguments ($name, $order, $header) and passes them on unchanged
sub print_sort_th {
        my @th_args = @_;
        print format_sort_th(@th_args);
}
4603
# Returns the HTML of one column header (<th>) of a sortable table.
#   $name   - name of the order this column stands for
#   $order  - currently selected order
#   $header - column title; defaults to ucfirst($name)
# For the currently selected order the title is plain text, otherwise it is
# a link that replays the current request with order=$name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header = ucfirst($name) unless $header;

        # column the list is already ordered by: no link needed
        return "<th>$header</th>\n" if $order eq $name;

        my $replay_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                   -class => "header"}, $header);
        return "<th>" . $replay_link . "</th>\n";
}
4620
# Print the table of projects (preceded by the tag cloud when the 'ctags'
# feature is enabled).
#
# Parameters:
#   $projlist  - reference to array of project hashes; it is passed through
#                fill_project_list_info() first
#   $order     - 'project', 'descr', 'owner' or 'age'; defaults to
#                $default_projects_order; any other value (e.g. 'none')
#                leaves the list in the order it was given
#   $from, $to - range of indices of entries to show; default is everything
#   $extra     - optional HTML put into an additional row at the bottom
#   $no_header - if true, the row with column titles is not printed
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;

        my $check_forks = gitweb_check_feature('forks');
        my @projects = fill_project_list_info($projlist, $check_forks);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );
        # sort only if we know how to: for an order without an entry in
        # %order_info there is neither a key nor a comparison type, and
        # sorting anyway would compare undefined values
        my $oi = defined $order ? $order_info{$order} : undef;
        if (defined $oi) {
                my $key = $oi->{'key'};
                if ($oi->{'type'} eq 'str') {
                        @projects = sort {$a->{$key} cmp $b->{$key}} @projects;
                } else {
                        @projects = sort {$a->{$key} <=> $b->{$key}} @projects;
                }
        }

        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                # sum up tag weights over all projects for the tag cloud
                my %ctags;
                foreach my $p (@projects) {
                        foreach my $ct (keys %{$p->{'ctags'}}) {
                                $ctags{$ct} += $p->{'ctags'}->{$ct};
                        }
                }
                my $cloud = git_populate_project_tagcloud(\%ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }
        my $alternate = 1;
        my $tagfilter = $cgi->param('by_tag');
        for (my $i = $from; $i <= $to; $i++) {
                my $pr = $projects[$i];

                next if $tagfilter and $show_ctags and not grep { lc $_ eq lc $tagfilter } keys %{$pr->{'ctags'}};
                # NOTE(review): $searchtext is interpolated as a regexp here;
                # confirm that it is validated before this point
                next if $searchtext and not $pr->{'path'} =~ /$searchtext/
                        and not $pr->{'descr_long'} =~ /$searchtext/;
                # Weed out forks or non-matching entries of search
                if ($check_forks) {
                        my $forkbase = $project; $forkbase ||= ''; $forkbase =~ s#\.git$#/#;
                        $forkbase="^$forkbase" if $forkbase;
                        next if not $searchtext and not $tagfilter and $show_ctags
                                and $pr->{'path'} =~ m#$forkbase.*/.*#; # regexp-safe
                }

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                print "<!-- $pr->{'forks'} -->\n";
                                print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "+");
                        }
                        print "</td>\n";
                }
                print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                        -class => "list"}, esc_html($pr->{'path'})) . "</td>\n" .
                      "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                        -class => "list", -title => $pr->{'descr_long'}},
                                        esc_html($pr->{'descr'})) . "</td>\n" .
                      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
                print "<td class=\"". age_class($pr->{'age'}) . "\">" .
                      (defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits") . "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary")}, "summary")   . " | " .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"shortlog")}, "shortlog") . " | " .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"log")}, "log") . " | " .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"tree")}, "tree") .
                      ($pr->{'forks'} ? " | " . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks") : '') .
                      "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4727
# Print commits in the long "log" format: for each commit a header div,
# navigation links, authorship and the full commit message.
#
# Parameters:
#   $commitlist - reference to array of parsed commits (hash references)
#   $from, $to  - range of indices to show; $from defaults to 0, $to is
#                 limited to the last index of @$commitlist
#   $refs       - passed to format_ref_marker() together with the commit id
#   $extra      - optional HTML printed in a "page_nav" div after the commits
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from, like the other *_body subroutines do
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                # authorship goes after the links, still inside "title_text"
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
4767
# Print commits $from..$to of @$commitlist as rows of the "shortlog" table:
# date, author, subject and links (commit, commitdiff, tree, snapshots).
# $extra, if defined, is put into an additional row at the bottom.
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        my $last_idx = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last_idx if (!defined $to || $last_idx < $to);

        print "<table class=\"shortlog\">\n";
        my $dark = 1; # rows alternate between "dark" and "light"
        for (my $idx = $from; $idx <= $to; $idx++) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                my $author_cell = format_author_html('td', \%co, 10);
                print "<td title=\"" . $co{'age_string_age'} . "\"><i>" .
                      $co{'age_string_date'} . "</i></td>\n" .
                      $author_cell . "<td>";

                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
                my $commitdiff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $commit_link . " | " . $commitdiff_link . " | " . $tree_link;

                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links if defined $snapshot_links;

                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4811
# Print commits $from..$to of @$commitlist as rows of the "history" table
# for the file $file_name of type $ftype.  For blobs, a "diff to current"
# link is added when the blob in the given commit differs from $file_hash.
# $extra, if defined, is put into an additional row at the bottom.
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        $from = 0 unless defined $from;
        if (!defined $to || $to > $#{$commitlist}) {
                $to = $#{$commitlist};
        }

        print "<table class=\"history\">\n";
        my $dark = 1; # rows alternate between "dark" and "light"
        for (my $idx = $from; $idx <= $to; $idx++) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # shortlog:   format_author_html('td', \%co, 10)
                my $author_cell = format_author_html('td', \%co, 15, 3);
                print "<td title=\"" . $co{'age_string_age'} . "\"><i>" .
                      $co{'age_string_date'} . "</i></td>\n" .
                      $author_cell . "<td>";

                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $view_link =
                        $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
                my $commitdiff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $view_link . " | " . $commitdiff_link;

                if ($ftype eq 'blob') {
                        my $blob_current = $file_hash;
                        my $blob_parent  = git_get_hash_by_path($commit, $file_name);
                        my $differs = defined $blob_current
                                && defined $blob_parent
                                && $blob_current ne $blob_parent;
                        if ($differs) {
                                # $hash_base is not a parameter; it comes from
                                # the enclosing scope
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$blob_current, hash_parent=>$blob_parent,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4871
# Print entries $from..$to of @$taglist as rows of the "tags" table:
# age, name, subject, link to the tag object itself (for entries of type
# "tag") and links depending on the type of the referenced object.
# $extra, if defined, is put into an additional row at the bottom.
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;

        my $last_idx = $#{$taglist};
        $from = 0 unless defined $from;
        $to = $last_idx if (!defined $to || $last_idx < $to);

        print "<table class=\"tags\">\n";
        my $dark = 1; # rows alternate between "dark" and "light"
        for (my $idx = $from; $idx <= $to; $idx++) {
                my %tag = %{ $taglist->[$idx] };
                my $subject = $tag{'subject'};
                my $subject_short;
                $subject_short = chop_str($subject, 30, 5) if defined $subject;

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                # age column stays empty when the age is not known
                print(defined $tag{'age'}
                        ? "<td><i>$tag{'age'}</i></td>\n"
                        : "<td></td>\n");

                my $name_link =
                        $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                                 -class => "list name"}, esc_html($tag{'name'}));
                print "<td>" . $name_link . "</td>\n" . "<td>";

                if (defined $subject) {
                        print format_subject_html($subject, $subject_short,
                                                  href(action=>"tag", hash=>$tag{'id'}));
                }
                print "</td>\n" .
                      "<td class=\"selflink\">";

                if ($tag{'type'} ne "tag") {
                        print "&nbsp;";
                } else {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                }

                my $target_link =
                        $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
                print "</td>\n" .
                      "<td class=\"link\">" . " | " . $target_link;

                # additional links depend on what the entry refers to
                if ($tag{'reftype'} eq "commit") {
                        print " | " . $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog") .
                              " | " . $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                } elsif ($tag{'reftype'} eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4934
# Print entries $from..$to of @$headlist as rows of the "heads" table:
# age, name and links (shortlog, log, tree).  The name cell of the entry
# whose id equals $head gets the class "current_head".
# $extra, if defined, is put into an additional row at the bottom.
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head, $from, $to, $extra) = @_;

        my $last_idx = $#{$headlist};
        $from = 0 unless defined $from;
        $to = $last_idx if (!defined $to || $last_idx < $to);

        print "<table class=\"heads\">\n";
        my $dark = 1; # rows alternate between "dark" and "light"
        for (my $idx = $from; $idx <= $to; $idx++) {
                my %ref = %{ $headlist->[$idx] };
                my $is_current = $ref{'id'} eq $head;

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark = !$dark;

                my $name_cell_open = $is_current ? "<td class=\"current_head\">" : "<td>";
                my $name_link =
                        $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                                 -class => "list name"},esc_html($ref{'name'}));
                my $shortlog_link =
                        $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog");
                my $log_link =
                        $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'name'})}, "tree");

                print "<td><i>" . $ref{'age'} . "</i></td>\n" .
                      $name_cell_open . $name_link . "</td>\n" .
                      "<td class=\"link\">" .
                      $shortlog_link . " | " . $log_link . " | " . $tree_link .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4972
# Print commits $from..$to of @$commitlist as rows of the "commit_search"
# table: date, author, subject followed by the lines of the commit message
# matching $search_regexp (match highlighted, with shortened context on
# both sides), and links (commit, commitdiff, tree).
# $extra, if defined, is put into an additional row at the bottom.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        print "<table class=\"commit_search\">\n";
        my $alternate = 1;
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                if (!%co) {
                        next;
                }
                my $commit = $co{'id'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
                my $comment = $co{'comment'};
                foreach my $line (@$comment) {
                        if ($line =~ m/^(.*?)($search_regexp)(.*)$/i) {
                                # The trailing context is the last group of
                                # the pattern, but not necessarily $3: any
                                # capture group inside $search_regexp shifts
                                # its number.  $+ is the highest-numbered
                                # group that matched, which is always the
                                # trailing one here.
                                my ($lead, $match, $trail) = ($1, $2, $+);
                                $match = chop_str($match, 70, 5, 'center');
                                # share what is left of ~80 columns between
                                # both sides, at most 30 characters each
                                my $contextlen = int((80 - length($match))/2);
                                $contextlen = 30 if ($contextlen > 30);
                                $lead  = chop_str($lead,  $contextlen, 10, 'left');
                                $trail = chop_str($trail, $contextlen, 10, 'right');

                                $lead  = esc_html($lead);
                                $match = esc_html($match);
                                $trail = esc_html($trail);

                                print "$lead<span class=\"match\">$match</span>$trail<br />";
                        }
                }
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5032
5033 ## ======================================================================
5034 ## ======================================================================
5035 ## actions
5036
# Show the project list page: the optional $home_text include, a project
# search form and the table printed by git_project_list_body().
#
# The sort key is read from $input_params{'order'} and passed on to
# git_project_list_body().  Replies with 400 for an unknown key and with
# 404 when git_get_projects_list() returns nothing.
sub git_project_list {
        my $order = $input_params{'order'};
        # Anchored on both ends: only the exact, known sort keys are valid
        # (an unanchored match would accept any string containing one).
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        # start_form() is the supported name (and pairs with end_form()
        # below); startform() is only a deprecated alias in CGI.pm.
        print $cgi->start_form(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
5062
# Show the list of forks of the current $project, as returned by
# git_get_projects_list($project).
#
# The sort key is read from $input_params{'order'} and passed on to
# git_project_list_body().  Replies with 400 for an unknown key and with
# 404 when no forks are found.
sub git_forks {
        my $order = $input_params{'order'};
        # Anchored on both ends: only the exact, known sort keys are valid
        # (an unanchored match would accept any string containing one).
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        # Other callers hand git_print_header_div() an esc_html()-escaped
        # title, so escape the project name here as well.
        git_print_header_div('summary', esc_html("$project forks"));
        git_project_list_body(\@list, $order);
        git_footer_html();
}
5080
# Emit a plain-text project index: one "<path> <owner>" line per project
# returned by git_get_projects_list($project).  Both fields are
# percent-encoded, except that '/' is kept and a space becomes '+'.
sub git_project_index {
        my @projects = git_get_projects_list($project);

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        for my $entry (@projects) {
                # look the owner up only when the list did not provide one
                $entry->{'owner'} = git_get_project_owner("$entry->{'path'}")
                        unless exists $entry->{'owner'};

                # work on copies, so that the project entry keeps raw values
                my @fields = ($entry->{'path'}, $entry->{'owner'});
                for my $field (@fields) {
                        # quote as in CGI::Util::encode, but keep the slash,
                        # and use '+' for ' '
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$fields[0] $fields[1]\n";
        }
}
5104
# Show the summary page of the current $project: description, owner,
# date of the last change, repository URLs, the optional content-tag
# cloud and README.html, followed by short lists (first 16 entries each)
# of commits, tags, heads and - if the 'forks' feature is on - forks.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
        my $head = $co{'id'};

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my @forklist;
        my $check_forks = gitweb_check_feature('forks');

        if ($check_forks) {
                @forklist = git_get_projects_list($project);
        }

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td><td>$cd{'rfc2822'}</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my $url_tag = "URL";
        my @url_list = git_get_project_url_list($project);
        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
        foreach my $git_url (@url_list) {
                next unless $git_url;
                # the URL is shown as text, so it has to be HTML-escaped
                # like the description and the owner above
                print "<tr class=\"metadata_url\"><td>$url_tag</td><td>" .
                      esc_html($git_url) . "</td></tr>\n";
                # only the first URL row carries the label
                $url_tag = "";
        }

        # Tag cloud
        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my $ctags = git_get_project_ctags($project);
                my $cloud = git_populate_project_tagcloud($ctags);
                print "<tr id=\"metadata_ctags\"><td>Content tags:<br />";
                print "</td>\n<td>" unless %$ctags;
                # the project name ends up inside an attribute value, so
                # escape it to keep a '"' or '<' in it from breaking out
                print "<form action=\"$show_ctags\" method=\"post\"><input type=\"hidden\" name=\"p\" value=\"" .
                      $cgi->escapeHTML($project) .
                      "\" />Add: <input type=\"text\" name=\"t\" size=\"8\" /></form>";
                print "</td>\n<td>" if %$ctags;
                print git_show_project_tagcloud($cloud, 48);
                print "</td></tr>";
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        if (!$prevent_xss && -s "$projectroot/$project/README.html") {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file("$projectroot/$project/README.html");
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist = $head ? parse_commits($head, 17) : ();
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $#commitlist <=  15 ? undef :
                                  $cgi->a({-href => href(action=>"shortlog")}, "..."));
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $#taglist <=  15 ? undef :
                              $cgi->a({-href => href(action=>"tags")}, "..."));
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $#headlist <= 15 ? undef :
                               $cgi->a({-href => href(action=>"heads")}, "..."));
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $#forklist <= 15 ? undef :
                                      $cgi->a({-href => href(action=>"forks")}, "..."),
                                      'no_header');
        }

        git_footer_html();
}
5205
# Show the tag object named by $hash: a header table linking to the
# tagged object (under the action named after the object's type), the
# authorship rows when the tag has an 'author', and the tag message.
# Replies with 404 when parse_tag() returns nothing.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both links of the "object" row lead to the same place
        my ($obj_type, $obj_id) = @tag{'type', 'object'};
        my $obj_href = href(action=>$obj_type, hash=>$obj_id);
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $cgi->a({-class => "list", -href => $obj_href}, $obj_id) . "</td>\n" .
              "<td class=\"link\">" . $cgi->a({-href => $obj_href}, $obj_type) . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n" .
              "<div class=\"page_body\">";

        # tag message, one line per <br/>
        foreach my $line (@{$tag{'comment'}}) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
5240
# Common implementation of the blame views.
#
# $format (first argument, default 'porcelain') selects the output:
#   'porcelain'   - HTML page built from `git blame -p` output
#   'incremental' - HTML page with the plain file contents, empty blame
#                   cells, a progress bar and a <noscript> notice
#   'data'        - text/plain `git blame --incremental` output followed
#                   by an "END" line; returns right after that
# A 'porcelain' request with the 'js' CGI parameter set is turned into
# an 'incremental' one.
#
# Uses the globals $file_name, $hash_base and $hash; $hash_base defaults
# to the project's head and $hash is looked up from the path when it is
# not defined.  Replies with 403 when the 'blame' feature is disabled,
# 400/404 for bad or unknown input and 500 when git cannot be started.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact string comparison: a regexp match would accept any
                # type that merely contains "blob", and an undefined type
                # must be rejected as well
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                print while <$fd>;
                close $fd
                        or print "ERROR $!\n";

                # terminator line, optionally with timing information
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        # offer a link to the other kind of blame view
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # blame cells are left empty in this format
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        # read "<key> [<value>]" header lines up to the
                        # TAB-prefixed line holding the file contents
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        # first value seen for a key wins
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a group size is only given on the first line of a
                        # group, so this switches color once per group
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell spanning the whole group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent
                        # commit when there is one, else of this commit
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
5470
# Blame view in the default ('porcelain') format of git_blame_common().
sub git_blame {
        return git_blame_common('porcelain');
}
5474
# Blame view in the 'incremental' format of git_blame_common().
sub git_blame_incremental {
        my $format = 'incremental';
        return git_blame_common($format);
}
5478
# Blame output in the plain-text 'data' format of git_blame_common().
sub git_blame_data {
        my $format = 'data';
        return git_blame_common($format);
}
5482
# Show the page listing all tags of the current $project; the table is
# printed by git_tags_body() and omitted when there are no tags.
sub git_tags {
        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        # Other callers hand git_print_header_div() an esc_html()-escaped
        # title, so escape the project name here as well.
        git_print_header_div('summary', esc_html($project));

        my @tagslist = git_get_tags_list();
        if (@tagslist) {
                git_tags_body(\@tagslist);
        }
        git_footer_html();
}
5495
# Show the page listing all heads of the current $project; the table is
# printed by git_heads_body() and omitted when there are no heads.
sub git_heads {
        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        # Other callers hand git_print_header_div() an esc_html()-escaped
        # title, so escape the project name here as well.
        git_print_header_div('summary', esc_html($project));

        my @headslist = git_get_heads_list();
        if (@headslist) {
                git_heads_body(\@headslist, $head);
        }
        git_footer_html();
}
5508
# Send the raw contents of a blob.
#
# $type (optional first argument) is passed on to blob_contenttype(),
# whose result becomes the Content-Type.  The blob is taken from the
# global $hash or, when that is undefined, looked up by $file_name in
# $hash_base (or in the project's head).  Replies with 400 when neither
# a hash nor a file name is given, 404 when the file cannot be found and
# 500 when git cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name is sent as a quoted-string: backslash-escape the two
        # characters that are special there, so that a file name with a
        # '"' or '\' in it cannot end or corrupt the filename parameter.
        (my $quoted_name = $save_as) =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))$!;

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $quoted_name . '"');
        # slurp the blob and pass it through without any output encoding
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
5561
# Show a blob as an HTML page.
#
# The blob is taken from the global $hash or, when that is undefined,
# looked up by $file_name in $hash_base (or in the project's head).
# Blobs that are neither text/* nor gif/png/jpeg images and test as
# binary (-B) are handed over to git_blob_plain().  Images are embedded
# with an <img> tag pointing at the blob_plain view; everything else is
# printed line by line with line-number anchors, run through the
# highlighter when guess_file_syntax() returns a syntax.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">$hash</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                # The file name comes from the repository contents and ends
                # up inside attribute values, so it must be escaped; the
                # mimetype is escaped too for good measure.
                print qq!<img type="! . $cgi->escapeHTML($mimetype) . qq!"!;
                if ($file_name) {
                        my $name_attr = $cgi->escapeHTML($file_name);
                        print qq! alt="$name_attr" title="$name_attr"!;
                }
                print qq! src="! .
                      href(action=>"blob_plain", hash=>$hash,
                           hash_base=>$hash_base, file_name=>$file_name) .
                      qq!" />\n!;
        } else {
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # highlighted output is printed as is, plain text
                        # is escaped here
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, href(-replay => 1), $nr, $nr, $syntax ? $line : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
5653
# Show the 'tree' view: an HTML table listing the entries of one tree object.
#
# Works on request globals rather than on arguments:
#   $hash_base - commit-ish the tree belongs to; defaults to "HEAD"
#   $hash      - tree to list; when unset it is looked up from
#                $hash_base + $file_name, or falls back to $hash_base
#   $file_name - path of the tree inside $hash_base, if any
#
# Calls die_error() with 404 when no tree can be determined or reading the
# git-ls-tree output fails, and with 500 when git-ls-tree cannot be started.
sub git_tree {
	if (!defined $hash_base) {
		$hash_base = "HEAD";
	}
	if (!defined $hash) {
		if (defined $file_name) {
			$hash = git_get_hash_by_path($hash_base, $file_name, "tree");
		} else {
			$hash = $hash_base;
		}
	}
	die_error(404, "No such tree") unless defined($hash);

	my $show_sizes = gitweb_check_feature('show-sizes');
	my $have_blame = gitweb_check_feature('blame');

	my @entries = ();
	{
		# 'ls-tree -z' terminates every entry with NUL, so read NUL-separated
		# records; the change of $/ is confined to this block.
		local $/ = "\0";
		open my $fd, "-|", git_cmd(), "ls-tree", '-z',
			($show_sizes ? '-l' : ()), @extra_options, $hash
			or die_error(500, "Open git-ls-tree failed");
		@entries = map { chomp; $_ } <$fd>;
		close $fd
			or die_error(404, "Reading tree failed");
	}

	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $hash_base);
	git_header_html();
	my $basedir = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		my @views_nav = ();
		if (defined $file_name) {
			push @views_nav,
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history"),
				$cgi->a({-href => href(action=>"tree",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		}
		my $snapshot_links = format_snapshot_links($hash);
		if (defined $snapshot_links) {
			# FIXME: Should be available when we have no hash base as well.
			push @views_nav, $snapshot_links;
		}
		git_print_page_nav('tree','', $hash_base, undef, undef,
		                   join(' | ', @views_nav));
		git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
	} else {
		# $hash_base did not parse as a commit: forget it, so that the code
		# below does not generate links relative to it.
		undef $hash_base;
		print "<div class=\"page_nav\">\n";
		print "<br/><br/></div>\n";
		# $hash comes from the request, so it must be escaped before it is
		# embedded in the page.
		print "<div class=\"title\">" . esc_html($hash) . "</div>\n";
	}
	if (defined $file_name) {
		$basedir = $file_name;
		if ($basedir ne '' && substr($basedir, -1) ne '/') {
			$basedir .= '/';
		}
		git_print_page_path($file_name, 'tree', $hash_base);
	}
	print "<div class=\"page_body\">\n";
	print "<table class=\"tree\">\n";
	# rows alternate between the "dark" and "light" classes, starting dark
	my $alternate = 1;
	# '..' (top directory) link if possible
	if (defined $hash_base &&
	    defined $file_name && $file_name =~ m![^/]+$!) {
		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		# strip the last path component to get the parent directory
		my $up = $file_name;
		$up =~ s!/?[^/]+$!!;
		# An empty parent means the top-level tree.  Compare against ''
		# instead of testing truth, so a directory named "0" is kept.
		undef $up if $up eq '';
		# based on git_print_tree_entry
		print '<td class="mode">' . mode_str('040000') . "</td>\n";
		print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
		print '<td class="list">';
		print $cgi->a({-href => href(action=>"tree",
		                             hash_base=>$hash_base,
		                             file_name=>$up)},
		              "..");
		print "</td>\n";
		print "<td class=\"link\"></td>\n";

		print "</tr>\n";
	}
	foreach my $line (@entries) {
		my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

		print "</tr>\n";
	}
	print "</table>\n" .
	      "</div>";
	git_footer_html();
}
5763
# Build the base name used for a snapshot of $hash in $project, in the form
# "<project>-<version>".
#
# Parameters:
#   $project - project path; a trailing ".git" or "/.git" and any leading
#              directories are dropped, control characters become '?'
#   $hash    - revision to snapshot: (abbreviated) hex object name or ref name
#
# Returns the name in scalar context and the pair (name, name) in list
# context, which callers can unpack as ($name, $prefix).
sub snapshot_name {
	my ($project, $hash) = @_;

	# path/to/project.git  -> project
	# path/to/project/.git -> project
	my $base = to_utf8($project);
	$base =~ s,([^/])/*\.git$,$1,;
	$base = basename($base);
	# replace control characters, which do not belong in a file name
	$base =~ s/[[:cntrl:]]/?/g;

	my $label = $hash;
	if ($hash =~ /^[0-9a-fA-F]+$/) {
		# looks like an object name: use the short hash, but only when
		# $hash is a prefix of the full hash and longer than 7 characters
		my $expanded = git_get_full_hash($project, $hash);
		$label = git_get_short_hash($project, $hash)
			if ($expanded =~ /^$hash/ && length($hash) > 7);
	} elsif ($hash =~ m!^refs/tags/(.*)$!) {
		# a tag name is used as is, without a hash suffix
		$label = $1;
	} else {
		# branches and everything else get the short hash appended
		$label = $1
			if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!);
		$label .= '-' . git_get_short_hash($project, $hash);
	}
	# hierarchical ref names: turn '/' into '.'
	$label =~ tr!/!.!;

	my $snapshot = "$base-$label";

	return ($snapshot, $snapshot) if wantarray;
	return $snapshot;
}
5800
# Handle the 'snapshot' action: send an archive of $hash produced by
# "git archive", optionally piped through the compressor of the format.
#
# Inputs are request globals: $input_params{'snapshot_format'} (defaults to
# the first entry of @snapshot_fmts), $hash and $project.
#
# Calls die_error() with
#   403 - snapshots are disabled, or the format is disabled/unsupported
#   400 - the format is malformed or unknown, or the object is a blob
#   404 - the object does not exist
#   500 - the archive command cannot be started
sub git_snapshot {
	my $format = $input_params{'snapshot_format'};
	if (!@snapshot_fmts) {
		die_error(403, "Snapshots not allowed");
	}
	# default to first supported snapshot format
	$format ||= $snapshot_fmts[0];
	if ($format !~ m/^[a-z0-9]+$/) {
		die_error(400, "Invalid snapshot format parameter");
	} elsif (!exists($known_snapshot_formats{$format})) {
		die_error(400, "Unknown snapshot format");
	} elsif ($known_snapshot_formats{$format}{'disabled'}) {
		die_error(403, "Snapshot format not allowed");
	} elsif (!grep($_ eq $format, @snapshot_fmts)) {
		die_error(403, "Unsupported snapshot format");
	}

	# "^{}" peels tags, so the type is that of the object finally pointed to
	my $type = git_get_type("$hash^{}");
	if (!$type) {
		die_error(404, 'Object does not exist');
	}  elsif ($type eq 'blob') {
		die_error(400, 'Object is not a tree-ish');
	}

	my ($name, $prefix) = snapshot_name($project, $hash);
	my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
	my $cmd = quote_command(
		git_cmd(), 'archive',
		"--format=$known_snapshot_formats{$format}{'format'}",
		"--prefix=$prefix/", $hash);
	if (exists $known_snapshot_formats{$format}{'compressor'}) {
		$cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
	}

	# backslash-escape '"' and '\' for the quoted filename="..." parameter
	$filename =~ s/(["\\])/\\$1/g;
	print $cgi->header(
		-type => $known_snapshot_formats{$format}{'type'},
		-content_disposition => 'inline; filename="' . $filename . '"',
		-status => '200 OK');

	open my $fd, "-|", $cmd
		or die_error(500, "Execute git-archive failed");
	# the archive is binary data: send it without the utf8 output layer
	binmode STDOUT, ':raw';
	{
		# Copy the archive in fixed-size records.  The data is binary, so
		# reading "lines" is meaningless, and slurping everything before
		# printing would hold the whole archive in memory.
		local $/ = \65536;
		while (my $chunk = <$fd>) {
			print $chunk;
		}
	}
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
5848
# Common driver for log-like views: fetches one page of commits and prints
# the page header, navigation and footer around a caller-supplied body.
#
# Parameters:
#   $fmt_name  - name of the view, passed to the paging and page navigation
#   $body_subr - code reference that prints the commits; it is called as
#                $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                             $file_name, $file_hash, $ftype)
#   $base      - revision to start from; defaults to the project's head
#   $parent    - optional; when given, the range "$parent..$base" is shown
#   $file_name - optional path to limit history to (adds --full-history)
#   $file_hash - optional object name of that path; searched for in the
#                listed commits when not given
#
# Pages hold 100 commits; 101 are requested so that the presence of a next
# page can be detected.  The global $page is set to 0 when undefined.
sub git_log_generic {
	my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

	my $head = git_get_head_hash($project);
	$base = $head unless defined $base;
	$page = 0 unless defined $page;
	my $refs = git_get_references();

	my $revspec = defined $parent ? "$parent..$base" : $base;
	my @path_limit = defined $file_name ? ($file_name, "--full-history") : ();
	my @commitlist =
		parse_commits($revspec, 101, (100 * $page), @path_limit);

	my $ftype;
	if (!defined $file_hash && defined $file_name) {
		# some commits could have deleted file in question,
		# and not have it in tree, but one of them has to have it
		foreach my $commit (@commitlist) {
			$file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
			last if defined $file_hash;
		}
	}
	$ftype = git_get_type($file_hash)
		if defined $file_hash;
	die_error(500, "Unknown type of object")
		if (defined $file_name && !defined $ftype);

	my %co;
	if (defined $file_name) {
		%co = parse_commit($base)
			or die_error(404, "Unknown commit object");
	}

	# a 101st commit means there is at least one more page
	my $has_more = $#commitlist >= 100;
	my $paging_nav = format_paging_nav($fmt_name, $page, $has_more);
	my $next_link = '';
	if ($has_more) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
	}

	# offer the 'patches' link only for unrestricted history and only when
	# the commits shown do not exceed the configured limit (negative limit
	# always qualifies)
	my $patch_max = gitweb_get_feature('patches');
	if ($patch_max && !defined $file_name &&
	    ($patch_max < 0 || @commitlist <= $patch_max)) {
		$paging_nav .= " &sdot; " .
			$cgi->a({-href => href(action=>"patches", -replay=>1)},
			        "patches");
	}

	git_header_html();
	git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
	if (defined $file_name) {
		git_print_header_div('commit', esc_html($co{'title'}), $base);
		git_print_page_path($file_name, $ftype, $hash_base);
	} else {
		git_print_header_div('summary', $project);
	}

	$body_subr->(\@commitlist, 0, 99, $refs, $next_link,
	             $file_name, $file_hash, $ftype);

	git_footer_html();
}
5922
# Handle the 'log' action: git_log_generic() with git_log_body() as the
# body printer, starting at $hash and, if set, limited by $hash_parent.
sub git_log {
	my @range = ($hash, $hash_parent);
	git_log_generic('log', \&git_log_body, @range);
}
5927
# Handle the 'commit' action: show one commit with its authorship, tree and
# parent links, the log message, and the list of files it changed.
#
# The commit is taken from the global $hash, falling back to $hash_base and
# then "HEAD".  Calls die_error() with 404 when the commit cannot be parsed
# or reading the git-diff-tree output fails, and with 500 when git-diff-tree
# cannot be started.
sub git_commit {
	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
	    or die_error(404, "Unknown commit object");

	my $parent  = $co{'parent'};
	my $parents = $co{'parents'}; # listref

	# link to the 'commit' view of $id, labelled with its first 7 characters
	my $short_commit_link = sub {
		my ($id) = @_;
		return $cgi->a({-href => href(action=>"commit",
		                              hash=>$id)},
		               esc_html(substr($id, 0, 7)));
	};

	# we need to prepare $formats_nav before any parameter munging
	my $formats_nav;
	if (!defined $parent) {
		# --root commitdiff
		$formats_nav = '(initial)';
	} elsif (@$parents == 1) {
		# single parent commit
		$formats_nav = '(parent: ' . $short_commit_link->($parent) . ')';
	} else {
		# merge commit
		$formats_nav = '(merge: ' .
			join(' ', map { $short_commit_link->($_) } @$parents) .
			')';
	}
	if (gitweb_check_feature('patches') && @$parents <= 1) {
		$formats_nav .= " | " .
			$cgi->a({-href => href(action=>"patch", -replay=>1)},
			        "patch");
	}

	# what to diff against: the only parent, --root for a parentless commit,
	# or -c for a merge
	my $diff_against =
		@$parents <= 1 ? (defined $parent ? $parent : "--root") : '-c';
	open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
		@diff_opts,
		$diff_against,
		$hash, "--"
		or die_error(500, "Open git-diff-tree failed");
	chomp(my @difftree = <$fd>);
	close $fd or die_error(404, "Reading git-diff-tree failed");

	# non-textual hash id's can be cached
	my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $co{'id'});

	git_header_html(undef, $expires);
	git_print_page_nav('commit', '',
	                   $hash, $co{'tree'}, $hash,
	                   $formats_nav);

	# the header links to the commitdiff, or to the tree for a root commit
	my $title = esc_html($co{'title'}) . $ref;
	my @header_args = defined $co{'parent'}
		? ('commitdiff', $title, $hash)
		: ('tree', $title, $co{'tree'}, $hash);
	git_print_header_div(@header_args);

	print qq(<div class="title_text">\n) .
	      qq(<table class="object_header">\n);
	git_print_authorship_rows(\%co);
	print qq(<tr><td>commit</td><td class="sha1">$co{'id'}</td></tr>\n);

	# tree row; its last cell stays open for the optional snapshot links
	my $tree_row =
		"<tr>" .
		"<td>tree</td>" .
		qq(<td class="sha1">) .
		$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
		         class => "list"}, $co{'tree'}) .
		"</td>" .
		qq(<td class="link">) .
		$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
		        "tree");
	print $tree_row;
	my $snapshot_links = format_snapshot_links($hash);
	print " | " . $snapshot_links
		if defined $snapshot_links;
	print "</td>" .
	      "</tr>\n";

	# one row per parent, with links to the parent and to the diff against it
	for my $par (@$parents) {
		my $parent_row =
			"<tr>" .
			"<td>parent</td>" .
			qq(<td class="sha1">) .
			$cgi->a({-href => href(action=>"commit", hash=>$par),
			         class => "list"}, $par) .
			"</td>" .
			qq(<td class="link">) .
			$cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit") .
			" | " .
			$cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
			"</td>" .
			"</tr>\n";
		print $parent_row;
	}
	print "</table>".
	      "</div>\n";

	print qq(<div class="page_body">\n);
	git_print_log($co{'comment'});
	print "</div>\n";

	git_difftree_body(\@difftree, $hash, @$parents);

	git_footer_html();
}
6041
# Handle the 'object' action: find out the type of the requested object and
# redirect (302) to the view named after that type.
#
# The object is given through request globals, either as
#   - $hash or $hash_base alone, or
#   - $hash_base together with $file_name (a path inside that revision).
#
# Calls die_error() with 404 when the object, the base object or the path
# does not exist, 400 when too little information was supplied, and 500
# when git-ls-tree cannot be started.
sub git_object {
	# object is defined by:
	# - hash or hash_base alone
	# - hash_base and file_name
	my $type;

	# - hash or hash_base alone
	if ($hash || ($hash_base && !defined $file_name)) {
		my $object_id = $hash || $hash_base;

		open my $fd, "-|", quote_command(
			git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
			or die_error(404, "Object does not exist");
		$type = <$fd>;
		# cat-file prints nothing for a missing object (its stderr is
		# discarded), leaving $type undefined; do not chomp undef
		chomp $type if defined $type;
		close $fd
			or die_error(404, "Object does not exist");
		# never redirect to an undefined action
		defined $type
			or die_error(404, "Object does not exist");

	# - hash_base and file_name
	} elsif ($hash_base && defined $file_name) {
		# drop trailing slashes from the path
		$file_name =~ s,/+$,,;

		system(git_cmd(), "cat-file", '-e', $hash_base) == 0
			or die_error(404, "Base object does not exist");

		# here errors should not happen
		open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
			or die_error(500, "Open git-ls-tree failed");
		my $line = <$fd>;
		close $fd;

		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
		unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
			die_error(404, "File or directory for given base does not exist");
		}
		$type = $2;
		$hash = $3;
	} else {
		die_error(400, "Not enough information to find object");
	}

	print $cgi->redirect(-uri => href(action=>$type, -full=>1,
	                                  hash=>$hash, hash_base=>$hash_base,
	                                  file_name=>$file_name),
	                     -status => '302 Found');
}
6088
# Handle the 'blobdiff' action: show how a single file differs between two
# commits.
#
# Parameter:
#   $format - 'html' (default) for a full page, 'plain' for a text patch
#
# The diff is selected through request globals: $hash_base and
# $hash_parent_base name the two commits, and the file is given either by
# $file_name (optionally $file_parent for the old name) or by the full
# 40-hex id of the new blob in $hash.  Values found in the raw diff fill in
# whichever of $file_parent, $file_name, $hash_parent, $hash are unset.
#
# Calls die_error() with
#   400 - parameters are missing or ambiguous, or $format is unknown
#   404 - the diff cannot be read or found, or no commits were given
#   500 - git-diff-tree cannot be started
sub git_blobdiff {
	my $format = shift || 'html';

	my $fd;
	my @difftree;
	my %diffinfo;
	my $expires;

	# preparing $fd and %diffinfo for git_patchset_body
	# new style URI
	if (defined $hash_base && defined $hash_parent_base) {
		if (defined $file_name) {
			# read raw output
			open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
				$hash_parent_base, $hash_base,
				"--", (defined $file_parent ? $file_parent : ()), $file_name
				or die_error(500, "Open git-diff-tree failed");
			@difftree = map { chomp; $_ } <$fd>;
			close $fd
				or die_error(404, "Reading git-diff-tree failed");
			@difftree
				or die_error(404, "Blob diff not found");

		} elsif (defined $hash &&
		         $hash =~ /^[0-9a-fA-F]{40}$/) {
			# try to find filename from $hash

			# The check above is anchored: $hash is interpolated into the
			# regex below, so it must be nothing but a full hex object id.

			# read filtered raw output
			open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
				$hash_parent_base, $hash_base, "--"
				or die_error(500, "Open git-diff-tree failed");
			@difftree =
				# ':100644 100644 03b21826... 3b93d5e7... M	ls-files.c'
				# $hash == to_id
				grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
				map { chomp; $_ } <$fd>;
			close $fd
				or die_error(404, "Reading git-diff-tree failed");
			@difftree
				or die_error(404, "Blob diff not found");

		} else {
			die_error(400, "Missing one of the blob diff parameters");
		}

		if (@difftree > 1) {
			die_error(400, "Ambiguous blob diff specification");
		}

		%diffinfo = parse_difftree_raw_line($difftree[0]);
		$file_parent ||= $diffinfo{'from_file'} || $file_name;
		$file_name   ||= $diffinfo{'to_file'};

		$hash_parent ||= $diffinfo{'from_id'};
		$hash        ||= $diffinfo{'to_id'};

		# non-textual hash id's can be cached
		if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
		    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
			$expires = '+1d';
		}

		# open patch output
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			'-p', ($format eq 'html' ? "--full-index" : ()),
			$hash_parent_base, $hash_base,
			"--", (defined $file_parent ? $file_parent : ()), $file_name
			or die_error(500, "Open git-diff-tree failed");
	}

	# old/legacy style URI -- not generated anymore since 1.4.3.
	if (!%diffinfo) {
		# numeric status code, as in every other die_error() call
		die_error(404, "Missing one of the blob diff parameters");
	}

	# header
	if ($format eq 'html') {
		my $formats_nav =
			$cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
			        "raw");
		git_header_html(undef, $expires);
		if (defined $hash_base && (my %co = parse_commit($hash_base))) {
			git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
			git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
		} else {
			print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
			# both ids may come straight from the request: escape them
			print "<div class=\"title\">" .
			      esc_html("$hash vs $hash_parent") . "</div>\n";
		}
		if (defined $file_name) {
			git_print_page_path($file_name, "blob", $hash_base);
		} else {
			print "<div class=\"page_path\"></div>\n";
		}

	} elsif ($format eq 'plain') {
		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => 'inline; filename="' . "$file_name" . '.patch"');

		print "X-Git-Url: " . $cgi->self_url() . "\n\n";

	} else {
		die_error(400, "Unknown blobdiff format");
	}

	# patch
	if ($format eq 'html') {
		print "<div class=\"page_body\">\n";

		git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
		close $fd;

		print "</div>\n"; # class="page_body"
		git_footer_html();

	} else {
		# In the patch header (everything up to the '+++' line) replace
		# object ids used as file names by the real file names.  The ids
		# are quoted with \Q..\E so they are matched literally.
		while (my $line = <$fd>) {
			$line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
			$line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

			print $line;

			last if $line =~ m!^\+\+\+!;
		}
		# the rest of the patch is passed through unchanged
		local $/ = undef;
		print <$fd>;
		close $fd;
	}
}
6220
# Handle the 'blobdiff_plain' action: git_blobdiff() in 'plain' format.
sub git_blobdiff_plain {
	my $format = 'plain';
	return git_blobdiff($format);
}
6224
6225 sub git_commitdiff {
6226         my %params = @_;
6227         my $format = $params{-format} || 'html';
6228
6229         my ($patch_max) = gitweb_get_feature('patches');
6230         if ($format eq 'patch') {
6231                 die_error(403, "Patch view not allowed") unless $patch_max;
6232         }
6233
6234         $hash ||= $hash_base || "HEAD";
6235         my %co = parse_commit($hash)
6236             or die_error(404, "Unknown commit object");
6237
6238         # choose format for commitdiff for merge
6239         if (! defined $hash_parent && @{$co{'parents'}} > 1) {
6240                 $hash_parent = '--cc';
6241         }
6242         # we need to prepare $formats_nav before almost any parameter munging
6243         my $formats_nav;
6244         if ($format eq 'html') {
6245                 $formats_nav =
6246                         $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
6247                                 "raw");
6248                 if ($patch_max && @{$co{'parents'}} <= 1) {
6249                         $formats_nav .= " | " .
6250                                 $cgi->a({-href => href(action=>"patch", -replay=>1)},
6251                                         "patch");
6252                 }
6253
6254                 if (defined $hash_parent &&
6255                     $hash_parent ne '-c' && $hash_parent ne '--cc') {
6256                         # commitdiff with two commits given
6257                         my $hash_parent_short = $hash_parent;
6258                         if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
6259                                 $hash_parent_short = substr($hash_parent, 0, 7);
6260                         }
6261                         $formats_nav .=
6262                                 ' (from';
6263                         for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
6264                                 if ($co{'parents'}[$i] eq $hash_parent) {
6265                                         $formats_nav .= ' parent ' . ($i+1);
6266                                         last;
6267                                 }
6268                         }
6269                         $formats_nav .= ': ' .
6270                                 $cgi->a({-href => href(action=>"commitdiff",
6271                                                        hash=>$hash_parent)},
6272                                         esc_html($hash_parent_short)) .
6273                                 ')';
6274                 } elsif (!$co{'parent'}) {
6275                         # --root commitdiff
6276                         $formats_nav .= ' (initial)';
6277                 } elsif (scalar @{$co{'parents'}} == 1) {
6278                         # single parent commit
6279                         $formats_nav .=
6280                                 ' (parent: ' .
6281                                 $cgi->a({-href => href(action=>"commitdiff",
6282                                                        hash=>$co{'parent'})},
6283                                         esc_html(substr($co{'parent'}, 0, 7))) .
6284                                 ')';
6285                 } else {
6286                         # merge commit
6287                         if ($hash_parent eq '--cc') {
6288                                 $formats_nav .= ' | ' .
6289                                         $cgi->a({-href => href(action=>"commitdiff",
6290                                                                hash=>$hash, hash_parent=>'-c')},
6291                                                 'combined');
6292                         } else { # $hash_parent eq '-c'
6293                                 $formats_nav .= ' | ' .
6294                                         $cgi->a({-href => href(action=>"commitdiff",
6295                                                                hash=>$hash, hash_parent=>'--cc')},
6296                                                 'compact');
6297                         }
6298                         $formats_nav .=
6299                                 ' (merge: ' .
6300                                 join(' ', map {
6301                                         $cgi->a({-href => href(action=>"commitdiff",
6302                                                                hash=>$_)},
6303                                                 esc_html(substr($_, 0, 7)));
6304                                 } @{$co{'parents'}} ) .
6305                                 ')';
6306                 }
6307         }
6308
6309         my $hash_parent_param = $hash_parent;
6310         if (!defined $hash_parent_param) {
6311                 # --cc for multiple parents, --root for parentless
6312                 $hash_parent_param =
6313                         @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
6314         }
6315
6316         # read commitdiff
6317         my $fd;
6318         my @difftree;
6319         if ($format eq 'html') {
6320                 open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
6321                         "--no-commit-id", "--patch-with-raw", "--full-index",
6322                         $hash_parent_param, $hash, "--"
6323                         or die_error(500, "Open git-diff-tree failed");
6324
6325                 while (my $line = <$fd>) {
6326                         chomp $line;
6327                         # empty line ends raw part of diff-tree output
6328                         last unless $line;
6329                         push @difftree, scalar parse_difftree_raw_line($line);
6330                 }
6331
6332         } elsif ($format eq 'plain') {
6333                 open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
6334                         '-p', $hash_parent_param, $hash, "--"
6335                         or die_error(500, "Open git-diff-tree failed");
6336         } elsif ($format eq 'patch') {
6337                 # For commit ranges, we limit the output to the number of
6338                 # patches specified in the 'patches' feature.
6339                 # For single commits, we limit the output to a single patch,
6340                 # diverging from the git-format-patch default.
6341                 my @commit_spec = ();
6342                 if ($hash_parent) {
6343                         if ($patch_max > 0) {
6344                                 push @commit_spec, "-$patch_max";
6345                         }
6346                         push @commit_spec, '-n', "$hash_parent..$hash";
6347                 } else {
6348                         if ($params{-single}) {
6349                                 push @commit_spec, '-1';
6350                         } else {
6351                                 if ($patch_max > 0) {
6352                                         push @commit_spec, "-$patch_max";
6353                                 }
6354                                 push @commit_spec, "-n";
6355                         }
6356                         push @commit_spec, '--root', $hash;
6357                 }
6358                 open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
6359                         '--encoding=utf8', '--stdout', @commit_spec
6360                         or die_error(500, "Open git-format-patch failed");
6361         } else {
6362                 die_error(400, "Unknown commitdiff format");
6363         }
6364
6365         # non-textual hash id's can be cached
6366         my $expires;
6367         if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
6368                 $expires = "+1d";
6369         }
6370
6371         # write commit message
6372         if ($format eq 'html') {
6373                 my $refs = git_get_references();
6374                 my $ref = format_ref_marker($refs, $co{'id'});
6375
6376                 git_header_html(undef, $expires);
6377                 git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
6378                 git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
6379                 print "<div class=\"title_text\">\n" .
6380                       "<table class=\"object_header\">\n";
6381                 git_print_authorship_rows(\%co);
6382                 print "</table>".
6383                       "</div>\n";
6384                 print "<div class=\"page_body\">\n";
6385                 if (@{$co{'comment'}} > 1) {
6386                         print "<div class=\"log\">\n";
6387                         git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
6388                         print "</div>\n"; # class="log"
6389                 }
6390
6391         } elsif ($format eq 'plain') {
6392                 my $refs = git_get_references("tags");
6393                 my $tagname = git_get_rev_name_tags($hash);
6394                 my $filename = basename($project) . "-$hash.patch";
6395
6396                 print $cgi->header(
6397                         -type => 'text/plain',
6398                         -charset => 'utf-8',
6399                         -expires => $expires,
6400                         -content_disposition => 'inline; filename="' . "$filename" . '"');
6401                 my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
6402                 print "From: " . to_utf8($co{'author'}) . "\n";
6403                 print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
6404                 print "Subject: " . to_utf8($co{'title'}) . "\n";
6405
6406                 print "X-Git-Tag: $tagname\n" if $tagname;
6407                 print "X-Git-Url: " . $cgi->self_url() . "\n\n";
6408
6409                 foreach my $line (@{$co{'comment'}}) {
6410                         print to_utf8($line) . "\n";
6411                 }
6412                 print "---\n\n";
6413         } elsif ($format eq 'patch') {
6414                 my $filename = basename($project) . "-$hash.patch";
6415
6416                 print $cgi->header(
6417                         -type => 'text/plain',
6418                         -charset => 'utf-8',
6419                         -expires => $expires,
6420                         -content_disposition => 'inline; filename="' . "$filename" . '"');
6421         }
6422
6423         # write patch
6424         if ($format eq 'html') {
6425                 my $use_parents = !defined $hash_parent ||
6426                         $hash_parent eq '-c' || $hash_parent eq '--cc';
6427                 git_difftree_body(\@difftree, $hash,
6428                                   $use_parents ? @{$co{'parents'}} : $hash_parent);
6429                 print "<br/>\n";
6430
6431                 git_patchset_body($fd, \@difftree, $hash,
6432                                   $use_parents ? @{$co{'parents'}} : $hash_parent);
6433                 close $fd;
6434                 print "</div>\n"; # class="page_body"
6435                 git_footer_html();
6436
6437         } elsif ($format eq 'plain') {
6438                 local $/ = undef;
6439                 print <$fd>;
6440                 close $fd
6441                         or print "Reading git-diff-tree failed\n";
6442         } elsif ($format eq 'patch') {
6443                 local $/ = undef;
6444                 print <$fd>;
6445                 close $fd
6446                         or print "Reading git-format-patch failed\n";
6447         }
6448 }
6449
# Action handler for the plain-text commitdiff view: delegates all work
# to git_commitdiff, selecting its 'plain' output format.
sub git_commitdiff_plain {
        return git_commitdiff('-format', 'plain');
}
6453
6454 # format-patch-style patches
# Action handler for a single format-patch-style patch: delegates to
# git_commitdiff with the 'patch' format and the -single flag set.
sub git_patch {
        return git_commitdiff(
                '-format', 'patch',
                '-single', 1,
        );
}
6458
# Action handler for a format-patch-style patch series: delegates to
# git_commitdiff with the 'patch' format (no -single restriction).
sub git_patches {
        return git_commitdiff('-format', 'patch');
}
6462
# Action handler for the 'history' view: hands the request over to
# git_log_generic, using git_history_body as the body renderer and the
# global base/parent-base hashes, file name and object hash as arguments.
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
}
6468
# Action handler for the 'search' action.
#
# Reads the global request parameters $searchtext, $searchtype, $hash,
# $page and $search_use_regexp and prints a complete HTML page with the
# search results.  Supported search types:
#
#   commit / author / committer - match commit metadata via parse_commits,
#                                 paginated 100 results per page
#   pickaxe                     - commits that added/removed the text
#                                 (git log -S), if the feature is enabled
#   grep                        - file contents of the commit's tree
#                                 (git grep), if the feature is enabled
#
# Dies via die_error with 403 when search (or the requested search type)
# is disabled, 400 when no search text was given and 404 when $hash does
# not name a known commit.
sub git_search {
        gitweb_check_feature('search') or die_error(403, "Search is disabled");
        if (!defined $searchtext) {
                die_error(400, "Text field is empty");
        }
        if (!defined $hash) {
                $hash = git_get_head_hash($project);
        }
        my %co = parse_commit($hash);
        if (!%co) {
                die_error(404, "Unknown commit object");
        }
        if (!defined $page) {
                $page = 0;
        }

        $searchtype ||= 'commit';
        if ($searchtype eq 'pickaxe') {
                # pickaxe may take all resources of your box and run for several minutes
                # with every query - so decide by yourself how public you make this feature
                gitweb_check_feature('pickaxe')
                    or die_error(403, "Pickaxe is disabled");
        }
        if ($searchtype eq 'grep') {
                gitweb_check_feature('grep')
                    or die_error(403, "Grep is disabled");
        }

        git_header_html();

        if ($searchtype eq 'commit' or $searchtype eq 'author' or $searchtype eq 'committer') {
                my $greptype;
                if ($searchtype eq 'commit') {
                        $greptype = "--grep=";
                } elsif ($searchtype eq 'author') {
                        $greptype = "--author=";
                } elsif ($searchtype eq 'committer') {
                        $greptype = "--committer=";
                }
                $greptype .= $searchtext;
                # ask for one commit more than a page holds, so that we can
                # tell whether a "next" page exists
                my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                               $greptype, '--regexp-ignore-case',
                                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

                my $paging_nav = '';
                if ($page > 0) {
                        $paging_nav .=
                                $cgi->a({-href => href(action=>"search", hash=>$hash,
                                                       searchtext=>$searchtext,
                                                       searchtype=>$searchtype)},
                                        "first");
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                } else {
                        $paging_nav .= "first";
                        $paging_nav .= " &sdot; prev";
                }
                my $next_link = '';
                if ($#commitlist >= 100) {
                        $next_link =
                                $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                         -accesskey => "n", -title => "Alt-n"}, "next");
                        $paging_nav .= " &sdot; $next_link";
                } else {
                        $paging_nav .= " &sdot; next";
                }

                git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);
                if ($page == 0 && !@commitlist) {
                        print "<p>No match.</p>\n";
                } else {
                        git_search_grep_body(\@commitlist, 0, 99, $next_link);
                }
        }

        if ($searchtype eq 'pickaxe') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"pickaxe search\">\n";
                my $alternate = 1;
                local $/ = "\n";
                open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                        '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                        ($search_use_regexp ? '--pickaxe-regex' : ());
                # from here on %co holds the commit whose table row is
                # currently open (empty until the first commit is seen)
                undef %co;

                # closes the file-list cell and the table row of the commit
                # currently held in %co, adding the "commit | tree" links
                my $finish_commit_row = sub {
                        print "</td>\n" .
                              "<td class=\"link\">" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                              " | " .
                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                        print "</td>\n" .
                              "</tr>\n";
                };

                while (my $line = <$fd>) {
                        chomp $line;
                        next unless $line;

                        my %set = parse_difftree_raw_line($line);
                        if (defined $set{'commit'}) {
                                # a new commit starts: finish the previous one first
                                $finish_commit_row->() if %co;

                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                %co = parse_commit($set{'commit'});
                                my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                                      "<td><i>$author</i></td>\n" .
                                      "<td>" .
                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                              -class => "list subject"},
                                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        } elsif (defined $set{'to_id'}) {
                                # skip deleted files: there is no blob to link to
                                next if ($set{'to_id'} =~ m/^0{40}$/);

                                # NOTE(review): 'file' appears not to be set for every
                                # kind of raw diff line (git_feed falls back to
                                # 'to_file' as well), so do the same here
                                my $shown_file = defined $set{'file'} ? $set{'file'} : $set{'to_file'};

                                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                              -class => "list"},
                                              "<span class=\"match\">" . esc_path($shown_file) . "</span>") .
                                      "<br/>\n";
                        }
                }
                close $fd;

                # finish last commit
                $finish_commit_row->() if %co;

                print "</table>\n";
        }

        if ($searchtype eq 'grep') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"grep_search\">\n";
                my $alternate = 1;
                my $matches = 0;
                local $/ = "\n";
                open my $fd, "-|", git_cmd(), 'grep', '-n',
                        $search_use_regexp ? ('-E', '-i') : '-F',
                        $searchtext, $co{'tree'};
                my $lastfile = '';
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($file, $lno, $ltext, $binary);
                        # trim the listing once more than 1000 lines were read
                        last if ($matches++ > 1000);
                        if ($line =~ /^Binary file (.+) matches$/) {
                                $file = $1;
                                # the path is prefixed with "<tree>:" just like in the
                                # textual case below; strip it to get the bare file name
                                $file =~ s/^\Q$co{'tree'}\E://;
                                $binary = 1;
                        } else {
                                # output format is <tree>:<file>:<line number>:<text>
                                (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
                        }
                        if ($file ne $lastfile) {
                                $lastfile and print "</td></tr>\n";
                                # alternate row colours per file (same scheme as pickaxe)
                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                # link to the file as of the searched commit
                                print "<td class=\"list\">".
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file"),
                                                -class => "list"}, esc_path($file));
                                print "</td><td>\n";
                                $lastfile = $file;
                        }
                        if ($binary) {
                                print "<div class=\"binary\">Binary file</div>\n";
                        } else {
                                $ltext = untabify($ltext);
                                # highlight the matched part of the line
                                if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                        $ltext = esc_html($1, -nbsp=>1);
                                        $ltext .= '<span class="match">';
                                        $ltext .= esc_html($2, -nbsp=>1);
                                        $ltext .= '</span>';
                                        $ltext .= esc_html($3, -nbsp=>1);
                                } else {
                                        $ltext = esc_html($ltext, -nbsp=>1);
                                }
                                print "<div class=\"pre\">" .
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file").'#l'.$lno,
                                                -class => "linenr"}, sprintf('%4i', $lno))
                                        . ' ' .  $ltext . "</div>\n";
                        }
                }
                if ($lastfile) {
                        print "</td></tr>\n";
                        if ($matches > 1000) {
                                print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                        }
                } else {
                        print "<div class=\"diff nodifferences\">No matches found</div>\n";
                }
                close $fd;

                print "</table>\n";
        }
        git_footer_html();
}
6685
# Action handler printing the static help page for the search form.
# The 'commit', 'author' and 'committer' entries are always shown; the
# 'grep' and 'pickaxe' entries only when the respective feature is
# enabled according to gitweb_check_feature.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general introduction and the 'commit' search type
        print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        # optional: 'grep' search type
        if (gitweb_check_feature('grep')) {
                print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        # 'author' and 'committer' search types
        print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        # optional: 'pickaxe' search type
        if (gitweb_check_feature('pickaxe')) {
                print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
6729
# Action handler for the 'shortlog' view: hands the request over to
# git_log_generic, using git_shortlog_body as the body renderer and the
# global object hash and parent hash as arguments.
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
6734
6735 ## ......................................................................
6736 ## feeds (RSS, Atom; OPML)
6737
# Print a web feed of recent commits for the current project.
#
# Parameter: the feed format, 'rss' or 'atom' (defaults to 'atom'); any
# other value is rejected via die_error(400).
#
# The feed covers $hash (or HEAD when unset), optionally limited to the
# history of $file_name.  The HTTP header carries Last-Modified taken
# from the newest commit; a request with a matching If-Modified-Since
# header is answered with "304 Not Modified", and for a HEAD request only
# the header is sent.  Every entry contains the commit message and the
# list of changed files with links to diff, blame (when that feature is
# enabled) and history.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                %latest_date   = parse_date($latest_epoch);
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # use whichever optional date parsing module is installed;
                        # without one, $since stays undefined and the full feed is sent
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title contains request-supplied data (hash, file name) and is
        # emitted as XML element content, so it has to be escaped
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (!defined $descr) {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        $descr = esc_html($descr);
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                # guard on the variable that is actually printed
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for (my $i = 0; $i <= $#commitlist; $i++) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'});

                # get list of changed files; a commit whose diff cannot be
                # read is silently left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        # print an escaped copy; the comment lines themselves
                        # are left untouched
                        print esc_html($line) . "\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
6993
# Action handler for the RSS feed: git_feed with the 'rss' format.
sub git_rss {
        return git_feed('rss');
}
6997
# Action handler for the Atom feed: git_feed with the 'atom' format.
sub git_atom {
        return git_feed('atom');
}
7001
# Action handler for the OPML export: prints an OPML 1.0 document with
# one <outline> per project returned by git_get_projects_list, each
# pointing at the project's RSS feed (xmlUrl) and summary page (htmlUrl).
# Projects without a resolvable head or whose head commit cannot be
# parsed are left out.
sub git_opml {
        my @list = git_get_projects_list();

        # the site name is free-form configuration text that ends up as
        # XML element content, so escape it
        my $title = esc_html($site_name);

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;
                my $head = git_get_head_hash($proj{'path'});
                if (!defined $head) {
                        next;
                }
                # NOTE(review): presumably parse_commit operates on the repository
                # named by the global $git_dir, hence the assignment - confirm
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                if (!%co) {
                        next;
                }

                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}