gitweb: Add support to Link: tag
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8';
22
23 our $t0 = [ gettimeofday() ];
24 our $number_of_git_cmds = 0;
25
26 BEGIN {
27         CGI->compile() if $ENV{'MOD_PERL'};
28 }
29
30 our $version = "++GIT_VERSION++";
31
32 our ($my_url, $my_uri, $base_url, $path_info, $home_link);
# Compute the URLs gitweb uses to refer to itself for the current request.
#
# Fills in the package globals $my_url, $my_uri, $base_url, $path_info and
# $home_link from the global $cgi object and from the PATH_INFO and
# SCRIPT_NAME environment variables.
sub evaluate_uri {
        our $cgi;

        # full URL and absolute path of the script, as reported by $cgi
        our $my_url = $cgi->url();
        our $my_uri = $cgi->url(-absolute => 1);

        # Base URL for relative URLs in gitweb ($logo, $favicon, ...);
        # needed and used only for URLs with nonempty PATH_INFO.  It starts
        # out as $my_url and is rebuilt below if PATH_INFO had to be stripped.
        our $base_url = $my_url;

        # When the script is used as DirectoryIndex, the URL does not contain
        # the name of the script file itself, and $cgi->url() fails to strip
        # PATH_INFO, so it is stripped by hand here.  $path_info is global
        # because it is also used later on.
        #
        # In the DirectoryIndex case $my_url is also not the full script URL.
        # That is fine for generated links (they keep implying the script
        # name), but it means $my_url cannot serve as base URL, so whenever
        # PATH_INFO had to be stripped the base URL is built from SCRIPT_NAME.
        our $path_info = decode_utf8($ENV{"PATH_INFO"});
        if ($path_info) {
                # $my_uri is only touched when $my_url really ended in PATH_INFO
                my $url_stripped = ($my_url =~ s,\Q$path_info\E$,,);
                my $uri_stripped = $url_stripped && ($my_uri =~ s,\Q$path_info\E$,,);
                if ($uri_stripped && defined $ENV{'SCRIPT_NAME'}) {
                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                }
        }

        # target of the home link on top of all pages
        our $home_link = $my_uri || "/";
}
67
68 # core git executable to use
69 # this can just be "git" if your webserver has a sensible PATH
70 our $GIT = "++GIT_BINDIR++/git";
71
72 # absolute fs-path which will be prepended to the project path
73 #our $projectroot = "/pub/scm";
74 our $projectroot = "++GITWEB_PROJECTROOT++";
75
76 # fs traversing limit for getting project list
77 # the number is relative to the projectroot
78 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
79
80 # string of the home link on top of all pages
81 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
82
83 # name of your site or organization to appear in page titles
84 # replace this with something more descriptive for clearer bookmarks
85 our $site_name = "++GITWEB_SITENAME++"
86                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
87
88 # html snippet to include in the <head> section of each page
89 our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
90 # filename of html text to include at top of each page
91 our $site_header = "++GITWEB_SITE_HEADER++";
92 # html text to include at home page
93 our $home_text = "++GITWEB_HOMETEXT++";
94 # filename of html text to include at bottom of each page
95 our $site_footer = "++GITWEB_SITE_FOOTER++";
96
97 # URI of stylesheets
98 our @stylesheets = ("++GITWEB_CSS++");
99 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
100 our $stylesheet = undef;
101 # URI of GIT logo (72x27 size)
102 our $logo = "++GITWEB_LOGO++";
103 # URI of GIT favicon, assumed to be image/png type
104 our $favicon = "++GITWEB_FAVICON++";
105 # URI of gitweb.js (JavaScript code for gitweb)
106 our $javascript = "++GITWEB_JS++";
107
108 # URI and label (title) of GIT logo link
109 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
110 #our $logo_label = "git documentation";
111 our $logo_url = "http://git-scm.com/";
112 our $logo_label = "git homepage";
113
114 # source of projects list
115 our $projects_list = "++GITWEB_LIST++";
116
117 # the width (in characters) of the projects list "Description" column
118 our $projects_list_description_width = 25;
119
120 # group projects by category on the projects list
121 # (enabled if this variable evaluates to true)
122 our $projects_list_group_categories = 0;
123
124 # default category if none specified
125 # (leave the empty string for no category)
126 our $project_list_default_category = "";
127
128 # default order of projects list
129 # valid values are none, project, descr, owner, and age
130 our $default_projects_order = "project";
131
132 # show repository only if this file exists
133 # (only effective if this variable evaluates to true)
134 our $export_ok = "++GITWEB_EXPORT_OK++";
135
136 # show repository only if this subroutine returns true
137 # when given the path to the project, for example:
138 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
139 our $export_auth_hook = undef;
140
141 # only allow viewing of repositories also shown on the overview page
142 our $strict_export = "++GITWEB_STRICT_EXPORT++";
143
144 # list of git base URLs used for URL to where fetch project from,
145 # i.e. full URL is "$git_base_url/$project"
146 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
147
148 # default blob_plain mimetype and default charset for text/plain blob
149 our $default_blob_plain_mimetype = 'text/plain';
150 our $default_text_plain_charset  = undef;
151
152 # file to use for guessing MIME types before trying /etc/mime.types
153 # (relative to the current git repository)
154 our $mimetypes_file = undef;
155
156 # assume this charset if a line contains non-UTF-8 characters;
157 # it should be a valid encoding (see Encode::Supported(3pm) for the list)
158 # in which all byte sequences are valid, for example
159 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
160 # could even be 'utf-8' for the old behavior)
161 our $fallback_encoding = 'latin1';
162
163 # rename detection options for git-diff and git-diff-tree
164 # - default is '-M', with the cost proportional to
165 #   (number of removed files) * (number of new files).
166 # - more costly is '-C' (which implies '-M'), with the cost proportional to
167 #   (number of changed files + number of removed files) * (number of new files)
168 # - even more costly is '-C', '--find-copies-harder' with cost
169 #   (number of files in the original tree) * (number of new files)
170 # - one might want to include '-B' option, e.g. '-B', '-M'
171 our @diff_opts = ('-M'); # taken from git_commit
172
173 # Disables features that would allow repository owners to inject script into
174 # the gitweb domain.
175 our $prevent_xss = 0;
176
177 # Path to the highlight executable to use (must be the one from
178 # http://www.andre-simon.de due to assumptions about parameters and output).
179 # Useful if highlight is not installed on your webserver's PATH.
180 # [Default: highlight]
181 our $highlight_bin = "++HIGHLIGHT_BIN++";
182
183 # information about snapshot formats that gitweb is capable of serving
184 our %known_snapshot_formats = (
185         # name => {
186         #       'display' => display name,
187         #       'type' => mime type,
188         #       'suffix' => filename suffix,
189         #       'format' => --format for git-archive,
190         #       'compressor' => [compressor command and arguments]
191         #                       (array reference, optional)
192         #       'disabled' => boolean (optional)}
193         #
194         'tgz' => {
195                 'display' => 'tar.gz',
196                 'type' => 'application/x-gzip',
197                 'suffix' => '.tar.gz',
198                 'format' => 'tar',
199                 'compressor' => ['gzip', '-n']},
200
201         'tbz2' => {
202                 'display' => 'tar.bz2',
203                 'type' => 'application/x-bzip2',
204                 'suffix' => '.tar.bz2',
205                 'format' => 'tar',
206                 'compressor' => ['bzip2']},
207
208         'txz' => {
209                 'display' => 'tar.xz',
210                 'type' => 'application/x-xz',
211                 'suffix' => '.tar.xz',
212                 'format' => 'tar',
213                 'compressor' => ['xz'],
214                 'disabled' => 1},
215
216         'zip' => {
217                 'display' => 'zip',
218                 'type' => 'application/x-zip',
219                 'suffix' => '.zip',
220                 'format' => 'zip'},
221 );
222
223 # Aliases so we understand old gitweb.snapshot values in repository
224 # configuration.
225 our %known_snapshot_format_aliases = (
226         'gzip'  => 'tgz',
227         'bzip2' => 'tbz2',
228         'xz'    => 'txz',
229
230         # backward compatibility: legacy gitweb config support
231         'x-gzip' => undef, 'gz' => undef,
232         'x-bzip2' => undef, 'bz2' => undef,
233         'x-zip' => undef, '' => undef,
234 );
235
236 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
237 # are changed, it may be appropriate to change these values too via
238 # $GITWEB_CONFIG.
239 our %avatar_size = (
240         'default' => 16,
241         'double'  => 32
242 );
243
244 # Maximum server load at which we will still respond to gitweb queries.
245 # If the server load exceeds this value, return a "503 server busy" error.
246 # If gitweb cannot determine the server load, it is taken to be 0.
247 # Leave it undefined (or set to 'undef') to turn off load checking.
248 our $maxload = 300;
249
250 # configuration for 'highlight' (http://www.andre-simon.de/)
251 # match by basename
252 our %highlight_basename = (
253         #'Program' => 'py',
254         #'Library' => 'py',
255         'SConstruct' => 'py', # SCons equivalent of Makefile
256         'Makefile' => 'make',
257 );
# match by extension: file extension => name of the 'highlight' syntax
#
# Every map() below is wrapped in its own parentheses on purpose.  map is a
# list operator, so an unparenthesised map would take all the following
# elements of this list as its input and turn every later pair (including
# 'h' => 'c') into an identity mapping.
our %highlight_ext = (
        # main extensions, defining name of syntax;
        # see files in /usr/share/highlight/langDefs/ directory
        (map { $_ => $_ }
                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make)),
        # alternate extensions, see /etc/highlight/filetypes.conf
        'h' => 'c',
        (map { $_ => 'sh'  } qw(bash zsh ksh)),
        (map { $_ => 'cpp' } qw(cxx c++ cc)),
        (map { $_ => 'php' } qw(php3 php4 php5 phps)),
        (map { $_ => 'pl'  } qw(perl pm)), # perhaps also 'cgi'
        (map { $_ => 'make'} qw(mak mk)),
        (map { $_ => 'xml' } qw(xhtml html htm)),
);
273
274 # You define site-wide feature defaults here; override them with
275 # $GITWEB_CONFIG as necessary.
276 our %feature = (
277         # feature => {
278         #       'sub' => feature-sub (subroutine),
279         #       'override' => allow-override (boolean),
280         #       'default' => [ default options...] (array reference)}
281         #
282         # if feature is overridable (it means that allow-override has true value),
283         # then feature-sub will be called with default options as parameters;
284         # return value of feature-sub indicates if to enable specified feature
285         #
286         # if there is no 'sub' key (no feature-sub), then feature cannot be
287         # overridden
288         #
289         # use gitweb_get_feature(<feature>) to retrieve the <feature> value
290         # (an array) or gitweb_check_feature(<feature>) to check if <feature>
291         # is enabled
292
293         # Enable the 'blame' blob view, showing the last commit that modified
294         # each line in the file. This can be very CPU-intensive.
295
296         # To enable system wide have in $GITWEB_CONFIG
297         # $feature{'blame'}{'default'} = [1];
298         # To have project specific config enable override in $GITWEB_CONFIG
299         # $feature{'blame'}{'override'} = 1;
300         # and in project config gitweb.blame = 0|1;
301         'blame' => {
302                 'sub' => sub { feature_bool('blame', @_) },
303                 'override' => 0,
304                 'default' => [0]},
305
306         # Enable the 'snapshot' link, providing a compressed archive of any
307         # tree. This can potentially generate high traffic if you have large
308         # project.
309
310         # Value is a list of formats defined in %known_snapshot_formats that
311         # you wish to offer.
312         # To disable system wide have in $GITWEB_CONFIG
313         # $feature{'snapshot'}{'default'} = [];
314         # To have project specific config enable override in $GITWEB_CONFIG
315         # $feature{'snapshot'}{'override'} = 1;
316         # and in project config, a comma-separated list of formats or "none"
317         # to disable.  Example: gitweb.snapshot = tbz2,zip;
318         'snapshot' => {
319                 'sub' => \&feature_snapshot,
320                 'override' => 0,
321                 'default' => ['tgz']},
322
323         # Enable text search, which will list the commits which match author,
324         # committer or commit text to a given string.  Enabled by default.
325         # Project specific override is not supported.
326         #
327         # Note that this controls all search features, which means that if
328         # it is disabled, then 'grep' and 'pickaxe' search would also be
329         # disabled.
330         'search' => {
331                 'override' => 0,
332                 'default' => [1]},
333
334         # Enable grep search, which will list the files in currently selected
335         # tree containing the given string. Enabled by default. This can be
336         # potentially CPU-intensive, of course.
337         # Note that you need to have 'search' feature enabled too.
338
339         # To enable system wide have in $GITWEB_CONFIG
340         # $feature{'grep'}{'default'} = [1];
341         # To have project specific config enable override in $GITWEB_CONFIG
342         # $feature{'grep'}{'override'} = 1;
343         # and in project config gitweb.grep = 0|1;
344         'grep' => {
345                 'sub' => sub { feature_bool('grep', @_) },
346                 'override' => 0,
347                 'default' => [1]},
348
349         # Enable the pickaxe search, which will list the commits that modified
350         # a given string in a file. This can be practical and quite faster
351         # alternative to 'blame', but still potentially CPU-intensive.
352         # Note that you need to have 'search' feature enabled too.
353
354         # To enable system wide have in $GITWEB_CONFIG
355         # $feature{'pickaxe'}{'default'} = [1];
356         # To have project specific config enable override in $GITWEB_CONFIG
357         # $feature{'pickaxe'}{'override'} = 1;
358         # and in project config gitweb.pickaxe = 0|1;
359         'pickaxe' => {
360                 'sub' => sub { feature_bool('pickaxe', @_) },
361                 'override' => 0,
362                 'default' => [1]},
363
364         # Enable showing size of blobs in a 'tree' view, in a separate
365         # column, similar to what 'ls -l' does.  This cost a bit of IO.
366
367         # To disable system wide have in $GITWEB_CONFIG
368         # $feature{'show-sizes'}{'default'} = [0];
369         # To have project specific config enable override in $GITWEB_CONFIG
370         # $feature{'show-sizes'}{'override'} = 1;
371         # and in project config gitweb.showsizes = 0|1;
372         'show-sizes' => {
373                 'sub' => sub { feature_bool('showsizes', @_) },
374                 'override' => 0,
375                 'default' => [1]},
376
377         # Make gitweb use an alternative format of the URLs which can be
378         # more readable and natural-looking: project name is embedded
379         # directly in the path and the query string contains other
380         # auxiliary information. All gitweb installations recognize
381         # URL in either format; this configures in which formats gitweb
382         # generates links.
383
384         # To enable system wide have in $GITWEB_CONFIG
385         # $feature{'pathinfo'}{'default'} = [1];
386         # Project specific override is not supported.
387
388         # Note that you will need to change the default location of CSS,
389         # favicon, logo and possibly other files to an absolute URL. Also,
390         # if gitweb.cgi serves as your indexfile, you will need to force
391         # $my_uri to contain the script name in your $GITWEB_CONFIG.
392         'pathinfo' => {
393                 'override' => 0,
394                 'default' => [0]},
395
396         # Make gitweb consider projects in project root subdirectories
397         # to be forks of existing projects. Given project $projname.git,
398         # projects matching $projname/*.git will not be shown in the main
399         # projects list, instead a '+' mark will be added to $projname
400         # there and a 'forks' view will be enabled for the project, listing
401         # all the forks. If project list is taken from a file, forks have
402         # to be listed after the main project.
403
404         # To enable system wide have in $GITWEB_CONFIG
405         # $feature{'forks'}{'default'} = [1];
406         # Project specific override is not supported.
407         'forks' => {
408                 'override' => 0,
409                 'default' => [0]},
410
411         # Insert custom links to the action bar of all project pages.
412         # This enables you mainly to link to third-party scripts integrating
413         # into gitweb; e.g. git-browser for graphical history representation
414         # or custom web-based repository administration interface.
415
416         # The 'default' value consists of a list of triplets in the form
417         # (label, link, position) where position is the label after which
418         # to insert the link and link is a format string where %n expands
419         # to the project name, %f to the project path within the filesystem,
420         # %h to the current hash (h gitweb parameter) and %b to the current
421         # hash base (hb gitweb parameter); %% expands to %.
422
423         # To enable system wide have in $GITWEB_CONFIG e.g.
424         # $feature{'actions'}{'default'} = [('graphiclog',
425         #       '/git-browser/by-commit.html?r=%n', 'summary')];
426         # Project specific override is not supported.
427         'actions' => {
428                 'override' => 0,
429                 'default' => []},
430
431         # Allow gitweb scan project content tags of project repository,
432         # and display the popular Web 2.0-ish "tag cloud" near the projects
433         # list.  Note that this is something COMPLETELY different from the
434         # normal Git tags.
435
436         # gitweb by itself can show existing tags, but it does not handle
437         # tagging itself; you need to do it externally, outside gitweb.
438         # The format is described in git_get_project_ctags() subroutine.
439         # You may want to install the HTML::TagCloud Perl module to get
440         # a pretty tag cloud instead of just a list of tags.
441
442         # To enable system wide have in $GITWEB_CONFIG
443         # $feature{'ctags'}{'default'} = [1];
444         # Project specific override is not supported.
445
446         # In the future whether ctags editing is enabled might depend
447         # on the value, but using 1 should always mean no editing of ctags.
448         'ctags' => {
449                 'override' => 0,
450                 'default' => [0]},
451
452         # The maximum number of patches in a patchset generated in patch
453         # view. Set this to 0 or undef to disable patch view, or to a
454         # negative number to remove any limit.
455
456         # To disable system wide have in $GITWEB_CONFIG
457         # $feature{'patches'}{'default'} = [0];
458         # To have project specific config enable override in $GITWEB_CONFIG
459         # $feature{'patches'}{'override'} = 1;
460         # and in project config gitweb.patches = 0|n;
461         # where n is the maximum number of patches allowed in a patchset.
462         'patches' => {
463                 'sub' => \&feature_patches,
464                 'override' => 0,
465                 'default' => [16]},
466
467         # Avatar support. When this feature is enabled, views such as
468         # shortlog or commit will display an avatar associated with
469         # the email of the committer(s) and/or author(s).
470
471         # Currently available providers are gravatar and picon.
472         # If an unknown provider is specified, the feature is disabled.
473
474         # Gravatar depends on Digest::MD5.
475         # Picon currently relies on the indiana.edu database.
476
477         # To enable system wide have in $GITWEB_CONFIG
478         # $feature{'avatar'}{'default'} = ['<provider>'];
479         # where <provider> is either gravatar or picon.
480         # To have project specific config enable override in $GITWEB_CONFIG
481         # $feature{'avatar'}{'override'} = 1;
482         # and in project config gitweb.avatar = <provider>;
483         'avatar' => {
484                 'sub' => \&feature_avatar,
485                 'override' => 0,
486                 'default' => ['']},
487
488         # Enable displaying how much time and how many git commands
489         # it took to generate and display page.  Disabled by default.
490         # Project specific override is not supported.
491         'timed' => {
492                 'override' => 0,
493                 'default' => [0]},
494
495         # Enable turning some links into links to actions which require
496         # JavaScript to run (like 'blame_incremental').  Not enabled by
497         # default.  Project specific override is currently not supported.
498         'javascript-actions' => {
499                 'override' => 0,
500                 'default' => [0]},
501
502         # Enable and configure ability to change common timezone for dates
503         # in gitweb output via JavaScript.  Enabled by default.
504         # Project specific override is not supported.
505         'javascript-timezone' => {
506                 'override' => 0,
507                 'default' => [
508                         'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
509                                      # or undef to turn off this feature
510                         'gitweb_tz', # name of cookie where to store selected timezone
511                         'datetime',  # CSS class used to mark up dates for manipulation
512                 ]},
513
514         # Syntax highlighting support. This is based on Daniel Svensson's
515         # and Sham Chukoury's work in gitweb-xmms2.git.
516         # It requires the 'highlight' program present in $PATH,
517         # and therefore is disabled by default.
518
519         # To enable system wide have in $GITWEB_CONFIG
520         # $feature{'highlight'}{'default'} = [1];
521
522         'highlight' => {
523                 'sub' => sub { feature_bool('highlight', @_) },
524                 'override' => 0,
525                 'default' => [0]},
526
527         # Enable displaying of remote heads in the heads list
528
529         # To enable system wide have in $GITWEB_CONFIG
530         # $feature{'remote_heads'}{'default'} = [1];
531         # To have project specific config enable override in $GITWEB_CONFIG
532         # $feature{'remote_heads'}{'override'} = 1;
533         # and in project config gitweb.remote_heads = 0|1;
534         'remote_heads' => {
535                 'sub' => sub { feature_bool('remote_heads', @_) },
536                 'override' => 0,
537                 'default' => [0]},
538 );
539
# Return the value of feature $name as a list.
#
# Returns nothing for a name that is not in %feature.  The site-wide
# defaults are returned unless the feature allows override and a project
# ($git_dir) is selected; in that case the feature's 'sub' is called with
# the defaults and its result is returned.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $spec     = $feature{$name};
        my $sub      = $spec->{'sub'};
        my $override = $spec->{'override'};
        my @defaults = @{$spec->{'default'}};

        # project specific override is possible only if we have project
        our $git_dir; # global variable, declared later
        return @defaults unless $override && defined $git_dir;

        # override was requested for a feature that has no feature-sub
        unless (defined $sub) {
                warn "feature $name is not overridable";
                return @defaults;
        }

        return $sub->(@defaults);
}
558
# Convenience wrapper returning only the first value of a feature, which
# is enough to tell whether a boolean feature is enabled.  It lets you write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# rather than
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
        my @values = gitweb_get_feature(@_);
        # list slice: yields nothing (not undef) in list context when empty
        return (@values)[0];
}
573
574
# Feature-sub for boolean features that can be overridden per project.
#
# $key is the name of the project config variable, read through
# git_get_project_config() with '--bool'; the remaining arguments are the
# site-wide defaults, of which only the first is used.
#
# Returns (1) or (0) when the project config says 'true' or 'false', and
# the site-wide default otherwise.
sub feature_bool {
        my $key = shift;
        my ($val) = git_get_project_config($key, '--bool');

        # nothing configured for this project: keep the site-wide default
        return ($_[0]) unless defined $val;

        return (1) if $val eq 'true';
        return (0) if $val eq 'false';

        # Any other value used to fall off the end of the if/elsif chain,
        # leaving the return value implicit.  Treat it as "not overridden".
        return ($_[0]);
}
587
# Feature-sub for 'snapshot': the arguments are the default formats.
# A true 'snapshot' project config value replaces them: 'none' means no
# formats at all, anything else is split on commas and/or whitespace.
sub feature_snapshot {
        my @fmts = @_;

        my ($configured) = git_get_project_config('snapshot');

        if ($configured) {
                if ($configured eq 'none') {
                        @fmts = ();
                } else {
                        @fmts = split /\s*[,\s]\s*/, $configured;
                }
        }

        return @fmts;
}
599
# Feature-sub for 'patches': returns whatever the 'patches' project config
# (read with '--int') yields, or the first default when it yields nothing.
sub feature_patches {
        my @configured = (git_get_project_config('patches', '--int'));

        return @configured ? @configured : ($_[0]);
}
609
# Feature-sub for 'avatar': returns the 'avatar' project config value(s)
# if there are any, otherwise the defaults passed in.
sub feature_avatar {
        my @configured = (git_get_project_config('avatar'));

        return @configured if @configured;
        return @_;
}
615
# Tell whether directory $dir has a usable HEAD.
#
# Testing HEAD with -e alone is fragile: in a repository initialized long
# ago HEAD may be a symlink, and after pack-refs and pruning its target may
# no longer exist.  So a symlink pointing into refs/heads/ is accepted too.
sub check_head_link {
        my ($dir) = @_;
        my $head = "$dir/HEAD";

        # regular case: HEAD exists (following symlinks)
        return 1 if -e $head;

        # legacy case: HEAD is a (possibly dangling) symlink to a branch
        return (-l $head && readlink($head) =~ /^refs\/heads\//);
}
625
# Decide whether the repository in $dir may be shown.  All of these must
# hold: it has a valid HEAD, the $export_ok file exists in it (when
# $export_ok is set), and $export_auth_hook accepts it (when one is set).
sub check_export_ok {
        my ($dir) = @_;

        my $has_head_and_marker =
                check_head_link($dir) &&
                (!$export_ok || -e "$dir/$export_ok");

        return ($has_head_and_marker &&
                (!$export_auth_hook || $export_auth_hook->($dir)));
}
632
# process alternate names for backward compatibility
# filter out unsupported (unknown) snapshot formats
#
# Takes a list of snapshot format names and returns those that, after
# alias translation through %known_snapshot_format_aliases, are present in
# %known_snapshot_formats and not marked 'disabled'.
sub filter_snapshot_fmts {
        # translate aliases; undefined input is dropped up front so it is
        # never used as a hash key
        my @fmts = map {
                exists $known_snapshot_format_aliases{$_} ?
                       $known_snapshot_format_aliases{$_} : $_
        } grep { defined } @_;

        # Legacy aliases ('x-gzip', 'gz', '', ...) translate to undef.  Drop
        # those before the lookups: using undef as a hash key triggers an
        # "uninitialized value" warning.
        @fmts = grep {
                defined $_ &&
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}
        } @fmts;

        return @fmts;
}
645
646 # If it is set to a code reference, that code is run once per
647 # request, allowing configuration that changes with each request to be
648 # updated, while the rest of the config file is run only once.
649 #
650 # Otherwise, if it is false then gitweb processes the config file only once;
651 # if it is true then the gitweb config is run for each request.
652 our $per_request_config = 1;
653
# read and parse gitweb config file given by its parameter.
# returns true on success, false on recoverable error (no filename given,
# or the file does not exist), allowing to chain this subroutine, using
# first file that exists.
# dies on errors during parsing config file, as it is unrecoverable.
sub read_config_file {
        my $filename = shift;
        return unless defined $filename;
        return unless -e $filename;

        # "do FILE" looks a relative name up in @INC instead of the current
        # directory, unless it starts with "./" or "../".  The -e test above
        # is relative to the current directory, so anchor the name to make
        # "do" load exactly the file that was tested (on perl >= 5.26, where
        # '.' is no longer in @INC, it would otherwise not be loaded at all).
        require File::Spec;
        my $path = $filename;
        unless (File::Spec->file_name_is_absolute($path) || $path =~ m{^\.\.?/}) {
                $path = "./$path";
        }

        do $path;
        # die if there are errors parsing config file
        die $@ if $@;
        return 1;
}
669
670 our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
# Work out the names of the gitweb config files (environment variables win
# over the built-in values) and read them: the common file always, then the
# first existing one of the per-instance and system-wide files.
sub evaluate_gitweb_config {
        our $GITWEB_CONFIG =
                $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        our $GITWEB_CONFIG_SYSTEM =
                $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
        our $GITWEB_CONFIG_COMMON =
                $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

        # Protect against duplicated file names, so that no config file is
        # read twice: blank out any name equal to the common one.  Only one
        # of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so those two
        # being equal to each other doesn't matter.
        for my $config_name ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                # $config_name aliases the global, so this updates it in place
                $config_name = "" if ($config_name eq $GITWEB_CONFIG_COMMON);
        }

        # Common system-wide settings for convenience.
        # Those settings can be overridden by GITWEB_CONFIG or
        # GITWEB_CONFIG_SYSTEM.
        read_config_file($GITWEB_CONFIG_COMMON);

        # Use first config file that exists.  This means use the per-instance
        # GITWEB_CONFIG if it exists, otherwise use GITWEB_CONFIG_SYSTEM.
        return if read_config_file($GITWEB_CONFIG);
        read_config_file($GITWEB_CONFIG_SYSTEM);
}
691
692 # Get loadavg of system, to compare against $maxload.
693 # Currently it requires '/proc/loadavg' present to get loadavg;
694 # if it is not present it returns 0, which means no load checking.
# Return the first field of /proc/loadavg, or 0 when that file is missing,
# cannot be opened, or yields a false value.
sub get_loadavg {
        my $loadavg_file = '/proc/loadavg';

        # additional checks for load average should go here for things that
        # don't export /proc/loadavg
        return 0 unless -e $loadavg_file;

        open my $fd, '<', $loadavg_file
                or return 0;
        my $first_line = <$fd>;
        close $fd;

        # The first three columns measure CPU and IO utilization of the last
        # one, five, and 10 minute periods.  The fourth column shows the
        # number of currently running processes and the total number of
        # processes in the m/n format.  The last column displays the last
        # process ID used.
        my @columns = split(/\s+/, $first_line);

        return $columns[0] || 0;
}
713
714 # version of the core git binary
715 our $git_version;
# Run "$GIT --version" and store the reported version in $git_version
# ("unknown" if the output does not match); counts as one git command.
sub evaluate_git_version {
        my $version_output = qx("$GIT" --version);
        our $git_version = ($version_output =~ m/git version (.*)$/)
                ? $1
                : "unknown";
        $number_of_git_cmds++;
}
720
# Report a 503 error through die_error() when load checking is enabled
# ($maxload defined) and the current load average is above $maxload.
sub check_loadavg {
        my $overloaded = defined $maxload && get_loadavg() > $maxload;
        die_error(503, "The load average on the server is too high")
                if $overloaded;
}
726
727 # ======================================================================
728 # input validation and dispatch
729
730 # input parameters can be collected from a variety of sources (presently, CGI
731 # and PATH_INFO), so we define an %input_params hash that collects them all
732 # together during validation: this allows subsequent uses (e.g. href()) to be
733 # agnostic of the parameter origin
734
our %input_params = ();

# Keys of %input_params are the long parameter names.  The table below
# maps each long name to its short CGI key; href() uses it to turn
# parameters into their CGI equivalent, and because that is the most
# frequent usage, the mapping is stored as name -> CGI key rather than
# the other way round.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
        project           => 'p',
        action            => 'a',
        file_name         => 'f',
        file_parent       => 'fp',
        hash              => 'h',
        hash_parent       => 'hp',
        hash_base         => 'hb',
        hash_parent_base  => 'hpb',
        page              => 'pg',
        order             => 'o',
        searchtext        => 's',
        searchtype        => 'st',
        snapshot_format   => 'sf',
        extra_options     => 'opt',
        search_use_regexp => 'sr',
        ctag              => 'by_tag',
        diff_style        => 'ds',
        project_filter    => 'pf',
        # this must be last entry (for manipulation from JavaScript)
        javascript        => 'js'
);
# hash view of the same pairs, for lookup by long name
our %cgi_param_mapping = @cgi_param_mapping;
768
# dispatch table of the possible actions (action name => handler);
# also used to validate the action parameter
our %actions = (
        'blame'             => \&git_blame,
        'blame_incremental' => \&git_blame_incremental,
        'blame_data'        => \&git_blame_data,
        'blobdiff'          => \&git_blobdiff,
        'blobdiff_plain'    => \&git_blobdiff_plain,
        'blob'              => \&git_blob,
        'blob_plain'        => \&git_blob_plain,
        'commitdiff'        => \&git_commitdiff,
        'commitdiff_plain'  => \&git_commitdiff_plain,
        'commit'            => \&git_commit,
        'forks'             => \&git_forks,
        'heads'             => \&git_heads,
        'history'           => \&git_history,
        'log'               => \&git_log,
        'patch'             => \&git_patch,
        'patches'           => \&git_patches,
        'remotes'           => \&git_remotes,
        'rss'               => \&git_rss,
        'atom'              => \&git_atom,
        'search'            => \&git_search,
        'search_help'       => \&git_search_help,
        'shortlog'          => \&git_shortlog,
        'summary'           => \&git_summary,
        'tag'               => \&git_tag,
        'tags'              => \&git_tags,
        'tree'              => \&git_tree,
        'snapshot'          => \&git_snapshot,
        'object'            => \&git_object,
        # those below don't need $project
        'opml'              => \&git_opml,
        'project_list'      => \&git_project_list,
        'project_index'     => \&git_project_index,
);
804
# allowed extra_options: each option maps to the list of actions that
# accept it
our %allowed_options = (
        '--no-merges' => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
);
810
# Populate %input_params from the CGI query parameters, decoding every
# value from UTF-8.  Each parameter is stored as a single value, except
# the one whose CGI key is 'opt', which may be repeated and is therefore
# stored as an array reference.  (A list of multi-valued parameters would
# be the general solution, but for the time being there is only this one.)
sub evaluate_query_params {
        our $cgi;

        foreach my $long_name (keys %cgi_param_mapping) {
                my $cgi_key = $cgi_param_mapping{$long_name};

                if ($cgi_key ne 'opt') {
                        # single-valued: fetch in scalar context
                        my $octets = $cgi->param($cgi_key);
                        $input_params{$long_name} = decode_utf8($octets);
                        next;
                }

                # multi-valued: fetch every occurrence
                my @occurrences = $cgi->param($cgi_key);
                $input_params{$long_name} = [ map { decode_utf8($_) } @occurrences ];
        }
}
826
# Read PATH_INFO and fill in %input_params entries that were not already
# given in the query string.  PATH_INFO is expected to look like
#   $project[/$action][/[$parent_ref[:$parent_path]..]$ref[:$path]]
# Nothing is done when the project was already set from the query string
# or when $path_info is empty.
sub evaluate_path_info {
        return if defined $input_params{'project'};
        return if !$path_info;
        $path_info =~ s,^/+,,;
        return if !$path_info;

        # find which part of PATH_INFO is project: strip trailing path
        # components until what remains passes check_head_link()
        my $project = $path_info;
        $project =~ s,/+$,,;
        while ($project && !check_head_link("$projectroot/$project")) {
                $project =~ s,/*[^/]*$,,;
        }
        return unless $project;
        $input_params{'project'} = $project;

        # do not change any parameters if an action is given using the query string
        return if $input_params{'action'};
        $path_info =~ s,^\Q$project\E/*,,;

        # next, check if we have an action
        my $action = $path_info;
        $action =~ s,/.*$,,;
        if (exists $actions{$action}) {
                # quote the action so it is always matched literally
                $path_info =~ s,^\Q$action\E/*,,;
                $input_params{'action'} = $action;
        }

        # list of actions that want hash_base instead of hash, but can have no
        # pathname (f) parameter
        my @wants_base = (
                'tree',
                'history',
        );

        # we want to catch, among others
        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
        my ($parentrefname, $parentpathname, $refname, $pathname) =
                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

        # first, analyze the 'current' part
        if (defined $pathname) {
                # we got "branch:filename" or "branch:dir/"
                # we could use git_get_type(branch:pathname), but:
                # - it needs $git_dir
                # - it does a git() call
                # - the convention of terminating directories with a slash
                #   makes it superfluous
                # - embedding the action in the PATH_INFO would make it even
                #   more superfluous
                $pathname =~ s,^/+,,;
                if (!$pathname || substr($pathname, -1) eq "/") {
                        $input_params{'action'} ||= "tree";
                        $pathname =~ s,/$,,;
                } else {
                        # the default action depends on whether we had parent info
                        # or not
                        if ($parentrefname) {
                                $input_params{'action'} ||= "blobdiff_plain";
                        } else {
                                $input_params{'action'} ||= "blob_plain";
                        }
                }
                $input_params{'hash_base'} ||= $refname;
                $input_params{'file_name'} ||= $pathname;
        } elsif (defined $refname) {
                # we got "branch". In this case we have to choose if we have to
                # set hash or hash_base.
                #
                # Most of the actions without a pathname only want hash to be
                # set, except for the ones specified in @wants_base that want
                # hash_base instead. It should also be noted that hand-crafted
                # links having 'history' as an action and no pathname or hash
                # set will fail, but that happens regardless of PATH_INFO.
                if (defined $parentrefname) {
                        # if there is parent let the default be 'shortlog' action
                        # (for http://git.example.com/repo.git/A..B links); if there
                        # is no parent, dispatch will detect type of object and set
                        # action appropriately if required (if action is not set)
                        $input_params{'action'} ||= "shortlog";
                }
                if ($input_params{'action'} &&
                    grep { $_ eq $input_params{'action'} } @wants_base) {
                        $input_params{'hash_base'} ||= $refname;
                } else {
                        $input_params{'hash'} ||= $refname;
                }
        }

        # next, handle the 'parent' part, if present
        if (defined $parentrefname) {
                # a missing pathspec defaults to the 'current' filename, allowing e.g.
                # someproject/blobdiff/oldrev..newrev:/filename
                if ($parentpathname) {
                        $parentpathname =~ s,^/+,,;
                        $parentpathname =~ s,/$,,;
                        $input_params{'file_parent'} ||= $parentpathname;
                } else {
                        $input_params{'file_parent'} ||= $input_params{'file_name'};
                }
                # we assume that hash_parent_base is wanted if a path was specified,
                # or if the action wants hash_base instead of hash.
                # The action can still be unset here (e.g. PATH_INFO of the form
                # "A.." with no 'current' part), so guard the comparison.
                if (defined $input_params{'file_parent'} ||
                        (defined $input_params{'action'} &&
                         grep { $_ eq $input_params{'action'} } @wants_base)) {
                        $input_params{'hash_parent_base'} ||= $parentrefname;
                } else {
                        $input_params{'hash_parent'} ||= $parentrefname;
                }
        }

        # for the snapshot action, we allow URLs in the form
        # $project/snapshot/$hash.ext
        # where .ext determines the snapshot and gets removed from the
        # passed $refname to provide the $hash.
        #
        # To be able to tell that $refname includes the format extension, we
        # require the following two conditions to be satisfied:
        # - the hash input parameter MUST have been set from the $refname part
        #   of the URL (i.e. they must be equal)
        # - the snapshot format MUST NOT have been defined already (e.g. from
        #   CGI parameter sf)
        # It's also useless to try any matching unless $refname has a dot,
        # so we check for that too
        if (defined $input_params{'action'} &&
                $input_params{'action'} eq 'snapshot' &&
                defined $refname && index($refname, '.') != -1 &&
                defined $input_params{'hash'} &&
                $refname eq $input_params{'hash'} &&
                !defined $input_params{'snapshot_format'}) {
                # We loop over the known snapshot formats, checking for
                # extensions. Allowed extensions are both the defined suffix
                # (which includes the initial dot already) and the snapshot
                # format key itself, with a prepended dot.
                #
                # Iterate with keys() rather than each(): the loop is left
                # early with 'last', and an abandoned each() iterator would
                # make the next each() on this hash resume in the middle.
                foreach my $fmt (keys %known_snapshot_formats) {
                        my $opt = $known_snapshot_formats{$fmt};
                        my $hash = $refname;
                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
                                next;
                        }
                        my $sfx = $1;
                        # a valid suffix was found, so set the snapshot format
                        # and reset the hash parameter
                        $input_params{'snapshot_format'} = $fmt;
                        $input_params{'hash'} = $hash;
                        # we also set the format suffix to the one requested
                        # in the URL: this way a request for e.g. .tgz returns
                        # a .tgz instead of a .tar.gz
                        # NOTE(review): this overwrites the shared
                        # %known_snapshot_formats entry; confirm that is
                        # acceptable when one process serves several requests.
                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
                        last;
                }
        }
}
977
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp, $project_filter);

# Copy the collected %input_params into the package globals above,
# validating each one on the way.  An invalid value ends the request
# through die_error() with a 400, 403 or 404 status.  $search_regexp is
# derived from $searchtext: the text itself when regexp search is
# requested (after checking that it compiles), its quotemeta otherwise.
sub evaluate_and_validate_params {
        our $action = $input_params{'action'};
        if (defined $action) {
                if (!validate_action($action)) {
                        die_error(400, "Invalid action parameter");
                }
        }

        # parameters which are pathnames
        our $project = $input_params{'project'};
        if (defined $project) {
                if (!validate_project($project)) {
                        # clear the global before reporting the error
                        undef $project;
                        die_error(404, "No such project");
                }
        }

        our $project_filter = $input_params{'project_filter'};
        if (defined $project_filter) {
                if (!validate_pathname($project_filter)) {
                        die_error(404, "Invalid project_filter parameter");
                }
        }

        our $file_name = $input_params{'file_name'};
        if (defined $file_name) {
                if (!validate_pathname($file_name)) {
                        die_error(400, "Invalid file parameter");
                }
        }

        our $file_parent = $input_params{'file_parent'};
        if (defined $file_parent) {
                if (!validate_pathname($file_parent)) {
                        die_error(400, "Invalid file parent parameter");
                }
        }

        # parameters which are refnames
        our $hash = $input_params{'hash'};
        if (defined $hash) {
                if (!validate_refname($hash)) {
                        die_error(400, "Invalid hash parameter");
                }
        }

        our $hash_parent = $input_params{'hash_parent'};
        if (defined $hash_parent) {
                if (!validate_refname($hash_parent)) {
                        die_error(400, "Invalid hash parent parameter");
                }
        }

        our $hash_base = $input_params{'hash_base'};
        if (defined $hash_base) {
                if (!validate_refname($hash_base)) {
                        die_error(400, "Invalid hash base parameter");
                }
        }

        # extra_options is normally always an array reference, since it can
        # only be (currently) set from CGI, and $cgi->param() returns the
        # empty array in array context if the param is not set; fall back to
        # an empty list anyway so a missing entry cannot abort the request
        our @extra_options = @{ $input_params{'extra_options'} || [] };
        foreach my $opt (@extra_options) {
                if (not exists $allowed_options{$opt}) {
                        die_error(400, "Invalid option parameter");
                }
                # the option must be allowed for the requested action; compare
                # as plain strings, and treat a missing action as "not allowed"
                unless (defined $action &&
                        grep { $_ eq $action } @{ $allowed_options{$opt} }) {
                        die_error(400, "Invalid option parameter for this action");
                }
        }

        our $hash_parent_base = $input_params{'hash_parent_base'};
        if (defined $hash_parent_base) {
                if (!validate_refname($hash_parent_base)) {
                        die_error(400, "Invalid hash parent base parameter");
                }
        }

        # other parameters
        our $page = $input_params{'page'};
        if (defined $page) {
                if ($page =~ m/[^0-9]/) {
                        die_error(400, "Invalid page parameter");
                }
        }

        our $searchtype = $input_params{'searchtype'};
        if (defined $searchtype) {
                if ($searchtype =~ m/[^a-z]/) {
                        die_error(400, "Invalid searchtype parameter");
                }
        }

        our $search_use_regexp = $input_params{'search_use_regexp'};

        our $searchtext = $input_params{'searchtext'};
        our $search_regexp;
        if (defined $searchtext) {
                if (length($searchtext) < 2) {
                        die_error(403, "At least two characters are required for search parameter");
                }
                if ($search_use_regexp) {
                        $search_regexp = $searchtext;
                        # make sure the user-supplied pattern compiles
                        if (!eval { qr/$search_regexp/; 1; }) {
                                # drop the " at FILE line N" part of the message
                                (my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
                                die_error(400, "Invalid search regexp '$search_regexp'",
                                          esc_html($error));
                        }
                } else {
                        $search_regexp = quotemeta $searchtext;
                }
        }
}
1096
# path to the current git repository
our $git_dir;

# Set $git_dir from $projectroot and $project.  When the request has no
# project, $git_dir is reset to undef so that a process serving several
# requests does not keep the value left over from the previous one.
sub evaluate_git_dir {
        our $git_dir = $project ? "$projectroot/$project" : undef;
}
1102
our (@snapshot_fmts, $git_avatar);

# Evaluate the 'snapshot' and 'avatar' features into @snapshot_fmts and
# $git_avatar.
sub configure_gitweb_features {
        our (@snapshot_fmts, $git_avatar);

        # list of supported snapshot formats
        @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # are satisfied; otherwise $git_avatar is reset to the empty string.
        ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'gravatar') {
                # gravatar needs Digest::MD5
                eval { require Digest::MD5; 1; }
                        or $git_avatar = '';
        } elsif ($git_avatar ne 'picon') {
                # picon has no dependencies; anything else is unknown
                $git_avatar = '';
        }
}
1122
# custom error handler, registered with CGI::Carp below:
# 'die <message>' is Internal Server Error
sub handle_errors_html {
        my ($msg) = @_; # it is already HTML escaped

        # Switch back to the default handler (with a plain-text message)
        # before doing anything else: this disables handle_errors_html and
        # so avoids an infinite loop if the error occurs in die_error itself.
        set_message("Error occured when inside die_error:\n$msg");

        # The subroutine set via CGI::Carp::set_message is called _after_
        # HTTP headers are already written, so die_error must not write
        # them itself; and when called as error handler you cannot jump
        # out of die_error.
        my @handler_opts = (-error_handler => 1, -no_http_header => 1);
        die_error(undef, undef, $msg, @handler_opts);
}
set_message(\&handle_errors_html);
1137
# Pick the action when none was requested, check it, and run its handler
# from %actions.
sub dispatch {
        unless (defined $action) {
                # no explicit action: derive it from the other parameters
                if (defined $hash) {
                        $action = git_get_type($hash)
                                or die_error(404, "Object does not exist");
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name")
                                or die_error(404, "File or directory does not exist");
                } else {
                        $action = defined $project ? 'summary' : 'project_list';
                }
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # every action except these three requires a project
        my $needs_project = $action !~ m/^(?:opml|project_list|project_index)$/;
        die_error(400, "Project needed")
                if $needs_project && !$project;

        $actions{$action}->();
}
1162
# Restart the per-request statistics: the start time (only when timing
# is in use, i.e. $t0 is defined) and the count of git commands run.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        $t0 = [ gettimeofday() ]
                if defined $t0;
        $number_of_git_cmds = 0;
}
1168
our $first_request = 1;

# Serve one request: (re)load configuration as needed, check the load,
# collect and validate the input parameters, then dispatch the action.
sub run_request {
        reset_timer();

        evaluate_uri();

        # the config file and git version are evaluated once per process
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }

        # $per_request_config is either a code reference to run on every
        # request, or a true value asking for the config to be re-read on
        # every request after the first
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }

        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list ||= $projectroot;

        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1199
# by default every request is the last one (plain CGI)
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
# class used to create the request object
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: requests are created through CGI::Fast,
# and $is_last_request limits how many requests one process serves.
sub configure_as_fcgi {
        require CGI::Fast;
        our $CGI = 'CGI::Fast';

        my $request_number = 0;
        # let each child service 100 requests: the check runs after a
        # request has been served, so it must become true on the 100th
        our $is_last_request = sub { ++$request_number >= 100 };
}
# Decide how to run from the script name and the command line:
# a script name ending in ".fcgi", or the --fastcgi option, selects
# FastCGI; --nproc=N additionally sets up FCGI::ProcManager hooks.
sub evaluate_argv {
        our ($pre_listen_hook, $pre_dispatch_hook, $post_dispatch_hook);

        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # handler for --nproc: does nothing when FCGI::ProcManager
        # cannot be loaded
        my $use_proc_manager = sub {
                my ($opt_name, $n_processes) = @_;
                eval { require FCGI::ProcManager; 1; }
                        or return;
                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $n_processes,
                });
                $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $use_proc_manager,
        );
}
1234
# Main loop: create request objects through the class named in $CGI and
# serve them one by one, calling the optional hooks around each request,
# until no request is available or $is_last_request says to stop.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                $is_last_request->()
                        and last REQUEST;
        }

 DONE_GITWEB:
        1;
}
1259
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI) just return to
# the wrapper ...
return if defined caller;
# ... otherwise this is a pure CGI script, serving single request
exit;
1270
1271 ## ======================================================================
1272 ## action links
1273
# Build a gitweb URL from named parameters (the long names listed in
# @cgi_param_mapping) and return it as a string.  'project' defaults to
# the current $project.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                # take every parameter not given explicitly from the
                # current request
                foreach my $name (keys %cgi_param_mapping) {
                        $params{$name} = $input_params{$name}
                                unless exists $params{$name};
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot
                # (the action may be missing, so test for that first)
                my $is_snapshot = defined $params{'action'} &&
                                  $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                # a name containing '..' cannot be told apart
                                                # from the range separator, so it is left
                                                # for the query string
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly; walk the array form of the
        # mapping so that they appear in its declared order
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                # multi-valued parameter: one key=value per element
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1403
1404
1405 ## ======================================================================
1406 ## validation, quoting/unquoting and escaping
1407
# Return the action name when it is a key of %actions, undef otherwise
# (also for an empty or missing argument).
sub validate_action {
        my $input = shift || return undef;
        return exists $actions{$input} ? $input : undef;
}
1413
# Return the project name when it is acceptable, undef otherwise.
# A project is accepted when its name is a valid pathname, it is a
# directory below $projectroot, check_export_ok() approves it and,
# with $strict_export set, project_in_list() knows it.
sub validate_project {
        my $input = shift || return undef;

        return undef unless validate_pathname($input);
        return undef unless -d "$projectroot/$input";
        return undef unless check_export_ok("$projectroot/$input");
        return undef if $strict_export && !project_in_list($input);

        return $input;
}
1425
# Return the pathname when it is acceptable, undef otherwise (also for
# an empty or missing argument).
sub validate_pathname {
        my $input = shift || return undef;

        # Reject '.' and '..' as elements of the path, i.e. at the
        # beginning, at the end, and between slashes.  The empty
        # alternative also rejects doubled slashes.
        my $has_bad_element = $input =~ m!(^|/)(|\.|\.\.)(/|$)!;
        # Reject null characters.
        my $has_null = $input =~ m!\0!;

        return undef if $has_bad_element || $has_null;
        return $input;
}
1441
# Return the ref name when it is acceptable, undef otherwise (also for
# an empty or missing argument).
sub validate_refname {
        my $input = shift || return undef;

        # textual hashes are O.K.; anchor with \z so that a hash followed
        # by a newline is not accepted here
        if ($input =~ m/^[0-9a-fA-F]{40}\z/) {
                return $input;
        }
        # it must be correct pathname
        $input = validate_pathname($input)
                or return undef;
        # restrictions on ref name according to git-check-ref-format
        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
                return undef;
        }
        return $input;
}
1458
# Decode a sequence of octets into Perl's internal form, which is utf-8
# with the utf8 flag set if needed: the octets are taken as utf8 when
# they decode as such, and as $fallback_encoding otherwise.  gitweb
# writes out in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning.
# Returns undef for an undefined argument.
sub to_utf8 {
        my ($str) = @_;
        defined $str
                or return undef;

        # already decoded, or decodes (in place) as utf8
        return $str
                if utf8::is_utf8($str) || utf8::decode($str);

        return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1472
# Quote unsafe characters in a query parameter.  The slash is kept
# unquoted, even though that is not strictly correct, because quoted
# slashes look too horrible in bookmarks.  Spaces become '+'.
# Returns undef for undefined input.
sub esc_param {
        my ($param) = @_;
        return undef unless defined $param;

        (my $quoted = $param) =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $quoted =~ tr/ /+/;

        return $quoted;
}
1482
# Quote unsafe characters in a path_info fragment; the rules are slightly
# different from those for query parameters.
# Returns undef for undefined input.
sub esc_path_info {
        my ($fragment) = @_;
        return undef unless defined $fragment;

        # path_info doesn't treat '+' as space (specially), so both are left
        # alone here, but '?' must be escaped
        (my $quoted = $fragment) =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

        return $quoted;
}
1493
# Quote unsafe characters in a whole URL; characters that have a meaning
# in URL syntax (such as '?', '&' and '=') therefore cannot be quoted.
# Spaces become '+'.  Returns undef for undefined input.
sub esc_url {
        my ($url) = @_;
        return undef unless defined $url;

        (my $quoted = $url) =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
        $quoted =~ tr/ /+/;

        return $quoted;
}
1502
# Quote unsafe characters for use in an HTML attribute value.
sub esc_attr {
        my @args = @_;

        # for XHTML conformance escaping '"' to '&quot;' is not enough,
        # so apply the full HTML escaping
        return esc_html(@args);
}
1509
# Escape a string for inclusion in HTML.
# The string is converted with to_utf8() and HTML-escaped; with the
# -nbsp option every space becomes '&nbsp;'.  Control characters other
# than tab are replaced by their quot_cec() representation.
# Returns undef for undefined input.
sub esc_html {
        my ($text, %opts) = @_;
        return undef unless defined $text;

        my $html = to_utf8($text);
        $html = $cgi->escapeHTML($html);
        $html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        # tabs are left alone, every other control character is made visible
        $html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;

        return $html;
}
1525
# Quote control characters and escape a filename for inclusion in HTML.
# Works like esc_html(), except that every control character, tab
# included, is replaced by its quot_cec() representation.
# Returns undef for undefined input.
sub esc_path {
        my ($path, %opts) = @_;
        return undef unless defined $path;

        my $html = to_utf8($path);
        $html = $cgi->escapeHTML($html);
        $html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $html =~ s|([[:cntrl:]])|quot_cec($1)|eg;

        return $html;
}
1541
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0).
# The string is converted with to_utf8(); tab, line feed and carriage
# return are kept, every other control character is replaced by its
# quot_cec() representation.  No HTML escaping is done here.
# Returns undef for undefined input.
sub sanitize {
        my $str = shift;

        return undef unless defined $str;

        $str = to_utf8($str);
        # index() is used instead of a nested regexp match on purpose: a
        # successful inner match without capture groups resets $1, so the
        # characters meant to be kept would be replaced by undef (deleted).
        $str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
        return $str;
}
1552
# Make control characters "printable", using character escape codes (CEC).
#
# $cntrl is the character to represent.  Characters with a conventional
# escape sequence are shown as such (e.g. '\n'); any other character is
# shown as a backslash followed by its code as two hexadecimal digits.
# With the -nohtml option the bare escape text is returned, otherwise it
# is wrapped in <span class="cntrl">.
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # zero-pad the hex code: '%2x' pads with a space, which turned
        # e.g. character 0x01 into '\ 1'
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1577
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR).
#
# Returns a decimal character reference to the control picture for
# $cntrl: U+2400 + code for ordinary control characters, and U+2421
# (SYMBOL FOR DELETE) for DEL, which does not follow that offset rule.
# With the -nohtml option the bare reference is returned, otherwise it
# is wrapped in <span class="cntrl">.
sub quot_upr {
        my $cntrl = shift;
        my %opts = @_;

        my $code = ord($cntrl);
        # DEL (0x7f) is a control character too, but 0x2400 + 0x7f is not
        # a control picture; its symbol lives at U+2421
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1591
# git may return quoted and escaped filenames; undo that quoting.
# Only a string enclosed in double quotes is changed: the quotes are
# dropped and every backslash sequence inside is translated by unq().
# Any other string is returned as is.
sub unquote {
        my ($name) = @_;

        # translate the text that followed a backslash into the character
        # it stands for
        sub unq {
                my ($esc) = @_;
                my %char_for = ( # character escape codes, aka escape sequences
                        't' => "\t",   # tab            (HT, TAB)
                        'n' => "\n",   # newline        (NL)
                        'r' => "\r",   # return         (CR)
                        'f' => "\f",   # form feed      (FF)
                        'b' => "\b",   # backspace      (BS)
                        'a' => "\a",   # alarm (bell)   (BEL)
                        'e' => "\e",   # escape         (ESC)
                        'v' => "\013", # vertical tab   (VT)
                );

                # octal char sequence
                return chr(oct($esc)) if $esc =~ m/^[0-7]{1,3}$/;

                # C escape sequence, aka character escape code;
                # anything else is a quoted ordinary character
                return exists $char_for{$esc} ? $char_for{$esc} : $esc;
        }

        # nothing to do unless the whole name is wrapped in double quotes
        return $name unless $name =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}
1627
# escape tabs (convert tabs to spaces)
# Each tab is replaced by as many spaces as are needed to reach the
# next multiple of 8 columns.
sub untabify {
        my ($line) = @_;

        my $tab_at = index($line, "\t");
        while ($tab_at != -1) {
                # 1 to 8 spaces, depending on the column of the tab
                substr($line, $tab_at, 1, ' ' x (8 - ($tab_at % 8)));
                $tab_at = index($line, "\t", $tab_at);
        }

        return $line;
}
1641
# Tell whether $project appears in the list returned by
# git_get_projects_list(): returns the number of entries whose 'path'
# equals $project, or 0 when the list is empty.
sub project_in_list {
        my ($wanted) = @_;

        my @projects = git_get_projects_list();
        return 0 unless @projects;

        my $hits = grep { $_->{'path'} eq $wanted } @projects;
        return $hits;
}
1647
1648 ## ----------------------------------------------------------------------
1649 ## HTML aware string manipulation
1650
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# $add_len defaults to 10.  $where ('left' | 'center' | 'right',
# default 'right') selects which part of the string is replaced by
# the ellipsis.
sub chop_str {
        my ($str, $len, $add_len, $where) = @_;
        $add_len ||= 10;
        $where   ||= 'right';

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # return early if chopping wouldn't make string shorter:
        # the filler is 5 characters long for 'center', 4 otherwise
        my $chop_center = ($where eq 'center');
        my $filler_len  = $chop_center ? 5 : 4;
        return $str if ($len + $filler_len >= length($str));

        # when chopping in the middle, distribute $len into left and right part
        $len = int($len/2) if $chop_center;

        # regexps: ending and beginning with word part up to $add_len;
        # a word is not cut if it fits within $add_len characters
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                $str =~ m/^(.*?)($begre)$/;
                my ($lead, $body) = ($1, $2);
                # replace the lead only if that is shorter than keeping it
                $lead = " ..." if length($lead) > 4;
                return "$lead$body";
        }

        if ($chop_center) {
                $str =~ m/^($endre)(.*)$/;
                my ($left, $rest) = ($1, $2);
                $rest =~ m/^(.*?)($begre)$/;
                my ($mid, $right) = ($1, $2);
                $mid = " ... " if length($mid) > 5;
                return "$left$mid$right";
        }

        # 'right': keep the beginning of the string
        $str =~ m/^($endre)(.*)$/;
        my ($body, $tail) = ($1, $2);
        $tail = "... " if length($tail) > 4;
        return "$body$tail";
}
1710
# Takes the same arguments as chop_str, and returns the chopped string
# HTML-escaped.  If the string did get chopped, the result is wrapped in
# a <span> whose title attribute holds the full string (with control
# characters replaced by '?').
sub chop_and_escape_str {
        my ($str) = @_;

        my $chopped = chop_str(@_);
        my $full    = to_utf8($str);

        # nothing was cut off: no need for a title
        return esc_html($chopped) if $chopped eq $full;

        (my $title = $full) =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$title}, esc_html($chopped));
}
1726
# Highlight selected fragments of string, using given CSS class,
# and escape HTML.  It is assumed that fragments do not overlap.
# Regions are passed as list of pairs (array references), each pair
# holding the start offset and the end offset (exclusive) of a fragment.
# Regions that are empty or inverted (end <= start) are ignored.
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
        my ($str, $css_class, @sel) = @_;
        return esc_html($str) unless @sel;

        my $out = '';
        my $pos = 0;

        for my $s (@sel) {
                my ($begin, $end) = @$s;

                # Don't create empty <span> elements; for an inverted region
                # the negative length would also make substr() return the
                # wrong text and move $pos backwards.
                next if $end <= $begin;

                # text between the previous region and this one
                $out .= esc_html(substr($str, $pos, $begin - $pos))
                        if ($begin - $pos > 0);
                $out .= $cgi->span({-class => $css_class},
                                   esc_html(substr($str, $begin, $end - $begin)));

                $pos = $end;
        }
        # text after the last region
        $out .= esc_html(substr($str, $pos))
                if ($pos < length($str));

        return $out;
}
1753
# Return positions of beginning and end of each match of $regexp in
# $str, as a list of [ start, end ] pairs (array references).
# Returns nothing if either argument is undefined.
sub matchpos_list {
        my ($str, $regexp) = @_;
        return unless defined $str && defined $regexp;

        my @spans;
        # @- and @+ hold the offsets of the start and end of the last match
        push @spans, [ $-[0], $+[0] ] while $str =~ /$regexp/g;

        return @spans;
}
1765
# Highlight match (if any), and escape HTML.
# Every match of $regexp in $str is marked with the 'match' CSS class;
# without a regexp, or without any match, the string is just escaped.
sub esc_html_match_hl {
        my ($str, $regexp) = @_;

        my @matches = defined $regexp ? matchpos_list($str, $regexp) : ();

        return @matches
                ? esc_html_hl_regions($str, 'match', @matches)
                : esc_html($str);
}
1776
1777
# Highlight match (if any) of shortened string, and escape HTML.
# Matches are looked up in the full string $str, while the result shows
# $chopped; a match reaching into the chopped-off part is marked up to
# and including the trailing ellipsis.  Without $chopped this is the
# same as esc_html_match_hl($str, $regexp).
sub esc_html_match_hl_chopped {
        my ($str, $chopped, $regexp) = @_;
        return esc_html_match_hl($str, $regexp) unless defined $chopped;

        my @matches = matchpos_list($str, $regexp);
        return esc_html($chopped) unless @matches;

        # split the chopped string into the kept text and the ellipsis
        my $tail = "... "; # see chop_str
        $tail = '' unless $chopped =~ s/\Q$tail\E$//;

        my $chop_len   = length($chopped);
        my $tail_len   = length($tail);
        my $marked_end = $chop_len + $tail_len;

        # filter matches so that we mark chopped string
        my @filtered;
        for my $m (@matches) {
                my ($begin, $end) = @$m;

                if ($begin > $chop_len) {
                        # match lies in the chopped-off part: mark the ellipsis
                        push @filtered, [ $chop_len, $marked_end ] if ($tail_len > 0);
                        last;
                }
                if ($end > $chop_len) {
                        # match is cut by the chop: extend it over the ellipsis
                        push @filtered, [ $begin, $marked_end ];
                        last;
                }
                push @filtered, $m;
        }

        return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
}
1808
1809 ## ----------------------------------------------------------------------
1810 ## functions returning short strings
1811
# CSS class for given age value (in seconds):
# "noage" for an undefined age, "age0" below 2 hours,
# "age1" below 2 days, and "age2" otherwise.
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1826
# Convert age in seconds to "nn units ago" string.
# The largest unit of which the age spans more than two is used,
# with the count rounded down; ages of 2 seconds or less give
# " right now" (with a leading space).
sub age_string {
        my ($age) = @_;

        my $minutes = $age/60;
        my $hours   = $minutes/60;
        my $days    = $hours/24;

        return int($days/365)      . " years ago"  if $age > 60*60*24*365*2;
        return int($days/(365/12)) . " months ago" if $age > 60*60*24*(365/12)*2;
        return int($days/7)        . " weeks ago"  if $age > 60*60*24*7*2;
        return int($days)          . " days ago"   if $age > 60*60*24*2;
        return int($hours)         . " hours ago"  if $age > 60*60*2;
        return int($minutes)       . " min ago"    if $age > 60*2;
        return int($age)           . " sec ago"    if $age > 2;

        return " right now";
}
1858
# Additional file type bit patterns, given in octal like file modes.
use constant S_IFINVALID => 0030000;
# file type of a submodule entry, see S_ISGITLINK
use constant S_IFGITLINK => 0160000;
1863
# Tell whether the (numeric) file mode denotes a
# submodule/subproject, a commit object reference.
sub S_ISGITLINK {
        my ($mode) = @_;

        # compare only the file type bits of the mode
        my $type_bits = $mode & S_IFMT();
        return ($type_bits == S_IFGITLINK);
}
1870
# Convert file mode in octal to symbolic file mode string
# (in the style of "ls -l" output).
sub mode_str {
        my ($octal) = @_;
        my $mode = oct $octal;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # regular file: git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1892
# Convert file mode in octal to file type string.
# Input that is not an octal number is returned unchanged.
sub file_type {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;
        my $bits = oct $mode;

        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "file"      if S_ISREG($bits);
        return "unknown";
}
1915
# Convert file mode in octal to file type description string.
# Like file_type(), but a regular file with the executable bit set
# is described as "executable".  Input that is not an octal number
# is returned unchanged.
sub file_type_long {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;
        my $bits = oct $mode;

        return "submodule" if S_ISGITLINK($bits);
        return "directory" if S_ISDIR($bits & S_IFMT);
        return "symlink"   if S_ISLNK($bits);
        return "unknown"   unless S_ISREG($bits);

        return ($bits & S_IXUSR) ? "executable" : "file";
}
1942
1943
1944 ## ----------------------------------------------------------------------
1945 ## functions returning short HTML fragments, or transforming HTML fragments
1946 ## which don't belong to other sections
1947
# Format line of commit message: escape it for HTML (spaces become
# '&nbsp;') and turn every word of 8 to 40 hexadecimal digits into
# a link to the "object" view of that id.
sub format_log_line_html {
        my ($line) = @_;

        my $html = esc_html($line, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                my $id = $1;
                $cgi->a({-href => href(action=>"object", hash=>$id),
                                        -class => "text"}, $id);
        }eg;

        return $html;
}
1960
# format marker of refs pointing to given object
#
# $refs is a hash reference mapping object ids to array references of
# ref names; $id is the object to format markers for.  Returns an HTML
# fragment (' <span class="refs">...</span>'), or the empty string when
# no ref points to $id.

# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $ref (@{$refs->{$id}}) {
                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name);
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        # the link body is emitted verbatim, so the ref name
                        # (which may contain '<', '>' or '&') has to be escaped
                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, esc_html($name));

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
2020
# Format title line as a link to $href, followed by $extra (if any).
# When $short is shorter than $long, the link shows $short and carries
# $long (control characters replaced by '?') as its title; otherwise
# the link shows $long.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my $is_shortened = (length($short) < length($long));

        unless ($is_shortened) {
                return $cgi->a({-href => $href, -class => "list subject"},
                       esc_html($long)) . $extra;
        }

        (my $title = $long) =~ s/[[:cntrl:]]/?/g;
        return $cgi->a({-href => $href, -class => "list subject",
                        -title => to_utf8($title)},
               esc_html($short)) . $extra;
}
2036
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is keyed by the lowercased email and is shared by all avatar
# engines (currently gravatar and picon), which are free to use it as
# preferred. Since only one avatar engine is used for any given page,
# there's no risk for cache conflicts.
our %avatar_cache = ();
2044
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The complete url is kept in %avatar_cache under the lowercased email.
sub picon_url {
        my ($address) = @_;
        my $email = lc $address;

        return $avatar_cache{$email} if $avatar_cache{$email};

        my ($user, $domain) = split('@', $email);
        my $url = "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                  "$domain/$user/" .
                  "users+domains+unknown/up/single";

        $avatar_cache{$email} = $url;
        return $url;
}
2058
# Compute the gravatar url for a given email and size, if it's not in the
# cache already.  Only the part of the URL before the size is cached, since
# that's the one computationally more expensive. This also allows reuse of
# the cache for different sizes (for this particular engine).
sub gravatar_url {
        my ($address, $size) = @_;
        my $email = lc $address;

        unless ($avatar_cache{$email}) {
                my $digest = Digest::MD5::md5_hex($email);
                $avatar_cache{$email} = "http://www.gravatar.com/avatar/" . $digest . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
2071
# Return the <img> element of the avatar for the given $email, or the
# empty string if the avatar feature provides no url.
# Options: -size selects an entry of %avatar_size ('default' if missing
# or unknown); -pad_before / -pad_after add '&nbsp;' before / after the
# image.
sub git_get_avatar {
        my ($email, %opts) = @_;
        my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
        my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

        # Other providers can be added by extending the chain, defining $url
        # as needed. If no variant puts something in $url, we assume avatars
        # are completely disabled/unavailable.
        my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
                : $git_avatar eq 'picon'    ? picon_url($email)
                :                             "";
        return "" unless $url;

        return join('',
                $pre_white,
                qq{<img width="$size" class="avatar" src="},
                esc_url($url),
                qq{" alt="" />},
                $post_white);
}
2100
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype ('author' or 'committer') selects the kind of search and
# the wording of the link title.  When the 'search' feature is off,
# $displaytext is returned as is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        my $have_search = gitweb_check_feature('search');
        return $displaytext unless $have_search;

        my %verb_for = (
                'author'    => "authored",
                'committer' => "committed",
        );
        my $performed = exists $verb_for{$searchtype} ? $verb_for{$searchtype} : "";

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                        searchtext=>$author,
                        searchtype=>$searchtype), class=>"list",
                        title=>"Search for commits $performed by $author"},
                        $displaytext);
}
2123
# Format the author name of the given commit $co inside the given $tag
# (with class "author").  The author name is chopped and escaped
# according to the remaining, optional parameters (see chop_str); it is
# preceded by the avatar and wrapped by format_search_author().
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $author = chop_and_escape_str($co->{'author_name'}, @chop_args);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $link   = format_search_author($co->{'author_name'}, "author",
                                          $avatar . $author);

        return "<$tag class=\"author\">" . $link . "</$tag>";
}
2137
# Format git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names of the raw line are dropped and replaced by the escaped
# names from $from / $to, linked when the respective 'href' is set.
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # escaped path of one side with the given prefix, as a link when
        # that side has an href (an added or deleted file has none)
        my $path_html = sub {
                my ($side, $prefix) = @_;
                my $text = $prefix . esc_path($side->{'file'});
                return $side->{'href'}
                        ? $cgi->a({-href => $side->{'href'}, -class => "path"}, $text)
                        : $text;
        };

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $path_html->($to, '');
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $path_html->($from, 'a/');
                $line .= ' ';
                $line .= $path_html->($to, 'b/');
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2173
# Format extended diff header line, before patch itself.
# Paths of "copy/rename from/to" lines, a trailing 6-digit mode and the
# object ids of "index" lines are decorated, using the links found in
# $from / $to and the ids in $diffinfo.  Returns the line followed by
# "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                       esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                $line = 'index ';
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff; the dots are escaped so
                # that only a literal '..' separator is accepted, as in the
                # substitution below
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                $line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2239
# Render the from-file ("---") and to-file ("+++") lines of a patch header.
#
#   $from_line, $to_line - raw '---' / '+++' lines taken from the diff
#   $diffinfo            - parsed diff info; a true 'nparents' entry selects
#                          the combined (merge) diff layout
#   $from, $to           - hashes with 'file' and 'href' entries; for a
#                          combined diff the $from entries are indexed per parent
#   @parents             - parent ids, used for the per-parent blobdiff links
#
# Returns the HTML: one <div class="diff from_file"> per from-file line
# followed by a single <div class="diff to_file">.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my @divs;

	#assert($from_line =~ m/^---/) if DEBUG;
	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit): one from-file line per parent
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $from_html = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				# the parent number links to the blobdiff against that parent
				my $diff_link =
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$i],
					                     hash_parent_base=>$parents[$i],
					                     file_parent=>$from->{'file'}[$i],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . ($i+1)},
					        $i+1);
				# the file name links to the file as found in that parent
				my $file_link =
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
					        esc_path($from->{'file'}[$i]));
				$from_html = '--- ' . $diff_link . '/' . $file_link;
			}
			push @divs, qq!<div class="diff from_file">$from_html</div>\n!;
		}

	} else {
		# ordinary (single parent) diff;
		# "--- /dev/null" is passed through without extra formatting
		my $from_html = $from_line;
		if ($from_html =~ m!^--- "?a/!) {
			if ($from->{'href'}) {
				$from_html = '--- a/' .
					$cgi->a({-href=>$from->{'href'}, -class=>"path"},
					        esc_path($from->{'file'}));
			} else {
				$from_html = '--- a/' .
					esc_path($from->{'file'});
			}
		}
		push @divs, qq!<div class="diff from_file">$from_html</div>\n!;
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	# "+++ /dev/null" is passed through without extra formatting
	my $to_html = $to_line;
	if ($to_html =~ m!^\+\+\+ "?b/!) {
		if ($to->{'href'}) {
			$to_html = '+++ b/' .
				$cgi->a({-href=>$to->{'href'}, -class=>"path"},
				        esc_path($to->{'file'}));
		} else {
			$to_html = '+++ b/' .
				esc_path($to->{'file'});
		}
	}
	push @divs, qq!<div class="diff to_file">$to_html</div>\n!;

	return join('', @divs);
}
2305
# Build the short note shown for a file whose combined diff was simplified
# away: a "diff --cc <file>" header followed by a "Simple merge" line.
# The file name links to the blob unless is_deleted() reports the file gone.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $file_html;
	if (is_deleted($diffinfo)) {
		# nothing to link to
		$file_html = esc_path($diffinfo->{'to_file'});
	} else {
		$file_html = $cgi->a({-href => href(action=>"blob",
		                                    hash_base=>$hash,
		                                    hash=>$diffinfo->{'to_id'},
		                                    file_name=>$diffinfo->{'to_file'}),
		                      -class => "path"},
		                     esc_path($diffinfo->{'to_file'}));
	}

	return join('',
		"<div class=\"diff header\">",
		"diff --cc ",
		$file_html,
		"</div>\n", # class="diff header"
		"<div class=\"diff nodifferences\">",
		"Simple merge",
		"</div>\n", # class="diff nodifferences"
	);
}
2330
# Classify a single patch line and return its CSS class name:
# "chunk_header", "incomplete", "ctx", "add", "rem", or "" if nothing matches.
#
# For an ordinary diff one leading sign column is examined.  When both
# $from and $to are given and $from->{'href'} is an array reference
# (combined diff), the number of sign columns equals the array length.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	my $is_combined = ($from && $to && ref($from->{'href'}) eq "ARRAY");
	my $num_sign = $is_combined ? scalar @{$from->{'href'}} : 1;

	# Tried in order; the first matching pattern wins.  The context rule
	# has to precede add/rem, otherwise those would need a more complicated
	# regexp, for example qr/(?= {0,$m}\+)[+ ]{$num_sign}/ with
	# $m = $num_sign - 1.
	my @rules = (
		[ qr/^\@\@{$num_sign} /, "chunk_header" ],
		[ qr/^\\/,               "incomplete"   ],
		[ qr/^ {$num_sign}/,     "ctx"          ],
		[ qr/^[+ ]{$num_sign}/,  "add"          ],
		[ qr/^[- ]{$num_sign}/,  "rem"          ],
	);
	foreach my $rule (@rules) {
		my ($regexp, $class) = @$rule;
		return $class if ($line =~ $regexp);
	}

	# fallback
	return "";
}
2359
# Turn a unified diff chunk header ("@@ -a,b +c,d @@ section") into HTML.
# Assumes that $from and $to are defined and correctly filled, and that
# $line really is a unified diff chunk header.  Where $from->{'href'} or
# $to->{'href'} is set, the matching range becomes a link to the "#l<start>"
# anchor of that href.
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# only the range texts and their starting lines are needed;
	# the two line counts captured by the regexp are not used
	my ($old_range, $old_start, undef, $new_range, $new_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	$old_range = $cgi->a({-href=>"$from->{'href'}#l$old_start",
	                      -class=>"list"}, $old_range)
		if ($from->{'href'});
	$new_range = $cgi->a({-href=>"$to->{'href'}#l$new_start",
	                      -class=>"list"}, $new_range)
		if ($to->{'href'});

	my $chunk_info = "<span class=\"chunk_info\">@@ $old_range $new_range @@</span>";
	my $section_html = "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
	return $chunk_info . $section_html;
}
2383
# Turn a combined diff chunk header ("@@@ -a,b -c,d +e,f @@@ section")
# into HTML.  Assumes that $from and $to are defined and correctly filled,
# and that $line really is a combined diff chunk header.  The last range
# belongs to the result file, the preceding ones to the parents, in order;
# each range is linked to "#l<start>" of the corresponding href when set.
sub format_cc_diff_chunk_header {
	my ($line, $from, $to) = @_;

	my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

	# every range looks like "<sign><start>[,<count>]"; only the start is
	# needed, and it falls back to 0 when nothing follows the sign
	my @range_text  = split(' ', $ranges);
	my @range_start =
		map { ((split(',', substr($_, 1)), 0))[0] } @range_text;

	# the final range describes the result ("to") side
	my $to_text  = pop @range_text;
	my $to_start = pop @range_start;

	my $html = "<span class=\"chunk_info\">$prefix ";
	foreach my $i (0 .. $#range_text) {
		my $piece = $range_text[$i];
		if ($from->{'href'}[$i]) {
			$piece = $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
			                  -class=>"list"}, $range_text[$i]);
		}
		$html .= $piece . " ";
	}

	my $to_piece = $to_text;
	if ($to->{'href'}) {
		$to_piece = $cgi->a({-href=>"$to->{'href'}#l$to_start",
		                     -class=>"list"}, $to_text);
	}
	$html .= $to_piece;

	$html .= " $prefix</span>" .
	         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
	return $html;
}
2422
# Process one line of patch body (not to be used for diff headers).
# Returns the pair (CSS class, HTML-formatted line); the HTML is not yet
# wrapped in any element.  Chunk headers get dedicated formatting when
# both $from and $to are provided, everything else is HTML-escaped.
sub process_diff_line {
	my ($line, $from, $to) = @_;

	# classification looks at the raw line, before any cleanup
	my $diff_class = diff_line_class($line, $from, $to);

	chomp $line;
	$line = untabify($line);

	if ($from && $to) {
		if ($line =~ m/^\@{2} /) {
			my $header = format_unidiff_chunk_header($line, $from, $to);
			return $diff_class, $header;
		}
		if ($line =~ m/^\@{3}/) {
			my $header = format_cc_diff_chunk_header($line, $from, $to);
			return $diff_class, $header;
		}
	}

	return $diff_class, esc_html($line, -nbsp=>1);
}
2445
# Build the snapshot link(s) for the tree/commit given by $hash.
# Depending on how many formats are listed in @snapshot_fmts this returns
#   - undef when there are none,
#   - a single "_snapshot_" link whose tooltip names the format, or
#   - "snapshot (_tar.gz_ _zip_)": one link per format, labelled with the
#     format's display name.
sub format_snapshot_links {
	my ($hash) = @_;
	my $num_fmts = @snapshot_fmts;

	# $num_fmts == 0
	return undef unless $num_fmts;

	if ($num_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		my $fmt = $snapshot_fmts[0];
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
			}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	my @links;
	foreach my $fmt (@snapshot_fmts) {
		push @links,
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				)
			}, $known_snapshot_formats{$fmt}{'display'});
	}
	return "snapshot (" . join(' ', @links) . ")";
}
2480
2481 ## ......................................................................
2482 ## functions returning values to be passed, perhaps after some
2483 ## transformation, to other functions; e.g. returning arguments to href()
2484
# Returns a hash of parameters to be passed to href() to generate the
# gitweb URL of a feed; the -title key holds a description of the link.
# $format (default 'Atom') is lowercased to give the action.
# Returns nothing when no feed applies to the current view.
sub get_feed_info {
	my $format = shift || 'Atom';

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branch refs use the 'refs/heads/' prefix (fullname) to differentiate
	# them from tag links; $hash_base is consulted before $hash
	my $branch;
	foreach my $ref ($hash_base, $hash) {
		if (defined $ref && $ref =~ m!^refs/heads/(.*)$!) {
			$branch = $1;
			last;
		}
	}

	# find log type for feed description (title)
	my $title;
	if (defined $file_name) {
		$title  = "history of $file_name";
		$title .= "/" if ($action eq 'tree');
		$title .= " on '$branch'" if (defined $branch);
	} elsif (defined $branch) {
		$title = "log of $branch";
	} else {
		$title = 'log';
	}

	my %res = (
		action      => lc($format),
		-title      => $title,
		'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
		'file_name' => $file_name,
	);
	return %res;
}
2520
2521 ## ----------------------------------------------------------------------
2522 ## git utility subroutines, invoking git commands
2523
# Returns, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Each call also bumps the
# $number_of_git_cmds counter.
sub git_cmd {
	++$number_of_git_cmds;
	return ($GIT, "--git-dir=$git_dir");
}
2529
# Quote the given arguments for passing them to the shell:
#   quote_command("command", "arg 1", "arg with ' and ! characters")
#   => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Every argument is wrapped in single quotes; embedded ' and ! characters
# are emitted as '\'' and '\!'.  The caller's arguments are left untouched.
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $arg (@_) {
		# work on a copy so the caller's value is not modified
		(my $word = $arg) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$word'";
	}
	return join(' ', @quoted);
}
2538
# Get the hash that HEAD of the given project resolves to
# (resolved through git_get_full_hash).
sub git_get_head_hash {
	my ($project) = @_;
	return git_get_full_hash($project, 'HEAD');
}
2543
# Resolve a revision to its hash: forwards all arguments unchanged to
# git_get_hash, i.e. without any extra rev-parse options.
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2547
# Resolve a revision to an abbreviated hash: forwards all arguments to
# git_get_hash with '--short=7' appended as a rev-parse option.
sub git_get_short_hash {
	my @args = (@_, '--short=7');
	return git_get_hash(@args);
}
2551
# Run "git rev-parse --verify -q [@options] $hash" in the repository of
# $project and return the first output line (chomped), or undef if the
# command could not be started or printed nothing.
#
# $git_dir is pointed at "$projectroot/$project" for the duration of the
# call; its previous value is put back afterwards only if it was defined.
sub git_get_hash {
	my ($project, $hash, @options) = @_;

	my $saved_git_dir = $git_dir;
	$git_dir = "$projectroot/$project";

	my $result;
	my @command = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
	if (open my $fd, '-|', @command) {
		$result = <$fd>;
		chomp $result if defined $result;
		close $fd;
	}

	$git_dir = $saved_git_dir if (defined $saved_git_dir);
	return $result;
}
2568
# Get the type of the given object, as printed by "git cat-file -t".
# Returns nothing if the command cannot be started or if closing the
# pipe reports a failure.
sub git_get_type {
	my ($hash) = @_;

	my $fd;
	open($fd, "-|", git_cmd(), "cat-file", '-t', $hash)
		or return;
	my $type = readline($fd);
	return unless close($fd);

	chomp $type;
	return $type;
}
2579
# repository configuration cache:
#   $config_file - path of the config file the cached values belong to
#                  ('' while nothing has been loaded)
#   %config      - configuration variables parsed from that file
our ($config_file, %config);
$config_file = '';
2583
# Add $value under $key in the hash referenced by $hash.
# A key seen once holds the plain value (not [ <value> ]); when the same
# key is set again its values are collected in an anonymous array.
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (ref $hash->{$key}) {
		# already a list of values: append
		push @{$hash->{$key}}, $value;
	} elsif (exists $hash->{$key}) {
		# second value for this key: switch to list form
		$hash->{$key} = [ $hash->{$key}, $value ];
	} else {
		# first value: store it directly
		$hash->{$key} = $value;
	}
}
2597
# Return a hash of the git project configuration, as listed by
# "git config -z -l" for the current $git_dir.
#
# $section_regexp (optional) limits the result to keys of matching
# sections, e.g. 'gitweb'; it is used as a regexp fragment.
#
# Keys that occur more than once have their values collected in an array
# reference (see hash_set_multi); a key given without a value maps to
# undef.  Returns nothing if the git command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# entries are NUL-terminated in -z output
	local $/ = "\0";

	# Compile the section filter for this call.  It must not use the /o
	# flag: in a persistent interpreter (mod_perl, FastCGI) that would
	# keep the pattern of the very first call forever.
	my $section_re = defined $section_regexp
	               ? qr/^(?:$section_regexp)\./
	               : undef;

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# key and value are separated by the first newline
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $section_re || $key =~ $section_re);
	}
	close $fh;

	return %config;
}
2620
# Convert a config value to a boolean (true or false Perl value).
# True are: no value at all (undef), a non-zero number, and the literals
# 'true', 'yes' and 'on' in any letter case -- the same literals git
# itself accepts.  Everything else is treated as false (never as error).
# Leading and trailing whitespace is ignored.
sub config_to_bool {
	my $val = shift;

	return 1 if !defined $val;             # section.key

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	# compare numerically, so that e.g. "00" counts as zero
	return (($val =~ /^\d+$/ && $val != 0) ||  # section.key = 1
	        ($val =~ /^(?:true|yes|on)$/i));    # section.key = true
}
2636
# Convert a config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (any letter case) will
# cause the value to be multiplied by 1024, 1048576, or 1073741824.
# A value without such a suffix is returned as is, apart from having its
# surrounding whitespace removed.
sub config_to_int {
	my $val = shift;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	my %multiplier_for = (
		k =>       1024,
		m =>    1048576,
		g => 1073741824,
	);
	if ($val =~ /^([0-9]*)([kmg])$/i) {
		my ($num, $unit) = ($1, lc($2));
		return $num * $multiplier_for{$unit};
	}
	return $val;
}
2656
# Convert a config value to an array reference, if needed:
# a reference is returned unchanged, a plain defined value is wrapped in
# a one-element array, and undef yields an empty array.
sub config_to_multi {
	my $val = shift;

	return $val if ref($val);
	return []   unless defined($val);
	return [ $val ];
}
2663
# Look up the gitweb.<key> configuration variable of the current project.
#
#   $key  - variable name, with or without the leading "gitweb."
#   $type - optional 'bool' or 'int' (a leading "--" is accepted); any
#           other type is ignored
#
# Returns nothing if $git_dir is unset, the key is empty or contains
# non-word characters, or the variable does not exist.  Otherwise returns
# the stored value, the string 'true'/'false' for type bool, or the value
# converted by config_to_int for type int.
#
# The parsed configuration is cached in %config and re-read whenever
# "$git_dir/config" differs from the path remembered in $config_file.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
		$key = join(".", lc($1), $2, lc($3));
	} else {
		$key = lc($key);
	}
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);

	# type sanity check
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# get config, unless the cache already belongs to this repository
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $full_key = "gitweb.$key";
	return unless exists $config{$full_key};

	# ensure given type
	return $config{$full_key} unless defined $type;
	if ($type eq 'bool') {
		# backward compatibility: 'git config --bool' returns true/false
		return (config_to_bool($config{$full_key}) ? 'true' : 'false');
	}
	# the only type left after the sanity check is 'int'
	return config_to_int($config{$full_key});
}
2709
# Get the hash of the entry at the given path in the given tree-ish.
#
#   $base - tree-ish (ref) to look in
#   $path - path of the entry; trailing slashes are ignored
#   $type - optional object type ('blob', 'tree', ...) the entry must have
#
# Returns the object id, or undef when the path is empty, the entry does
# not exist, git-ls-tree fails, its output cannot be parsed, or the entry
# is of a different type than requested.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift || return undef;
	my $type = shift;

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# Take the fields from the match itself, so that an unparsable line
	# cannot pick up stale capture variables of an earlier match.
	# Object ids are 40 (SHA-1) or 64 (SHA-256) hex digits long.
	my ($entry_type, $entry_hash) =
		($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40}(?:[0-9a-fA-F]{24})?)\t/);
	if (!defined $entry_hash) {
		# unexpected ls-tree output
		return undef;
	}
	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2736
# Get the path of the entry with the given hash at the given tree-ish (ref).
# Used to get the 'from' filename for combined diff (merge commit) for
# renames.
#
# Walks the output of "git ls-tree -r -t -z $base" and returns the path of
# the first entry whose object id equals $hash.  Returns nothing when
# $base or $hash is missing, and undef when git cannot be started or no
# entry matches.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# entries are NUL-terminated in -z output
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
		# $hash is matched literally (\Q..\E); /s lets the path part
		# contain newlines, which -z output does not quote.
		if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
			close $fd;
			return $1;
		}
	}
	close $fd;
	return undef;
}
2760
2761 ## ......................................................................
2762 ## git utility functions, directly accessing git repository
2763
# Get the value of a config variable either from the file named as the
# variable itself in the repository ($GIT_DIR/$name file), or, if that
# file cannot be opened, from the gitweb.$name configuration variable in
# the repository config file.  Only the first line of the file is used.
# Sets $git_dir to the repository at "$projectroot/$path".
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open($fd, '<', "$git_dir/$name")) {
		return git_get_project_config($name);
	}
	my $conf = readline($fd);
	close($fd);

	chomp $conf if (defined $conf);
	return $conf;
}
2780
# Description of the project at $path: taken from its 'description' file
# or its gitweb.description config variable
# (via git_get_file_or_project_config).
sub git_get_project_description {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'description');
}
2785
# Category of the project at $path: taken from its 'category' file
# or its gitweb.category config variable
# (via git_get_file_or_project_config).
sub git_get_project_category {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'category');
}
2790
2791
# Collect the content tags ('ctags') of a project and return them as a
# hash reference mapping tag name to weight.  Sets $git_dir to the
# repository at "$projectroot/$project".
#
# supported formats (the first one available is used):
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			# only the first line of a tag file is looked at;
			# it is undef for an empty file
			my $val = <$ct>;
			chomp $val if defined $val;
			close $ct;

			# the tag name is the file's basename
			(my $ctag = $tagfile) =~ s#.*/##;
			if (defined $val && $val =~ /^\d+$/) {
				$ctags->{$ctag} = $val;
			} else {
				$ctags->{$ctag} = 1;
			}
		}
		closedir $dh;

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2838
# Return a hash reference where keys are content tags ('ctags'), and
# values are the sum of weights of the given tag over every project in
# the list referenced by $projects (each project keeps its own tags
# under its 'ctags' key).
sub git_gather_all_ctags {
	my $projects = shift;
	my %weight_of;

	for my $pr (@$projects) {
		my @names = keys %{$pr->{'ctags'}};
		$weight_of{$_} += $pr->{'ctags'}->{$_} for @names;
	}

	return \%weight_of;
}
2853
# Prepare a tag cloud from $ctags, a hash reference of tag => weight.
#
# Tags differing only in letter case are merged: their weights are added
# up and the spelling with the highest single weight is the one shown.
# The tag equal to the 'ctag' input parameter, if any, is marked with a
# <span class="match">.
#
# Returns an HTML::TagCloud object if that module can be loaded, otherwise
# a hash reference keyed by lowercased tag, each entry holding the summed
# 'count' and the linked 'ctag' HTML.
sub git_populate_project_tagcloud {
	my $ctags = shift;

	# First, merge different-cased tags; tags vote on casing
	my %ctags_lc;
	foreach my $name (keys %$ctags) {
		my $weight = $ctags->{$name};
		my $merged = ($ctags_lc{lc $name} ||= {});
		$merged->{count} += $weight;
		if (!$merged->{topcount} || $merged->{topcount} < $weight) {
			$merged->{topcount} = $weight;
			$merged->{topname} = $name;
		}
	}

	my $matched = $input_params{'ctag'};
	my $is_matched = sub { defined $matched && $matched eq $_[0] };

	unless (eval { require HTML::TagCloud; 1; }) {
		# HTML::TagCloud is not available: return plain data instead
		my $cloud = {};
		foreach my $ctag (keys %ctags_lc) {
			my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
			$title = qq(<span class="match">$title</span>)
				if $is_matched->($ctag);
			$cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
			$cloud->{$ctag}{ctag} =
				$cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
		}
		return $cloud;
	}

	my $cloud = HTML::TagCloud->new;
	foreach my $ctag (sort keys %ctags_lc) {
		# Pad the title with spaces so that the cloud looks
		# less crammed.
		my $title = esc_html($ctags_lc{$ctag}->{topname});
		$title =~ s/ /&nbsp;/g;
		$title =~ s/^/&nbsp;/g;
		$title =~ s/$/&nbsp;/g;
		$title = qq(<span class="match">$title</span>)
			if $is_matched->($ctag);
		$cloud->add($title, href(project=>undef, ctag=>$ctag),
		            $ctags_lc{$ctag}->{count});
	}
	return $cloud;
}
2899
# Render a tag cloud as HTML, showing at most $count tags.
#
# $cloud is either an HTML::TagCloud object, which then renders itself,
# or a plain hash reference whose entries hold a 'count' and the
# ready-made link HTML under 'ctag'.  In the latter case the tags are
# listed comma-separated in ascending order of count; when there are more
# than $count tags, the ones with the highest counts are kept.
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;
	if (ref $cloud eq 'HTML::TagCloud') {
		return $cloud->html_and_css($count);
	}

	my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
	# The list is sorted ascending, so the most used tags are at the end:
	# truncate from the front to drop the least used ones.
	@tags = @tags[-$count .. -1] if (@tags > $count);

	return
		'<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
		join (', ', map {
			$cloud->{$_}->{'ctag'}
		} @tags) .
		'</div>';
}
2914
# Get the list of URLs of the project at $path.
# The URLs are read one per line from the 'cloneurl' file of the
# repository; if that file cannot be opened, the values of the
# (multi-valued) 'url' project config variable are used instead.
# Returns a list in list context and an array reference otherwise.
# Sets $git_dir to the repository at "$projectroot/$path".
sub git_get_project_url_list {
	my $path = shift;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open($fd, '<', "$git_dir/cloneurl")) {
		return wantarray ?
			@{ config_to_multi(git_get_project_config('url')) } :
			   config_to_multi(git_get_project_config('url'));
	}

	my @urls;
	while (my $line = <$fd>) {
		chomp $line;
		push @urls, $line;
	}
	close $fd;

	return wantarray ? @urls : \@urls;
}
2928
# Build the list of projects, taken from $projects_list.
#
#   $filter   - optional path prefix; only projects below "$filter/" are
#               returned
#   $paranoid - if true, a directory scan still starts at the top of
#               $projects_list and the filter is applied to each path
#               found, instead of scanning only the filtered subdirectory
#
# If $projects_list is a directory it is searched (following symlinks)
# for directories that pass check_export_ok; if it is a file, every line
# holds an url-encoded project path, optionally followed by the owner.
# Returns a list of hash references with a 'path' entry (and an 'owner'
# entry when read from a file).
sub git_get_projects_list {
	my $filter = shift || '';
	my $paranoid = shift;
	my @list;

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list;
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);
		# when filtering, search only given subdirectory
		if ($filter && !$paranoid) {
			$dir .= "/$filter";
			$dir =~ s!/+$!!;
		}

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => sub {
				# global variables
				our $project_maxdepth;
				our $projectroot;
				# skip project-list toplevel, if we get it.
				return if (m!^[/.]$!);
				# only directories can be git repositories
				return unless (-d $_);
				# don't traverse too deep (Find is super slow on os x)
				# $project_maxdepth excludes depth of $projectroot
				if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
					$File::Find::prune = 1;
					return;
				}

				my $path = substr($File::Find::name, $pfxlen + 1);
				# paranoidly only filter here
				if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
					# leave the callback with 'return': a 'next'
					# here would exit the subroutine through a
					# loop inside File::Find
					return;
				}
				# we check related file in $projectroot
				if (check_export_ok("$projectroot/$path")) {
					push @list, { path => $path };
					$File::Find::prune = 1;
				}
			},
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		open my $fd, '<', $projects_list or return;
	PROJECT:
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			$path = unescape($path);
			$owner = unescape($owner);
			if (!defined $path) {
				next PROJECT;
			}
			# if $filter is provided, check if $path begins with $filter
			if ($filter && $path !~ m!^\Q$filter\E/!) {
				next PROJECT;
			}
			if (check_export_ok("$projectroot/$path")) {
				my $pr = {
					path => $path,
					owner => to_utf8($owner),
				};
				push @list, $pr;
			}
		}
		close $fd;
	}
	return @list;
}
3010
# Fork detection based on a prefix tree of path components; written with
# help of Tree::Trie module (Perl Artistic License, GPL compatible).
#
# Takes a reference to a list of project hashes and returns the list with
# forks removed.  As a side effect, each project whose fork directory exists
# gets a 'forks' field: a list reference to which its forks are appended.
sub filter_forks_from_projects_list {
	my $projects = shift;

	# prefix tree of directories (path components); the '' key of a node
	# is the end marker and holds the project registered at that path
	my %trie;

	# first pass: register every project that might contain forks
	foreach my $pr (@$projects) {
		my $path = $pr->{'path'};
		$path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
		next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
		next unless ($path);      # skip '.git' repository: tests, git-instaweb
		next unless (-d "$projectroot/$path"); # containing directory exists
		$pr->{'forks'} = [];      # there can be 0 or more forks of project

		# walk down the trie one component at a time,
		# creating the nodes that are not there yet
		my $node = \%trie;
		foreach my $dir (split('/', $path)) {
			$node->{$dir} = {} unless exists $node->{$dir};
			$node = $node->{$dir};
		}
		# end marker stores the project; the first one registered wins
		$node->{''} = $pr unless exists $node->{''};
	}

	# second pass: a project whose path has a registered proper prefix
	# is a fork of the project stored at the shortest such prefix
	my @filtered;
 PROJECT:
	foreach my $pr (@$projects) {
		my $node = \%trie;
		foreach my $dir (split('/', $pr->{'path'})) {
			if (exists $node->{''}) {
				# shortest prefix found: record as fork, drop from result
				push @{$node->{''}{'forks'}}, $pr;
				next PROJECT;
			}
			unless (exists $node->{$dir}) {
				# path leaves the trie: no prefix possible, not a fork
				push @filtered, $pr;
				next PROJECT;
			}
			$node = $node->{$dir};
		}
		# all components consumed without hitting an end marker
		# (shouldn't happen: it's either no match, or end marker)
		push @filtered, $pr;
	}

	return @filtered;
}
3070
# Select the projects matching a tag and/or a search regexp.
#
# Parameters:
#   $projlist - reference to a list of project hashes
#   %opts     - 'tagfilter'     => tag name; compared case-insensitively
#                                  against the keys of the 'ctags' hash
#               'search_regexp' => regexp matched against the 'path' and
#                                  'descr_long' fields
# Returns the list of matching projects; when neither option is set the
# input list is returned as is.
#
# note: fill_project_list_info is called from here (for 'ctags' and/or
# 'path', 'descr') before the filtering is done.
sub search_projects_list {
	my ($projlist, %opts) = @_;
	my $tagfilter = $opts{'tagfilter'};
	my $search_re = $opts{'search_regexp'};

	return @$projlist
		unless ($tagfilter || $search_re);

	# searching projects require filling to be run before it;
	fill_project_list_info($projlist,
	                       $tagfilter ? 'ctags' : (),
	                       $search_re ? ('path', 'descr') : ());

	# lower-case the wanted tag once instead of once per candidate key
	my $wanted_tag = $tagfilter ? lc($tagfilter) : undef;

	my @projects;
 PROJECT:
	foreach my $pr (@$projlist) {

		if ($tagfilter) {
			next PROJECT unless ref($pr->{'ctags'}) eq 'HASH';
			next PROJECT unless
				grep { lc($_) eq $wanted_tag } keys %{$pr->{'ctags'}};
		}

		if ($search_re) {
			# a project without long description is matched as if the
			# description was empty, without "uninitialized" warnings
			my $descr = defined $pr->{'descr_long'} ? $pr->{'descr_long'} : '';
			next PROJECT unless
				$pr->{'path'} =~ /$search_re/ ||
				$descr =~ /$search_re/;
		}

		push @projects, $pr;
	}

	return @projects;
}
3106
# Cache filled by git_get_project_list_from_file(): hash reference mapping
# project path to owner.  Undefined until the file was (tried to be) read.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list file.  Does nothing if
# the cache is already defined, so the file is read at most once.  If
# $projects_list is not a plain file, or cannot be opened, the cache is left
# as an empty hash.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	return unless (-f $projects_list);

	open(my $fd, '<', $projects_list)
		or return; # cannot read the index: keep the cache empty
	while (my $line = <$fd>) {
		chomp $line;
		my ($pr, $ow) = split ' ', $line;
		# blank line: there is no project to record an owner for
		next unless defined $pr;
		$pr = unescape($pr);
		$ow = unescape($ow);
		$gitweb_project_owner->{$pr} = to_utf8($ow);
	}
	close $fd;
	return;
}
3129
# Return the owner of $project, or undef when no project is given.
# The owner is taken from the first source that defines it:
#   1. the $gitweb_project_owner cache (read from the projects list file),
#   2. the 'owner' project configuration value,
#   3. the owner of the repository directory (get_file_owner).
# Side effect: sets the global $git_dir to "$projectroot/$project".
sub git_get_project_owner {
	my $project = shift;

	return undef unless $project;
	$git_dir = "$projectroot/$project";

	git_get_project_list_from_file()
		unless defined $gitweb_project_owner;

	my $owner;
	$owner = $gitweb_project_owner->{$project}
		if exists $gitweb_project_owner->{$project};
	$owner = git_get_project_config('owner')
		unless defined $owner;
	$owner = get_file_owner("$git_dir")
		unless defined $owner;

	return $owner;
}
3153
# Find out when the most recently committed-to branch of the project at
# $path (relative to $projectroot) was changed.
# Returns ($age, age_string($age)) with $age in seconds, (undef, undef) if
# no timestamp could be parsed from the git output, and an empty list if
# running git failed.
# Side effect: sets the global $git_dir.
sub git_get_last_activity {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";
	open(my $fd, "-|", git_cmd(), 'for-each-ref',
	     '--format=%(committer)',
	     '--sort=-committerdate',
	     '--count=1',
	     'refs/heads') or return;
	my $most_recent = <$fd>;
	close $fd or return;

	# committer line ends with "<epoch> <timezone>"
	return (undef, undef)
		unless defined $most_recent &&
		       $most_recent =~ / (\d+) [-+][01]\d\d\d$/;

	my $age = time - $1;
	return ($age, age_string($age));
}
3174
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find if that
# particular remote is defined is to walk the list provided by 'git remote -v'
# and keep only the entries for the remote we want.
#
# Parameters:
#   $wanted - optional remote name; if given only that remote is returned
# Returns a hash (list context) or hash reference (scalar context) keyed by
# remote name; each value holds 'heads' (empty list reference, to be filled
# by fill_remote_heads) and one entry per "(<key>)" suffix printed by git,
# mapping that key to the URL.  Returns nothing if git could not be run.
sub git_get_remotes_list {
	my $wanted = shift;
	my %remotes = ();

	# test the result of open itself rather than the handle variable
	open my $fd, '-|' , git_cmd(), 'remote', '-v'
		or return;
	while (my $remote = <$fd>) {
		chomp $remote;
		# line is "<name>\t<url> (<key>)"; strip all but the name and
		# skip lines of any other shape, so that stale captures from
		# a previous line are never used
		next unless $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
		my ($url, $key) = ($1, $2);
		next if $wanted and not $remote eq $wanted;

		# 'heads' => () would create an odd-sized hash (with a warning)
		$remotes{$remote} ||= { 'heads' => [] };
		$remotes{$remote}{$key} = $url;
	}
	close $fd or return;
	return wantarray ? %remotes : \%remotes;
}
3199
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
#
# For every remote the 'heads' field is set to a reference to the list of
# those heads (as returned by git_get_heads_list) whose name starts with
# "<remote>/"; that prefix is removed from the head's 'name' in place.
sub fill_remote_heads {
	my $remotes = shift;

	# nothing to fill; also avoids listing the default ref class for nothing
	return unless %$remotes;

	my @heads = map { "remotes/$_" } keys %$remotes;
	my @remoteheads = git_get_heads_list(undef, @heads);
	foreach my $remote (keys %$remotes) {
		# \Q..\E: the remote name is literal text, not a pattern
		# (it may contain '.', '+' and other metacharacters)
		$remotes->{$remote}{'heads'} = [ grep {
			$_->{'name'} =~ s!^\Q$remote\E/!!
			} @remoteheads ];
	}
}
3212
# Collect references grouped by the object they point to, using
# 'git show-ref --dereference'.
#
# Parameters:
#   $type - optional ref class below refs/ (empty string if not given);
#           when set, only "refs/$type" is asked for
# Returns a reference to a hash mapping object id to a list reference of
# ref names (with the "refs/" prefix removed), or nothing if git failed.
sub git_get_references {
	my $type = shift || "";
	my %refs;

	# use -- <pattern> if $type
	my @pattern = $type ? ("--", "refs/$type") : ();

	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
		or return;

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
		# the list for a new object id is created on first push
		push @{$refs{$1}}, $2;
	}
	close $fd or return;
	return \%refs;
}
3235
# Describe $hash relative to tags, using 'git name-rev --tags'.
# Returns the part of the name after "tags/", or undef if no hash was
# given, git printed nothing, or the output is not of the
# "<hash> tags/<name>" form.  Returns nothing if git could not be started.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# git printed nothing: do not match against an undefined value
	return undef unless defined $name_rev;

	# \Q..\E: $hash is matched as literal text
	if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
		return $1;
	} else {
		# catches also '$hash undefined' output
		return undef;
	}
}
3251
3252 ## ----------------------------------------------------------------------
3253 ## parse to hash functions
3254
# Break an epoch timestamp into display fields.
#
# Parameters:
#   $epoch - seconds since the epoch
#   $tz    - timezone as [-+]HHMM; defaults to "-0000".  A value that is
#            not of that form is treated as zero offset from UTC.
# Returns a hash with UTC fields ('hour', 'minute', 'mday', 'day', 'month',
# 'rfc2822', 'mday-time', 'iso-8601') and fields in the given timezone
# ('hour_local', 'minute_local', 'tz_local', 'iso-tz').
sub parse_date {
	my $epoch = shift;
	my $tz = shift || "-0000";

	my %date;
	my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
	my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
	$date{'hour'} = $hour;
	$date{'minute'} = $min;
	$date{'mday'} = $mday;
	$date{'day'} = $days[$wday];
	$date{'month'} = $months[$mon];
	$date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
	                     $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
	$date{'mday-time'} = sprintf "%d %s %02d:%02d",
	                     $mday, $months[$mon], $hour ,$min;
	$date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
	                     1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

	# offset of the timezone from UTC, in seconds; stays 0 when $tz
	# cannot be parsed, so no arithmetic is done on undefined captures
	my $tz_offset = 0;
	if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
		my ($tz_sign, $tz_hour, $tz_min) = ($1, $2, $3);
		$tz_offset = ($tz_sign eq '-' ? -1 : +1) *
		             ((($tz_hour*60) + $tz_min)*60);
	}
	# shifting the epoch and using gmtime gives the wall-clock time in $tz
	my $local = $epoch + $tz_offset;
	($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
	$date{'hour_local'} = $hour;
	$date{'minute_local'} = $min;
	$date{'tz_local'} = $tz;
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$year, $mon+1, $mday,
	                          $hour, $min, $sec, $tz);
	return %date;
}
3288
# Parse the tag object $tag_id, as printed by 'git cat-file tag'.
# Returns a hash with 'id', 'object', 'type', 'name', the 'author*' fields
# taken from the "tagger" line, and 'comment' (reference to the list of
# remaining lines).  Returns nothing if git failed or the object has no
# "tag" line.
sub parse_tag {
	my $tag_id = shift;

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

	my %tag = ('id' => $tag_id);
	my @comment;
 HEADER:
	while (my $line = <$fd>) {
		chomp $line;
		# empty line ends the header
		last HEADER if $line eq "";

		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
		} elsif ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
		} elsif ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
		} elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@tag{'author_name', 'author_email'} = ($1, $2);
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
		} elsif ($line =~ m/--BEGIN/) {
			# such a line also ends the header, but is kept in the comment
			push @comment, $line;
			last HEADER;
		}
	}
	# whatever is left of the object is the comment
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag;
}
3329
# Parse one record of 'git rev-list --header' output.
#
# Parameters:
#   $commit_text - text of the record; its last line is dropped
#   $withparents - when defined, the parents are taken only from the first
#                  line (the ids following the commit id); when undefined,
#                  the "parent" header lines are added as well
# Returns a hash describing the commit ('id', 'tree', 'parents', 'parent',
# author and committer fields, 'title', 'title_short', 'comment' and the
# age fields), or nothing if the text has no lines, does not start with an
# object id, or has no "tree" line.
sub parse_commit_text {
	my ($commit_text, $withparents) = @_;
	my %co;

	my @commit_lines = split '\n', $commit_text;
	pop @commit_lines; # Remove '\0'

	return unless @commit_lines;

	my $header = shift @commit_lines;
	return unless $header =~ m/^[0-9a-fA-F]{40}/;
	($co{'id'}, my @parents) = split ' ', $header;

	# header lines; the loop stops at the first line that is false
	# (the empty line in front of the commit message)
	while (my $line = shift @commit_lines) {
		last if $line eq "\n";
		if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
			$co{'tree'} = $1;
		} elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
			push @parents, $1;
		} elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
			$co{'author'} = to_utf8($1);
			$co{'author_epoch'} = $2;
			$co{'author_tz'} = $3;
			if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@co{'author_name', 'author_email'} = ($1, $2);
			} else {
				$co{'author_name'} = $co{'author'};
			}
		} elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
			$co{'committer'} = to_utf8($1);
			$co{'committer_epoch'} = $2;
			$co{'committer_tz'} = $3;
			if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
				@co{'committer_name', 'committer_email'} = ($1, $2);
			} else {
				$co{'committer_name'} = $co{'committer'};
			}
		}
	}
	return unless defined $co{'tree'};

	$co{'parents'} = \@parents;
	$co{'parent'} = $parents[0];

	# the title is the first non-empty line of the message; $title is an
	# alias into @commit_lines, so the edits below change that line too
 TITLE:
	foreach my $title (@commit_lines) {
		$title =~ s/^    //;
		next TITLE if $title eq "";

		$co{'title'} = chop_str($title, 80, 5);
		# remove leading stuff of merges to make the interesting part visible
		if (length($title) > 50) {
			$title =~ s/^Automatic //;
			$title =~ s/^merge (of|with) /Merge ... /i;
			$title =~ s/(http|rsync):\/\/// if length($title) > 50;
			$title =~ s/(master|www|rsync)\.// if length($title) > 50;
			$title =~ s/kernel.org:?// if length($title) > 50;
			$title =~ s/\/pub\/scm// if length($title) > 50;
		}
		$co{'title_short'} = chop_str($title, 50, 5);
		last TITLE;
	}
	unless (defined $co{'title'} && $co{'title'} ne "") {
		$co{'title'} = $co{'title_short'} = '(no commit message)';
	}
	# remove added spaces
	s/^    // foreach @commit_lines;
	$co{'comment'} = \@commit_lines;

	my $age = time - $co{'committer_epoch'};
	$co{'age'} = $age;
	$co{'age_string'} = age_string($age);
	my (undef, undef, undef, $mday, $mon, $year) = gmtime($co{'committer_epoch'});
	my $date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
	# older than two weeks: the date goes first, the relative age second
	@co{'age_string_date', 'age_string_age'} =
		$age > 60*60*24*7*2
			? ($date, $co{'age_string'})
			: ($co{'age_string'}, $date);
	return %co;
}
3427
# Parse a single commit.
#
# Runs 'git rev-list --parents --header --max-count=1 $commit_id --' and
# hands its (NUL terminated) record to parse_commit_text, with the parents
# taken from the first line of the record.
# Returns the hash produced by parse_commit_text; it is empty if git printed
# nothing or the record could not be parsed.
sub parse_commit {
	my ($commit_id) = @_;
	my %co;

	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "rev-list",
		"--parents",
		"--header",
		"--max-count=1",
		$commit_id,
		"--",
		or die_error(500, "Open git-rev-list failed");
	# read the record in scalar context: a readline in list context inside
	# the argument list would contribute zero arguments when git prints
	# nothing, shifting the '1' into the place of the commit text
	my $commit_text = <$fd>;
	%co = parse_commit_text($commit_text, 1)
		if defined $commit_text;
	close $fd;

	return %co;
}
3446
# Parse a series of commits listed by 'git rev-list --header'.
#
# Parameters:
#   $commit_id - revision to start listing from
#   $maxcount  - value for --max-count (1 if false)
#   $skip      - value for --skip (0 if false)
#   $filename  - optional path to limit the listing to
#   @args      - extra options put right after --header
# Returns the list of commit hash references (list context) or a reference
# to that list (scalar context); one entry is added per record read, each
# holding whatever parse_commit_text returned for it.
sub parse_commits {
	my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

	$maxcount ||= 1;
	$skip ||= 0;

	local $/ = "\0";

	my @rev_list_args = (
		"--header",
		@args,
		"--max-count=$maxcount",
		"--skip=$skip",
		@extra_options,
		$commit_id,
		"--",
	);
	push @rev_list_args, $filename if $filename;

	open my $fd, "-|", git_cmd(), "rev-list", @rev_list_args
		or die_error(500, "Open git-rev-list failed");

	my @cos;
	while (my $record = <$fd>) {
		push @cos, +{ parse_commit_text($record) };
	}
	close $fd;

	return wantarray ? @cos : \@cos;
}
3474
# parse line of git-diff-tree "raw" output
#
# Three kinds of lines are recognized:
#  * ordinary diff line: sets 'from_mode', 'to_mode', 'from_id', 'to_id',
#    'status', 'similarity', 'from_file', 'to_file' (and 'file', unless the
#    status is R or C)
#  * combined diff line (for merge commit): sets 'nparents', 'to_mode',
#    'to_id', 'to_file', and list references 'from_mode', 'from_id', 'status'
#  * bare object id: sets 'commit'
# Returns the result as a hash (list context) or hash reference (scalar
# context); it is empty for any other line.
sub parse_difftree_raw_line {
	my $line = shift;
	my %res;

	# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
	# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
	if (my @raw = $line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
		my $names = pop @raw;
		@res{qw(from_mode to_mode from_id to_id status similarity)} = @raw;
		if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
			# two tab separated names: source and destination
			($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $names);
		} else {
			$res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
		}
	}
	# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
	# combined diff (for merge commit)
	elsif (my @combined = $line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
		my ($colons, $modes, $ids, $status, $name) = @combined;
		# last mode and last id belong to the result, the rest to parents
		my @modes = split(' ', $modes);
		my @ids = split(' ', $ids);
		$res{'nparents'}  = length($colons);
		$res{'to_mode'}   = pop @modes;
		$res{'from_mode'} = \@modes;
		$res{'to_id'}     = pop @ids;
		$res{'from_id'}   = \@ids;
		$res{'status'}    = [ split('', $status) ];
		$res{'to_file'}   = unquote($name);
	}
	# 'c512b523472485aef4fff9e57b229d9d243c967f'
	elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
		$res{'commit'} = $1;
	}

	return wantarray ? %res : \%res;
}
3513
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
#
# A hash reference is taken to be pre-parsed (or generated by hand) and is
# returned untouched; anything else is passed to parse_difftree_raw_line.
sub parsed_difftree_line {
	my $line_or_ref = shift;

	return ref($line_or_ref) eq "HASH"
		? $line_or_ref
		: parse_difftree_raw_line($line_or_ref);
}
3526
# parse line of git-ls-tree output
#
# Parameters:
#   $line - one entry of the output
#   %opts - '-l' => true if the line has the size column ('git ls-tree -l')
#           '-z' => true if the name is to be taken verbatim; otherwise it
#                   is passed through unquote()
# Returns a hash (list context) or hash reference (scalar context) with
# 'mode', 'type', 'hash', 'name' and, with '-l', 'size'.  The result is
# empty if the line does not have the expected format (rather than being
# filled from the captures of some earlier, unrelated match).
sub parse_ls_tree_line {
	my $line = shift;
	my %opts = @_;
	my %res;

	my (@fields, @values);
	if ($opts{'-l'}) {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
		@fields = qw(mode type hash size name);
		@values = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;
	} else {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
		@fields = qw(mode type hash name);
		@values = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;
	}

	# a failed match returns the empty list: leave the result empty then
	if (@values) {
		@res{@fields} = @values;
		$res{'name'} = unquote($res{'name'})
			unless $opts{'-z'};
	}

	return wantarray ? %res : \%res;
}
3562
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# Parameters:
#   $diffinfo - parsed difftree line (hash reference)
#   $from     - hash reference, filled with 'file' and 'href' of the
#               preimage; for a combined diff both are list references
#               with one element per parent
#   $to       - hash reference, filled with 'file' and 'href' of the result
#   @parents  - parent commit ids, used for combined diffs
# An 'href' is left out (or undef, in the combined case) when the file does
# not exist on that side.  Reads the globals $hash_parent and $hash.
sub parse_from_to_diffinfo {
	my ($diffinfo, $from, $to, @parents) = @_;

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$from->{'file'} = [];
		$from->{'href'} = [];
		fill_from_file_info($diffinfo, @parents)
			unless exists $diffinfo->{'from_file'};
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			# fall back to the name in the result
			my $from_file = $diffinfo->{'from_file'}[$i];
			$from_file = $diffinfo->{'to_file'}
				unless defined $from_file;
			$from->{'file'}[$i] = $from_file;

			if ($diffinfo->{'status'}[$i] eq "A") {
				# new (added) file: nothing to link to in this parent
				$from->{'href'}[$i] = undef;
			} else {
				$from->{'href'}[$i] = href(action=>"blob",
				                           hash_base=>$parents[$i],
				                           hash=>$diffinfo->{'from_id'}[$i],
				                           file_name=>$from->{'file'}[$i]);
			}
		}
	} else {
		# ordinary (not combined) diff
		$from->{'file'} = $diffinfo->{'from_file'};
		if ($diffinfo->{'status'} eq "A") {
			# new (added) file
			delete $from->{'href'};
		} else {
			$from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
			                       hash=>$diffinfo->{'from_id'},
			                       file_name=>$from->{'file'});
		}
	}

	$to->{'file'} = $diffinfo->{'to_file'};
	if (is_deleted($diffinfo)) {
		# file does not exist in result
		delete $to->{'href'};
	} else {
		$to->{'href'} = href(action=>"blob", hash_base=>$hash,
		                     hash=>$diffinfo->{'to_id'},
		                     file_name=>$to->{'file'});
	}
}
3608
3609 ## ......................................................................
3610 ## parse to array of hashes functions
3611
# List heads using 'git for-each-ref', sorted by committer date, newest
# first.
#
# Parameters:
#   $limit   - if true, git is asked for at most $limit+1 refs
#   @classes - ref classes below refs/ to list; ('heads') if none given
# Returns a list (list context) or list reference (scalar context) of hash
# references with 'fullname', 'name' (without the refs/heads/ or
# refs/remotes/ prefix), 'id', 'title', 'epoch' and 'age'.  Returns nothing
# if git could not be run.
sub git_get_heads_list {
	my ($limit, @classes) = @_;
	@classes = ('heads') unless @classes;
	my @patterns = map { "refs/$_" } @classes;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-committerdate',
		'--format=%(objectname) %(refname) %(subject)%00%(committer)',
		@patterns
		or return;

	my @headslist;
	while (my $line = <$fd>) {
		chomp $line;
		# NUL separates the ref description from the committer info
		my ($refinfo, $committerinfo) = split(/\0/, $line);
		my ($hash, $fullname, $title) = split(' ', $refinfo, 3);
		my (undef, $epoch) =
			($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

		(my $name = $fullname) =~ s!^refs/(?:head|remote)s/!!;
		my $age = $epoch ? age_string(time - $epoch) : "unknown";

		push @headslist, {
			'fullname' => $fullname,
			'name'     => $name,
			'id'       => $hash,
			'title'    => $title || '(no commit message)',
			'epoch'    => $epoch,
			'age'      => $age,
		};
	}
	close $fd;

	return wantarray ? @headslist : \@headslist;
}
3650
# List tags using 'git for-each-ref refs/tags', sorted by creator date,
# newest first.
#
# Parameters:
#   $limit - if true, git is asked for at most $limit+1 refs
# Returns a list (list context) or list reference (scalar context) of hash
# references with 'fullname', 'name', 'type', 'id', 'reftype', 'refid',
# for tag objects 'subject', and for tag and commit objects 'epoch' and
# 'age'.  Returns nothing if git could not be run.
sub git_get_tags_list {
	my $limit = shift;

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
		'--format=%(objectname) %(objecttype) %(refname) '.
		'%(*objectname) %(*objecttype) %(subject)%00%(creator)',
		'refs/tags'
		or return;

	my @tagslist;
	while (my $line = <$fd>) {
		chomp $line;
		# NUL separates the ref description from the creator info
		my ($refinfo, $creatorinfo) = split(/\0/, $line);
		my ($id, $type, $fullname, $refid, $reftype, $title) = split(' ', $refinfo, 6);
		my (undef, $epoch) =
			($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
		(my $name = $fullname) =~ s!^refs/tags/!!;

		my %ref_item = (
			'fullname' => $fullname,
			'type'     => $type,
			'id'       => $id,
			'name'     => $name,
		);

		if ($type eq "tag") {
			# tag object: describe the object it points to
			$ref_item{'subject'} = $title;
			$ref_item{'reftype'} = $reftype;
			$ref_item{'refid'}   = $refid;
		} else {
			# ref points directly at the object
			$ref_item{'reftype'} = $type;
			$ref_item{'refid'}   = $id;
		}

		if ($type eq "tag" || $type eq "commit") {
			$ref_item{'epoch'} = $epoch;
			$ref_item{'age'} = $epoch
				? age_string(time - $epoch)
				: "unknown";
		}

		push @tagslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @tagslist : \@tagslist;
}
3699
3700 ## ----------------------------------------------------------------------
3701 ## filesystem-related functions
3702
# Return the name of the owner of $path: the GECOS field of the password
# entry of the file's owner, cut at the first ',' or ';' and converted with
# to_utf8.  Returns undef if $path cannot be stat'ed or its owner has no
# password entry.
sub get_file_owner {
	my $path = shift;

	# stat returns the empty list on failure; without this check the
	# undefined uid would be looked up as uid 0
	my $st_uid = (stat($path))[4];
	return undef unless defined $st_uid;

	my $gcos = (getpwuid($st_uid))[6];
	if (!defined $gcos) {
		return undef;
	}
	my $owner = $gcos;
	$owner =~ s/[,;].*$//;
	return to_utf8($owner);
}
3715
# Print the contents of $filename, each line converted with to_utf8.
# The file is expected to exist; if it cannot be opened nothing is printed
# (instead of reading from an unopened handle).
sub insert_file {
	my $filename = shift;

	open my $fd, '<', $filename
		or return;
	print map { to_utf8($_) } <$fd>;
	close $fd;
}
3724
3725 ## ......................................................................
3726 ## mimetype related functions
3727
# Look up the mimetype of $filename in the mime.types style file $mimemap.
#
# Lines of the map file are "<mimetype> <ext> <ext> ..."; lines starting
# with '#' are comments.  The extension is the part of $filename after its
# last dot and is compared exactly as written.
# Returns the mimetype, or undef if the map file is not readable, the
# filename has no extension, or the extension is not listed.
sub mimetype_guess_file {
	my $filename = shift;
	my $mimemap = shift;
	-r $mimemap or return undef;

	# no extension, nothing to look up; checking the match also keeps
	# captures of an earlier, unrelated match from being used
	my ($wanted_ext) = $filename =~ /\.([^.]*)$/;
	return undef unless defined $wanted_ext;

	my %mimemap;
	open(my $mh, '<', $mimemap) or return undef;
	# lexical loop variable: the caller's $_ is left alone
	while (my $line = <$mh>) {
		next if $line =~ m/^#/; # skip comments
		my ($mimetype, @exts) = split(/\s+/, $line);
		foreach my $ext (@exts) {
			$mimemap{$ext} = $mimetype;
		}
	}
	close($mh);

	return $mimemap{$wanted_ext};
}
3747
# Guess the mimetype of $filename from its extension.
# The $mimetypes_file map (if set) is consulted first, then
# '/etc/mime.types'.  Returns undef if the filename contains no dot or no
# map gives an answer.
sub mimetype_guess {
	my $filename = shift;
	return undef unless $filename =~ /\./;

	my $mime;
	if ($mimetypes_file) {
		# a relative path is relative to project
		my $file = ($mimetypes_file =~ m!^/!)
			? $mimetypes_file
			: "$projectroot/$project/$mimetypes_file";
		$mime = mimetype_guess_file($filename, $file);
	}
	$mime ||= mimetype_guess_file($filename, '/etc/mime.types');
	return $mime;
}
3764
# Determine the mimetype of a blob.
#
# Parameters:
#   $fd       - filehandle the blob can be read from (may be false)
#   $filename - name of the blob (may be false)
# The guess based on the filename (mimetype_guess) wins if there is one.
# Otherwise, without a filehandle $default_blob_plain_mimetype is returned;
# with one, content that passes the -T test is 'text/plain', and anything
# else is typed by a few well known image extensions or as
# 'application/octet-stream'.
sub blob_mimetype {
	my $fd = shift;
	my $filename = shift;

	if ($filename) {
		my $mime = mimetype_guess($filename);
		return $mime if $mime;
	}

	# just in case
	return $default_blob_plain_mimetype unless $fd;

	return 'text/plain' if -T $fd;
	return 'application/octet-stream' unless $filename;
	return 'image/png'  if $filename =~ m/\.png$/i;
	return 'image/gif'  if $filename =~ m/\.gif$/i;
	return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
	return 'application/octet-stream';
}
3791
# Return the content type for a blob: $type if given (true), otherwise the
# result of blob_mimetype($fd, $file_name).  For 'text/plain' the charset
# from $default_text_plain_charset is appended, if that is defined.
sub blob_contenttype {
	my ($fd, $file_name, $type) = @_;

	$type = blob_mimetype($fd, $file_name) unless $type;

	return $type
		unless $type eq 'text/plain' && defined $default_text_plain_charset;
	return $type . "; charset=$default_text_plain_charset";
}
3802
3803 # guess file syntax for syntax highlighting; return undef if no highlighting
3804 # the name of syntax can (in the future) depend on syntax highlighter used
sub guess_file_syntax {
	# Parameters: $highlight - true if highlighting is wanted,
	#             $mimetype  - accepted but not consulted here,
	#             $file_name - name of the file to classify.
	# Returns the syntax name from %highlight_basename (matched on the
	# whole base name) or %highlight_ext (matched on the extension), or
	# undef if neither table has an entry.
	my ($highlight, $mimetype, $file_name) = @_;
	return undef unless ($highlight && defined $file_name);

	# a trailing '.in' suffix is stripped before looking anything up
	my $basename = basename($file_name, '.in');
	return $highlight_basename{$basename}
		if exists $highlight_basename{$basename};

	# Take the extension from the match result itself.  Reading $1 after
	# an unchecked match would, for a name without a dot, pick up a stale
	# capture left by some earlier successful match.
	my ($ext) = $basename =~ /\.([^.]*)$/;
	return undef unless $ext;
	return $highlight_ext{$ext}
		if exists $highlight_ext{$ext};

	return undef;
}
3819
3820 # run highlighter and return FD of its output,
3821 # or return original FD if no highlighting
sub run_highlighter {
	# Parameters: $fd - open handle on the blob, $highlight - true if
	# highlighting is wanted, $syntax - syntax name for the highlighter.
	my ($fd, $highlight, $syntax) = @_;
	return $fd unless ($highlight && defined $syntax);

	# The plain handle is dropped and the same variable is reopened on a
	# shell pipeline: "cat-file blob" piped into the highlighter binary.
	# Note that the blob is identified by the file-level $hash, not by
	# an argument of this function.
	close $fd;
	my $pipeline =
		quote_command(git_cmd(), "cat-file", "blob", $hash) . " | " .
		quote_command($highlight_bin) .
		" --replace-tabs=8 --fragment --syntax $syntax |";
	open $fd, $pipeline
		or die_error(500, "Couldn't open file or run syntax highlighter");
	return $fd;
}
3833
3834 ## ======================================================================
3835 ## functions printing HTML: header, footer, error page
3836
# Compose the page title from the site name and, when set, the project
# filter, or the project, action and file name of the current request.
sub get_page_title {
	my $title = to_utf8($site_name);

	if (!defined $project) {
		# project-independent page: mention the filter, if any
		$title .= " - projects in '" . esc_path($project_filter) . "'"
			if defined $project_filter;
		return $title;
	}

	$title .= " - " . to_utf8($project);
	defined $action or return $title;

	$title .= "/$action"; # $action is US-ASCII (7bit ASCII)
	defined $file_name or return $title;

	$title .= " - " . esc_path($file_name);
	# in the tree view the name gets a trailing slash unless it has one
	$title .= "/" if ($action eq "tree" && $file_name !~ m|/$|);

	return $title;
}
3859
# Choose the content type for HTML pages.
# 'application/xhtml+xml' is sent only when the UA names it explicitly in
# its Accept header; everything else gets plain old 'text/html'.  This is
# needed because MSIE sometimes globs '*/*', pretending to support
# xhtml+xml but choking when it gets what it asked for.
sub get_content_type_html {
	my $accept = $cgi->http('HTTP_ACCEPT');

	return 'text/html' unless defined $accept;

	# the type must be spelled out literally, not covered by a wildcard
	return 'text/html'
		unless $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/;

	# and it must not be listed with a zero preference
	return 'text/html' if $cgi->Accept('application/xhtml+xml') == 0;

	return 'application/xhtml+xml';
}
3873
# Print the <link rel="alternate"> elements for the document head.
# With a project selected: for each of RSS and Atom, one link to the feed
# and one to its "--no-merges" variant.  Without a project: links to the
# plain-text project index and to the OPML list of feeds.
sub print_feed_meta {
	if (!defined $project) {
		printf('<link rel="alternate" title="%s projects list" '.
		       'href="%s" type="text/plain; charset=utf-8" />'."\n",
		       esc_attr($site_name),
		       esc_attr(href(project=>undef, action=>"project_index")));
		printf('<link rel="alternate" title="%s projects feeds" '.
		       'href="%s" type="text/x-opml" />'."\n",
		       esc_attr($site_name),
		       esc_attr(href(project=>undef, action=>"opml")));
		return;
	}

	my %href_params = get_feed_info();
	$href_params{'-title'} = 'log'
		unless exists $href_params{'-title'};

	foreach my $format (qw(RSS Atom)) {
		my $type = lc($format);
		my $title = esc_attr("$project - $href_params{'-title'} - $format feed");

		# Each variant gets its own copy of the parameters.  Setting
		# 'extra_options' on the shared hash would carry '--no-merges'
		# over into the plain link of the next format.
		my %plain     = (%href_params, 'action' => $type);
		my %no_merges = (%plain, 'extra_options' => '--no-merges');

		foreach my $variant ([ $title,                \%plain     ],
		                     [ "$title (no merges)",  \%no_merges ]) {
			my ($link_title, $params) = @$variant;
			# the URL goes into an attribute value, so it is escaped
			# like the title is
			print "<link ".
			      "rel=\"alternate\" ".
			      "title=\"$link_title\" ".
			      "href=\"" . esc_attr(href(%$params)) . "\" ".
			      "type=\"application/$type+xml\" ".
			      "/>\n";
		}
	}
}
3918
# Print the <link> elements of the document head: stylesheets, feed
# links (only for a '200 OK' page) and the favicon.
# Parameter: $status - the HTTP status string of the page being printed.
sub print_header_links {
	my $status = shift;

	# A defined $stylesheet (kept for backwards compatibility with old
	# config files) takes precedence over @stylesheets; empty entries of
	# @stylesheets are skipped.
	my @sheets = defined $stylesheet
		? ($stylesheet)
		: grep { $_ } @stylesheets;
	foreach my $sheet (@sheets) {
		print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
	}

	if ($status eq '200 OK') {
		print_feed_meta();
	}

	print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
		if defined $favicon;
}
3938
# Print one breadcrumb link per path component.
# Each argument is one component; every link targets the project_list
# action with project_filter set to the path accumulated so far, and is
# followed by " / ".
sub print_nav_breadcrumbs_path {
	my $dirprefix = undef;
	foreach my $part (@_) {
		# Skip missing or empty components.  Length is tested rather than
		# truth, so that a directory named "0" is neither dropped nor
		# allowed to cut the trail short.
		next unless defined $part && length $part;

		$dirprefix .= "/" if defined $dirprefix;
		$dirprefix .= $part;
		print $cgi->a({-href => href(project => undef,
		                             project_filter => $dirprefix,
		                             action => "project_list")},
		              esc_html($part)) . " / ";
	}
}
3950
# Print the breadcrumb trail: home link, then either the path to the
# current project followed by the action, or the project filter path.
# Options: -action_extra => text appended after the action; when given,
# the action itself is printed as a link.
sub print_nav_breadcrumbs {
	my %opts = @_;

	print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";

	if (!defined $project) {
		# no project selected: only the filter (if any) is shown
		print_nav_breadcrumbs_path(split '/', $project_filter)
			if defined $project_filter;
		return;
	}

	my @dirname = split '/', $project;
	my $projectbasename = pop @dirname;
	print_nav_breadcrumbs_path(@dirname);
	print $cgi->a({-href => href(action=>"summary")}, esc_html($projectbasename));

	my $action_extra = $opts{-action_extra};
	if (defined $action) {
		my $action_print = defined $action_extra
			? $cgi->a({-href => href(action=>$action)}, $action)
			: $action;
		print " / $action_print";
	}
	print " / $action_extra" if defined $action_extra;
	print "\n";
}
3976
# Print the search form of the page header.
# Reads the file-level $searchtext, $hash_base, $hash, $project,
# $my_uri and $search_use_regexp; an undefined $searchtext is set to "".
sub print_search_form {
	$searchtext = "" unless defined $searchtext;

	# search starts from the hash base, else the hash, else HEAD
	my $search_hash = defined $hash_base ? $hash_base
	                : defined $hash      ? $hash
	                :                      "HEAD";

	my $action = $my_uri;
	my $use_pathinfo = gitweb_check_feature('pathinfo');
	# with path_info the project is part of the form's target URL;
	# otherwise it travels in a hidden "p" field
	$action .= "/".esc_url($project) if $use_pathinfo;

	print $cgi->startform(-method => "get", -action => $action) .
	      "<div class=\"search\">\n" .
	      ($use_pathinfo
	       ? ''
	       : $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
	      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
	      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
	      $cgi->popup_menu(-name => 'st', -default => 'commit',
	                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
	      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
	      " search:\n",
	      $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
	      "<span title=\"Extended regular expression\">" .
	      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
	                     -checked => $search_use_regexp) .
	      "</span>" .
	      "</div>" .
	      $cgi->end_form() . "\n";
}
4012
# Print the HTTP header (unless suppressed) and the top of the HTML page:
# document head, optional site header, logo, breadcrumbs, search form.
# Parameters: $status  - HTTP status string, defaults to "200 OK",
#             $expires - value for the header's -expires,
#             %opts    - '-no_http_header' suppresses the HTTP header;
#                        all options are passed on to the breadcrumbs.
sub git_header_html {
	my ($status, $expires, %opts) = @_;
	$status ||= "200 OK";

	my $title = get_page_title();
	my $content_type = get_content_type_html();
	if (!$opts{'-no_http_header'}) {
		print $cgi->header(-type=>$content_type, -charset => 'utf-8',
		                   -status=> $status, -expires => $expires);
	}

	my $mod_perl_version = '';
	$mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};
	print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
	# the stylesheet, favicon etc urls won't work correctly with path_info
	# unless we set the appropriate base URL
	print "<base href=\"".esc_url($base_url)."\" />\n"
		if $ENV{'PATH_INFO'};
	print_header_links($status);

	print to_utf8($site_html_head_string)
		if defined $site_html_head_string;

	print "</head>\n" .
	      "<body>\n";

	# optional site-wide header, included only if the file exists
	insert_file($site_header)
		if (defined $site_header && -f $site_header);

	print "<div class=\"page_header\">\n";
	if (defined $logo) {
		print $cgi->a({-href => esc_url($logo_url),
		               -title => $logo_label},
		              $cgi->img({-src => esc_url($logo),
		                         -width => 72, -height => 27,
		                         -alt => "git",
		                         -class => "logo"}));
	}
	print_nav_breadcrumbs(%opts);
	print "</div>\n";

	# the search form is shown only inside a project
	my $have_search = gitweb_check_feature('search');
	print_search_form()
		if (defined $project && $have_search);
}
4071
# Print the bottom of the HTML page: footer with project description and
# feed links, optional timing info, optional site footer, the JavaScript
# bootstrap, and the closing </body></html>.
sub git_footer_html {
	my $feed_class = 'rss_logo';

	print "<div class=\"page_footer\">\n";
	if (!defined $project) {
		# project-independent pages link to the OPML and text indexes
		print $cgi->a({-href => href(project=>undef, action=>"opml",
		                             project_filter => $project_filter),
		              -class => $feed_class}, "OPML") . " ";
		print $cgi->a({-href => href(project=>undef, action=>"project_index",
		                             project_filter => $project_filter),
		              -class => $feed_class}, "TXT") . "\n";
	} else {
		my $descr = git_get_project_description($project);
		print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
			if defined $descr;

		my %href_params = get_feed_info();
		# no specific feed info: mark the links as generic
		$feed_class .= ' generic' unless %href_params;
		$href_params{'-title'} ||= 'log';

		foreach my $format ('RSS', 'Atom') {
			$href_params{'action'} = lc($format);
			print $cgi->a({-href => href(%href_params),
			              -title => "$href_params{'-title'} $format feed",
			              -class => $feed_class}, $format)."\n";
		}
	}
	print "</div>\n"; # class="page_footer"

	if (defined $t0 && gitweb_check_feature('timed')) {
		print "<div id=\"generating_info\">\n";
		print 'This page took '.
		      '<span id="generating_time" class="time_span">'.
		      tv_interval($t0, [ gettimeofday() ]).
		      ' seconds </span>'.
		      ' and '.
		      '<span id="generating_cmd">'.
		      $number_of_git_cmds.
		      '</span> git commands '.
		      " to generate.\n";
		print "</div>\n"; # id="generating_info"
	}

	insert_file($site_footer)
		if (defined $site_footer && -f $site_footer);

	print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
	if (defined $action && $action eq 'blame_incremental') {
		print qq!<script type="text/javascript">\n!.
		      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
		      qq!           "!. href() .qq!");\n!.
		      qq!</script>\n!;
	} else {
		my ($jstimezone, $tz_cookie, $datetime_class) =
			gitweb_get_feature('javascript-timezone');

		# collect the statements for window.onload, then emit the script
		my $onload = '';
		$onload .= qq!       fixLinks();\n!
			if gitweb_check_feature('javascript-actions');
		if ($jstimezone && $tz_cookie && $datetime_class) {
			$onload .=
				qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
				qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
		}
		print qq!<script type="text/javascript">\n!.
		      qq!window.onload = function () {\n!.
		      $onload.
		      qq!};\n!.
		      qq!</script>\n!;
	}

	print "</body>\n" .
	      "</html>";
}
4150
4151 # die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
4152 # Example: die_error(404, 'Hash not found')
4153 # By convention, use the following status codes (as defined in RFC 2616):
4154 # 400: Invalid or missing CGI parameters, or
4155 #      requested object exists but has wrong type.
4156 # 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
4157 #      this server or project.
4158 # 404: Requested object/revision/project doesn't exist.
4159 # 500: The server isn't configured properly, or
4160 #      an internal error occurred (e.g. failed assertions caused by bugs), or
4161 #      an unknown error occurred (e.g. the git binary died unexpectedly).
4162 # 503: The server is currently unavailable (because it is overloaded,
4163 #      or down for maintenance).  Generally, this is a temporary state.
sub die_error {
	# Parameters: $status - numeric HTTP status code (default 500),
	#             $error  - message, HTML-escaped before printing,
	#             $extra  - optional description printed as-is (HTML),
	#             %opts   - passed on to git_header_html();
	#                       '-error_handler' makes the function return
	#                       instead of jumping to DONE_GITWEB.
	my $status = shift || 500;
	my $error = esc_html(shift) || "Internal Server Error";
	my $extra = shift;
	my %opts = @_;

	my %http_responses = (
		400 => '400 Bad Request',
		403 => '403 Forbidden',
		404 => '404 Not Found',
		500 => '500 Internal Server Error',
		503 => '503 Service Unavailable',
	);
	# A code missing from the table must not reach git_header_html() as
	# undef: that would send the error page with the default "200 OK".
	my $http_status = $http_responses{$status} || $http_responses{500};
	git_header_html($http_status, undef, %opts);
	print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
	if (defined $extra) {
		print "<hr />\n" .
		      "$extra\n";
	}
	print "</div>\n";

	git_footer_html();
	goto DONE_GITWEB
		unless ($opts{'-error_handler'});
}
4194
4195 ## ----------------------------------------------------------------------
4196 ## functions printing or outputting HTML: navigation
4197
# Print the page navigation bar (<div class="page_nav">).
# Parameters: $current  - name of the current view, printed without link,
#             $suppress - name of a standard view to leave out,
#             $head     - hash used for commit/commitdiff links (and for
#                         shortlog/log links from selected views),
#             $treehead, $treebase - hash and hash_base for the tree link,
#             $extra    - HTML for the second line (pager or formats).
# Entries configured through the 'actions' feature are inserted after
# the view they name.
sub git_print_page_nav {
	my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
	$extra = '' unless defined $extra; # pager or formats

	my @navs = grep { !$suppress || $_ ne $suppress }
	           qw(summary shortlog log commit commitdiff tree);

	# href() parameters for every standard view
	my %arg;
	$arg{$_} = { action => $_ } foreach @navs;

	if (defined $head) {
		$arg{$_}{'hash'} = $head foreach qw(commit commitdiff);
		if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
			$arg{$_}{'hash'} = $head foreach qw(shortlog log);
		}
	}

	$arg{'tree'}{'hash'} = $treehead if defined $treehead;
	$arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

	# placeholders available in custom action links
	my %repl = (
		'%' => '%',
		'n' => $project,         # project name
		'f' => $git_dir,         # project path within filesystem
		'h' => $treehead || '',  # current hash ('h' parameter)
		'b' => $treebase || '',  # hash base ('hb' parameter)
	);
	my @actions = gitweb_get_feature('actions');
	while (@actions) {
		# the feature value is a flat list of (label, link, position)
		my ($label, $link, $pos) = splice(@actions,0,3);
		# put the label right after the view named by $pos
		@navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
		# expand %-placeholders
		$link =~ s/%([%nfhb])/$repl{$1}/g;
		$arg{$label}{'_href'} = $link;
	}

	# the current view is plain text, everything else a link
	my @entries = map {
		$_ eq $current
			? $_
			: $cgi->a({-href => ($arg{$_}{_href} || href(%{$arg{$_}}))}, "$_")
	} @navs;

	print "<div class=\"page_nav\">\n" . join(" | ", @entries);
	print "<br/>\n$extra<br/>\n" .
	      "</div>\n";
}
4247
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes) with the current view disabled and the remotes view only
# available if the feature is enabled
sub format_ref_views {
	my ($current) = @_;

	my @ref_views = ('tags', 'heads');
	push @ref_views, 'remotes' if gitweb_check_feature('remote_heads');

	# the current view is plain text, the others are links
	my @entries;
	foreach my $view (@ref_views) {
		if ($view eq $current) {
			push @entries, $view;
		} else {
			push @entries, $cgi->a({-href => href(action=>$view)}, $view);
		}
	}
	return join " | ", @entries;
}
4260
# Return the "first . prev . next" pager as an HTML string.
# Parameters: $action - accepted but not used here,
#             $page   - number of the current page (0 is the first),
#             $has_next_link - true if a following page exists.
# Entries that make no sense on the current page are plain text.
sub format_paging_nav {
	my ($action, $page, $has_next_link) = @_;

	my @entries;
	if ($page > 0) {
		push @entries,
			$cgi->a({-href => href(-replay=>1, page=>undef)}, "first"),
			$cgi->a({-href => href(-replay=>1, page=>$page-1),
			         -accesskey => "p", -title => "Alt-p"}, "prev");
	} else {
		push @entries, "first", "prev";
	}

	if ($has_next_link) {
		push @entries,
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
	} else {
		push @entries, "next";
	}

	return join(" &sdot; ", @entries);
}
4286
4287 ## ......................................................................
4288 ## functions printing or outputting HTML: div
4289
# Print a <div class="header"> holding a single title link.
# Parameters: $action - action the link points to (also the link text
#                       when $title is false),
#             $title  - link text,
#             $hash, $hash_base - added to the link when true.
sub git_print_header_div {
	my ($action, $title, $hash, $hash_base) = @_;

	my %args = ('action' => $action);
	$args{'hash'} = $hash if $hash;
	$args{'hash_base'} = $hash_base if $hash_base;

	my $label = $title ? $title : $action;
	print "<div class=\"header\">\n" .
	      $cgi->a({-href => href(%args), -class => "title"}, $label) .
	      "\n</div>\n";
}
4303
# Return one "metadata_url" table row with $name in the first cell and
# $url in the second.  Both values are inserted as given.
sub format_repo_url {
	my ($name, $url) = @_;
	return join('',
		'<tr class="metadata_url">',
		"<td>$name</td>",
		"<td>$url</td>",
		"</tr>\n");
}
4308
4309 # Group output by placing it in a DIV element and adding a header.
4310 # Options for start_div() can be provided by passing a hash reference as the
4311 # first parameter to the function.
4312 # Options to git_print_header_div() can be provided by passing an array
4313 # reference. This must follow the options to start_div if they are present.
4314 # The content can be a scalar, which is output as-is, a scalar reference, which
4315 # is output after html escaping, an IO handle passed either as *handle or
4316 # *handle{IO}, or a function reference. In the latter case all following
4317 # parameters will be taken as argument to the content function call.
sub git_print_section {
	my ($div_args, $header_args);

	# leading optional arguments: hash ref (div options), then
	# array ref (header options); whatever follows is the content
	my $arg = shift;
	if (ref($arg) eq 'HASH') {
		$div_args = $arg;
		$arg = shift;
	}
	if (ref($arg) eq 'ARRAY') {
		$header_args = $arg;
		$arg = shift;
	}
	my $content = $arg;

	print $cgi->start_div($div_args);
	git_print_header_div(@$header_args);

	# dispatch on the kind of content given
	my $kind = ref($content);
	if ($kind eq 'CODE') {
		# remaining arguments go to the content function
		$content->(@_);
	} elsif ($kind eq 'SCALAR') {
		print esc_html($$content);
	} elsif ($kind eq 'GLOB' or $kind eq 'IO::Handle') {
		print <$content>;
	} elsif (!$kind && defined($content)) {
		print $content;
	}

	print $cgi->end_div;
}
4346
# Return the HTML for a timestamp.
# Parameter: $date - hash ref; the keys 'rfc2822', 'hour_local',
# 'minute_local' and 'tz_local' are read.
# The RFC 2822 string is wrapped in a <span> when the
# 'javascript-timezone' feature supplies a class name, and is followed by
# the local time in parentheses (marked "atnight" before 6 o'clock).
sub format_timestamp_html {
	my $date = shift;

	my (undef, undef, $datetime_class) =
		gitweb_get_feature('javascript-timezone');

	my $strtime = $date->{'rfc2822'};
	$strtime = qq!<span class="$datetime_class">$strtime</span>!
		if $datetime_class;

	my $localtime_format = ($date->{'hour_local'} < 6)
		? '(<span class="atnight">%02d:%02d</span> %s)'
		: '(%02d:%02d %s)';

	return $strtime . ' ' .
	       sprintf($localtime_format,
	               $date->{'hour_local'}, $date->{'minute_local'}, $date->{'tz_local'});
}
4367
4368 # Outputs the author name and date in long form
sub git_print_authorship {
	# Parameters: $co   - commit hash ref ('author_name', 'author_epoch',
	#                     'author_tz' and 'author_email' are read),
	#             %opts - '-tag' names the enclosing element
	#                     (default 'div').
	my ($co, %opts) = @_;
	my $tag = $opts{-tag} || 'div';
	my $author = $co->{'author_name'};

	my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

	# pieces in output order: author link, timestamp, avatar
	my $author_link = format_search_author($author, "author", esc_html($author));
	my $timestamp = format_timestamp_html(\%ad);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

	print "<$tag class=\"author_date\">" .
	      $author_link .
	      " [" . $timestamp . "]" .
	      $avatar .
	      "</$tag>\n";
}
4382
4383 # Outputs table rows containing the full author or committer information,
4384 # in the format expected for 'commit' view (& similar).
4385 # Parameters are a commit hash reference, followed by the list of people
4386 # to output information for. If the list is empty it defaults to both
4387 # author and committer.
sub git_print_authorship_rows {
	# Each person takes two table rows: name and e-mail (both as search
	# links) with the avatar spanning both rows, then the timestamp.
	my ($co, @people) = @_;
	@people = ('author', 'committer') unless @people;

	foreach my $who (@people) {
		my $name  = $co->{"${who}_name"};
		my $email = $co->{"${who}_email"};
		my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

		print "<tr><td>$who</td><td>" .
		      format_search_author($name, $who, esc_html($name)) . " " .
		      format_search_author($email, $who, esc_html("<" . $email . ">")) .
		      "</td><td rowspan=\"2\">" .
		      git_get_avatar($email, -size => 'double') .
		      "</td></tr>\n" .
		      "<tr>" .
		      "<td></td><td>" .
		      format_timestamp_html(\%wd) .
		      "</td>" .
		      "</tr>\n";
	}
}
4410
# Print the path of the current object as a row of links
# (<div class="page_path">).
# Parameters: $name - path within the tree (may be undef),
#             $type - 'blob' or 'tree' turns the last component into a
#                     link; anything else prints it as plain text,
#             $hb   - hash base used in every link.
sub git_print_page_path {
	my ($name, $type, $hb) = @_;

	print "<div class=\"page_path\">";
	print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
	              -title => 'tree root'}, to_utf8("[$project]"));
	print " / ";
	if (defined $name) {
		my @dirname = split '/', $name;
		my $basename = pop @dirname;
		my $fullname = '';

		foreach my $dir (@dirname) {
			# Decide on the separator by length, not truth: after a
			# leading directory named "0" the accumulated path is
			# false but not empty, and still needs its '/'.
			$fullname .= (length($fullname) ? '/' : '') . $dir;
			print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
			                             hash_base=>$hb),
			              -title => $fullname}, esc_path($dir));
			print " / ";
		}
		# NOTE(review): the two links below use the file-level $file_name
		# rather than $name; this is only equivalent when callers pass
		# $file_name as $name - confirm against callers.
		if (defined $type && $type eq 'blob') {
			print $cgi->a({-href => href(action=>"blob_plain", file_name=>$file_name,
			                             hash_base=>$hb),
			              -title => $name}, esc_path($basename));
		} elsif (defined $type && $type eq 'tree') {
			print $cgi->a({-href => href(action=>"tree", file_name=>$file_name,
			                             hash_base=>$hb),
			              -title => $name}, esc_path($basename));
			print " / ";
		} else {
			print esc_path($basename);
		}
	}
	print "<br/></div>\n";
}
4448
# Print a commit message as HTML, one line per <br/>.
# Parameters: $log  - array ref of message lines (modified in place:
#                     the title and leading empty lines are shifted off),
#             %opts - '-remove_title'     drop the first line,
#                     '-remove_signoff'   omit signoff-like and link lines,
#                     '-final_empty_line' end with a single empty line.
sub git_print_log {
	my $log = shift;
	my %opts = @_;

	if ($opts{'-remove_title'}) {
		# remove title, i.e. first line of log
		shift @$log;
	}
	# remove leading empty lines
	while (defined $log->[0] && $log->[0] eq "") {
		shift @$log;
	}

	# print log
	my $skip_blank_line = 0;
	foreach my $line (@$log) {
		if ($line =~ m/^\s*([A-Z][-A-Za-z]*-[Bb]y|C[Cc]): /) {
			if (! $opts{'-remove_signoff'}) {
				print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
				$skip_blank_line = 1;
			}
			next;
		}

		# "Link: <url>" style tags.  The pattern is anchored at the start
		# of the line like the signoff pattern above, so that ordinary
		# sentences which merely contain "link: http://..." are left to
		# the generic formatter; anything after the URL is kept.
		if ($line =~ m,^\s*([a-z]*link): (https?://\S+)(.*)$,i) {
			my ($tag, $url, $rest) = ($1, $2, $3);
			if (! $opts{'-remove_signoff'}) {
				print "<span class=\"signoff\">" . esc_html($tag) . ": " .
					"<a href=\"" . esc_html($url) . "\">" . esc_html($url) . "</a>" .
					esc_html($rest) .
					"</span><br/>\n";
				$skip_blank_line = 1;
			}
			next;
		}

		# print only one empty line
		# do not print empty line after signoff
		if ($line eq "") {
			next if ($skip_blank_line);
			$skip_blank_line = 1;
		} else {
			$skip_blank_line = 0;
		}

		print format_log_line_html($line) . "<br/>\n";
	}

	if ($opts{'-final_empty_line'}) {
		# end with single empty line
		print "<br/>\n" unless $skip_blank_line;
	}
}
4500
4501 # return link target (what link points to)
sub git_get_link_target {
	# Parameter: $hash - id of the blob that stores the link.
	# Returns the blob's entire contents, or nothing if the command
	# cannot be started or its pipe does not close cleanly.
	my $hash = shift;

	# read link
	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or return;

	# slurp everything in one read
	my $link_target = do { local $/ = undef; <$fd> };

	close $fd
		or return;

	return $link_target;
}
4518
# Given a link target, and the directory (basedir) the link is in,
# return the target of the link relative to the top directory (top tree),
# with empty, '.' and '..' path components resolved.
# Returns nothing (undef in scalar context) if it is not possible:
# for absolute links, and for links leading outside the top directory.
sub normalize_link_target {
	my ($link_target, $basedir) = @_;

	# absolute symlinks (beginning with '/') cannot be normalized
	return if (substr($link_target, 0, 1) eq '/');

	# normalize link target to path from top (root) tree (dir);
	# compare with the empty string instead of testing for truth,
	# so that a directory named "0" is not mistaken for the top tree
	my $path;
	if (defined $basedir && $basedir ne '') {
		$path = $basedir . '/' . $link_target;
	} else {
		# we are in top (root) tree (dir)
		$path = $link_target;
	}

	# remove //, /./, and /../
	my @path_parts;
	foreach my $part (split('/', $path)) {
		# discard '' and '.'; the empty string is tested for explicitly
		# because "0" is false in Perl, yet it is a valid path component
		next if ($part eq '' || $part eq '.');
		# handle '..'
		if ($part eq '..') {
			# link leads outside repository (outside top dir)
			return unless @path_parts;
			pop @path_parts;
		} else {
			push @path_parts, $part;
		}
	}

	return join('/', @path_parts);
}
4558
# Print tree entry $t (a row of git_tree), but without the encompassing
# <tr> element.  The cells printed are, in order: the mode, the size
# (only if $t has a 'size' key), the name of the entry (a link for blobs
# and trees), and the action links that apply to the type of the entry.
# $basedir is prepended as-is to the entry name to form file names,
# $hash_base (may be undefined) is the commit the tree is shown for,
# and $have_blame tells whether to offer the "blame" link for blobs.
sub git_print_tree_entry {
	my ($t, $basedir, $hash_base, $have_blame) = @_;

	# hash_base is handed to href() only when we actually have one
	my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
	my $type = $t->{'type'};

	print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
	print "<td class=\"size\">$t->{'size'}</td>\n"
		if exists $t->{'size'};

	if ($type eq "blob") {
		my $path = "$basedir$t->{'name'}";

		# name of the entry, linking to the 'blob' view
		print "<td class=\"list\">" .
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>$path, %base_key),
			        -class => "list"}, esc_path($t->{'name'}));
		if (S_ISLNK(oct $t->{'mode'})) {
			# symbolic link: show what it points to as well, as a link
			# whenever the target can be expressed as path from top tree
			my $link_target = git_get_link_target($t->{'hash'});
			if ($link_target) {
				my $norm_target = normalize_link_target($link_target, $basedir);
				print " -> " .
				      (defined $norm_target
				       ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
				                                file_name=>$norm_target),
				                  -title => $norm_target}, esc_path($link_target))
				       : esc_path($link_target));
			}
		}
		print "</td>\n";

		# action links: blob [| blame] [| history] | raw
		my @links = (
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>$path, %base_key)},
			        "blob"),
		);
		if ($have_blame) {
			push @links,
				$cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
				                       file_name=>$path, %base_key)},
				        "blame");
		}
		if (defined $hash_base) {
			push @links,
				$cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
				                       hash=>$t->{'hash'}, file_name=>$path)},
				        "history");
		}
		push @links,
			$cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
			                       file_name=>$path)},
			        "raw");
		print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

	} elsif ($type eq "tree") {
		my $path = "$basedir$t->{'name'}";

		print "<td class=\"list\">" .
		      $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>$path,
		                             %base_key)},
		              esc_path($t->{'name'})) .
		      "</td>\n";

		# action links: tree [| history]
		my @links = (
			$cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
			                       file_name=>$path,
			                       %base_key)},
			        "tree"),
		);
		if (defined $hash_base) {
			push @links,
				$cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
				                       file_name=>$path)},
				        "history");
		}
		print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

	} else {
		# unknown object: we can only present history for it
		# (this includes 'commit' object, i.e. submodule support)
		print "<td class=\"list\">" . esc_path($t->{'name'}) . "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"history",
		                             hash_base=>$hash_base,
		                             file_name=>"$basedir$t->{'name'}")},
		              "history")
			if defined $hash_base;
		print "</td>\n";
	}
}
4651
4652 ## ......................................................................
4653 ## functions printing large fragments of HTML
4654
# Get pre-image filenames for a merge (combined) diff entry.
# Sets $diff->{'from_file'} to an array with one slot for each of the
# $diff->{'nparents'} parents.  A slot is filled in, by looking up
# $diff->{'from_id'}[$i] in parent $i with git_get_path_by_hash(), only
# where the status against that parent is rename (R) or copy (C);
# the remaining slots are left undefined.  Returns $diff.
sub fill_from_file_info {
	my ($diff, @parents) = @_;

	my $from_file = $diff->{'from_file'} = [ ];
	# assigning to the last index makes room for all the parents
	$from_file->[$diff->{'nparents'} - 1] = undef;

	foreach my $i (0 .. $diff->{'nparents'} - 1) {
		my $status = $diff->{'status'}[$i];
		next unless ($status eq 'R' || $status eq 'C');

		$from_file->[$i] =
			git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
	}

	return $diff;
}
4671
# Is the current (parsed) raw difftree line $diffinfo a file deletion,
# i.e. is its 'to_id' the all-zero object name?
# Object names have 40 hex digits with SHA-1 and 64 with SHA-256,
# so both lengths of the null id are recognized.
sub is_deleted {
	my $diffinfo = shift;

	my $to_id = $diffinfo->{'to_id'};
	return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4678
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# Returns true only if both are defined and name the same 'to_file'.
# An undefined 'to_file' never matches; git_patchset_body passes one
# when the "diff" header line of a patch could not be parsed.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	return defined $diffinfo && defined $patchinfo
		&& defined $diffinfo->{'to_file'}
		&& defined $patchinfo->{'to_file'}
		&& $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4689
4690
# Print the list of changed files as an HTML table, one row per entry
# of the difftree.
# $difftree - arrayref of difftree lines; each of them is passed through
#             parsed_difftree_line() before use
# $hash     - the commit the changes lead to; used as hash_base for links
#             to the post-image of a file
# @parents  - parents of that commit; with more than one parent the table
#             is printed in the combined diff layout, otherwise the first
#             parent is used as hash_base for links to the pre-image
# In the 'commitdiff' view (global $action) each row also gets a link to
# the "patchN" anchor, N being the number of the row counted from 1.
sub git_difftree_body {
	my ($difftree, $hash, @parents) = @_;
	my ($parent) = $parents[0];
	my $have_blame = gitweb_check_feature('blame');
	print "<div class=\"list_head\">\n";
	if ($#{$difftree} > 10) {
		print(($#{$difftree} + 1) . " files changed:\n");
	}
	print "</div>\n";

	print "<table class=\"" .
	      (@parents > 1 ? "combined " : "") .
	      "diff_tree\">\n";

	# header only for combined diff in 'commitdiff' view
	my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
	if ($has_header) {
		# table header
		print "<thead><tr>\n" .
		       "<th></th><th></th>\n"; # filename, patchN link
		for (my $i = 0; $i < @parents; $i++) {
			my $par = $parents[$i];
			print "<th>" .
			      $cgi->a({-href => href(action=>"commitdiff",
			                             hash=>$hash, hash_parent=>$par),
			               -title => 'commitdiff to parent number ' .
			                          ($i+1) . ': ' . substr($par,0,7)},
			              $i+1) .
			      "&nbsp;</th>\n";
		}
		print "</tr></thead>\n<tbody>\n";
	}

	my $alternate = 1;
	my $patchno = 0;
	foreach my $line (@{$difftree}) {
		my $diff = parsed_difftree_line($line);

		# rows alternate between "dark" and "light", starting with "dark"
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;

		if (exists $diff->{'nparents'}) { # combined diff

			fill_from_file_info($diff, @parents)
				unless exists $diff->{'from_file'};

			if (!is_deleted($diff)) {
				# file exists in the result (child) commit
				print "<td>" .
				      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash),
				              -class => "list"}, esc_path($diff->{'to_file'})) .
				      "</td>\n";
			} else {
				print "<td>" .
				      esc_path($diff->{'to_file'}) .
				      "</td>\n";
			}

			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print "<td class=\"link\">" .
				      $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | " .
				      "</td>\n";
			}

			my $has_history = 0;
			my $not_deleted = 0;
			for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
				my $hash_parent = $parents[$i];
				my $from_hash = $diff->{'from_id'}[$i];
				my $from_path = $diff->{'from_file'}[$i];
				my $status = $diff->{'status'}[$i];

				$has_history ||= ($status ne 'A');
				$not_deleted ||= ($status ne 'D');

				if ($status eq 'A') {
					print "<td  class=\"link\" align=\"right\"> | </td>\n";
				} elsif ($status eq 'D') {
					# the blob linked to is the one in parent number $i+1,
					# so that parent (and not the result commit, where the
					# file is gone) is the base of the link; 'from_file' is
					# filled in only for renames and copies, otherwise the
					# file had the name it is listed under
					print "<td class=\"link\">" .
					      $cgi->a({-href => href(action=>"blob",
					                             hash_base=>$hash_parent,
					                             hash=>$from_hash,
					                             file_name=>(defined $from_path
					                                         ? $from_path
					                                         : $diff->{'to_file'}))},
					              "blob" . ($i+1)) .
					      " | </td>\n";
				} else {
					if ($diff->{'to_id'} eq $from_hash) {
						print "<td class=\"link nochange\">";
					} else {
						print "<td class=\"link\">";
					}
					print $cgi->a({-href => href(action=>"blobdiff",
					                             hash=>$diff->{'to_id'},
					                             hash_parent=>$from_hash,
					                             hash_base=>$hash,
					                             hash_parent_base=>$hash_parent,
					                             file_name=>$diff->{'to_file'},
					                             file_parent=>$from_path)},
					              "diff" . ($i+1)) .
					      " | </td>\n";
				}
			}

			print "<td class=\"link\">";
			if ($not_deleted) {
				print $cgi->a({-href => href(action=>"blob",
				                             hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "blob");
				print " | " if ($has_history);
			}
			if ($has_history) {
				print $cgi->a({-href => href(action=>"history",
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "history");
			}
			print "</td>\n";

			print "</tr>\n";
			next; # instead of 'else' clause, to avoid extra indent
		}
		# else ordinary diff

		# a mode of all zeros stands for "no file on that side";
		# the respective variables are then left undefined
		my ($to_mode_oct, $to_mode_str, $to_file_type);
		my ($from_mode_oct, $from_mode_str, $from_file_type);
		if ($diff->{'to_mode'} ne ('0' x 6)) {
			$to_mode_oct = oct $diff->{'to_mode'};
			if (S_ISREG($to_mode_oct)) { # only for regular file
				$to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
			}
			$to_file_type = file_type($diff->{'to_mode'});
		}
		if ($diff->{'from_mode'} ne ('0' x 6)) {
			$from_mode_oct = oct $diff->{'from_mode'};
			if (S_ISREG($from_mode_oct)) { # only for regular file
				$from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
			}
			$from_file_type = file_type($diff->{'from_mode'});
		}

		if ($diff->{'status'} eq "A") { # created
			my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
			$mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
			$mode_chng   .= "]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			              "blob");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "D") { # deleted
			my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'}),
			               -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
			my $mode_chnge = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				$mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
				if ($from_file_type ne $to_file_type) {
					$mode_chnge .= " from $from_file_type to $to_file_type";
				}
				if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
					if ($from_mode_str && $to_mode_str) {
						$mode_chnge .= " mode: $from_mode_str->$to_mode_str";
					} elsif ($to_mode_str) {
						$mode_chnge .= " mode: $to_mode_str";
					}
				}
				$mode_chnge .= "]</span>\n";
			}
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chnge</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only mode changed)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "diff") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			               "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
			my %status_name = ('R' => 'moved', 'C' => 'copied');
			my $nstatus = $status_name{$diff->{'status'}};
			my $mode_chng = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				# mode also for directories, so we cannot use $to_mode_str
				$mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
			}
			print "<td>" .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
			                             hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
			              -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
			      "<td><span class=\"file_status $nstatus\">[$nstatus from " .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
			                             hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
			              -class => "list"}, esc_path($diff->{'from_file'})) .
			      " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
			      "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only pure rename or copy)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
				              "diff") .
				      " | ";
			}
			# the post-image (to_id under the name to_file) is part of
			# commit $hash, same as in the link on the file name above
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'to_file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'to_file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                            file_name=>$diff->{'to_file'})},
			              "history");
			print "</td>\n";

		} # we should not encounter Unmerged (U) or Unknown (X) status
		print "</tr>\n";
	}
	print "</tbody>" if $has_header;
	print "</table>\n";
}
4998
# Print one chunk of a diff in side-by-side layout.
# Takes a list of [ $class, $line ] pairs, $line being text ready to be
# printed.  Lines of class 'chunk_header' are printed as they come.
# Consecutive 'ctx' lines are printed as a block holding them twice, as
# the "old" and as the "new" side.  Runs of 'rem' and 'add' lines are
# collected until the next 'ctx' line or the end of the chunk, and are
# then printed as one block: removal ("old" side only), addition ("new"
# side only), or change (both sides).
sub print_sidebyside_diff_chunk {
	my @chunk = @_;

	return unless @chunk;

	# incomplete last line might be among removed or added lines,
	# or both, or among context lines: give it the class of the
	# line that precedes it
	foreach my $idx (1 .. $#chunk) {
		next unless $chunk[$idx][0] eq 'incomplete';
		$chunk[$idx][0] = $chunk[$idx-1][0];
	}

	# guardian: entry with empty class and empty line, which flushes
	# whatever is still accumulated and then ends the loop below
	push @chunk, ["", ""];

	my (@context, @removed, @added);
	foreach my $entry (@chunk) {
		my ($class, $line) = @{$entry};

		# chunk headers go out right away
		if ($class && $class eq 'chunk_header') {
			print $line;
			next;
		}

		# only the guardian has no class
		my $at_end = !$class;

		# flush context lines on start of rem/add block, or at end of chunk
		if (@context && ($at_end || $class eq 'rem' || $class eq 'add')) {
			my $both_sides = join('', @context);
			print '<div class="chunk_block ctx">' .
			      '<div class="old">' . $both_sides . '</div>' .
			      '<div class="new">' . $both_sides . '</div>' .
			      '</div>';
			@context = ();
		}

		# flush rem/add lines on start of context block, or at end of chunk
		if ((@removed || @added) && ($at_end || $class eq 'ctx')) {
			my $old_side = '<div class="old">' . join('', @removed) . '</div>';
			my $new_side = '<div class="new">' . join('', @added) . '</div>';
			if (!@added) {
				# pure removal
				print '<div class="chunk_block rem">' . $old_side . '</div>';
			} elsif (!@removed) {
				# pure addition
				print '<div class="chunk_block add">' . $new_side . '</div>';
			} else {
				# assume that it is change
				print '<div class="chunk_block chg">' . $old_side . $new_side . '</div>';
			}
			@removed = ();
			@added = ();
		}

		# guardian value (or any other false line) stops processing
		last unless $line;

		# add the line to the accumulator of its class
		if ($class eq 'rem') {
			push @removed, $line;
		} elsif ($class eq 'add') {
			push @added, $line;
		} elsif ($class eq 'ctx') {
			push @context, $line;
		}
	}
}
5087
# Read diff output from $fd and print it as HTML inside a
# <div class="patchset"> element.
#
# Parameters:
#   $fd           - filehandle the patch text is read from, line by line
#   $diff_style   - 'sidebyside' buffers each chunk and hands it to
#                   print_sidebyside_diff_chunk() (non-combined diffs only);
#                   any other value prints the formatted lines inline
#   $difftree     - arrayref of raw difftree lines; each one is passed
#                   through parsed_difftree_line()
#   $hash         - accepted but not referenced in this sub's body
#   @hash_parents - parent hashes; more than one marks a combined diff
#
# Prints directly to the currently selected output handle.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;
        # NOTE(review): $hash_parent is assigned but not used below
        my ($hash_parent) = $hash_parents[0];

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;    # index of the current raw line in @$difftree
        my $patch_number = 0; # number of patches output so far
        my $patch_line;       # current (chomp-ed) line read from $fd
        my $diffinfo;         # parsed raw difftree line for current patch
        my $to_name;          # result pathname taken from "diff" header
        my (%from, %to);
        my @chunk; # for side-by-side diff

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

        # Each iteration handles one "diff ..." header and what follows it.
        # $patch_line is undef (false) once $fd is exhausted, which ends
        # the loop.
 PATCH:
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        # ($diffinfo is still undef for the very first patch)
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        # stop when the raw difftree lines run out
                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        # "--- " starts the from-file/to-file header,
                        # "diff " starts the next patch
                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # input ended inside the extended header; "last" skips
                        # the continue block, so close the patch div here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                # patch without from-file/to-file header and body
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                # $last_patch_line keeps the "--- " line, $patch_line is
                # refilled with the line that follows it
                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        # next patch begins; $patch_line keeps its "diff " header
                        next PATCH if ($patch_line =~ m/^diff /);

                        my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
                        my $diff_classes = "diff";
                        $diff_classes .= " $class" if ($class);
                        $line = "<div class=\"$diff_classes\">$line</div>\n";

                        if ($diff_style eq 'sidebyside' && !$is_combined) {
                                if ($class eq 'chunk_header') {
                                        # a new chunk starts: flush the buffered one
                                        print_sidebyside_diff_chunk(@chunk);
                                        @chunk = ( [ $class, $line ] );
                                } else {
                                        push @chunk, [ $class, $line ];
                                }
                        } else {
                                # default 'inline' style and unknown styles
                                print $line;
                        }
                }

        } continue {
                # runs after every PATCH iteration, including "next PATCH":
                # flush any buffered side-by-side chunk and close the patch div
                if (@chunk) {
                        print_sidebyside_diff_chunk(@chunk);
                        @chunk = ();
                }
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        # (the init expression steps past the last handled raw line, but only
        # if at least one patch was output)
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        # nothing was output at all
        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
5258
5259 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5260
# Print the project search form (text field, 're' checkbox and submit
# button) followed by a "List all projects" link, all wrapped in a
# <div class="projsearch"> element.
#
# Parameters:
#   $searchtext        - initial value of the search text field
#   $search_use_regexp - initial state of the 're' checkbox
#
# Reads the globals $cgi, $my_uri and $project_filter.
sub git_project_search_form {
        my ($searchtext, $search_use_regexp) = @_;

        # when a project filter is active, mention it in the field title
        # and in the "List all projects" link text
        my $limit = '';
        if ($project_filter) {
                $limit = " in '$project_filter/'";
        }

        print "<div class=\"projsearch\">\n";
        # use start_form(): the old startform() spelling is a legacy alias
        # that is not available in newer CGI.pm releases
        print $cgi->start_form(-method => 'get', -action => $my_uri) .
              $cgi->hidden(-name => 'a', -value => 'project_list')  . "\n";
        print $cgi->hidden(-name => 'pf', -value => $project_filter). "\n"
                if (defined $project_filter);
        print $cgi->textfield(-name => 's', -value => $searchtext,
                              -title => "Search project by name and description$limit",
                              -size => 60) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>\n" .
              $cgi->submit(-name => 'btnS', -value => 'Search') .
              $cgi->end_form() . "\n" .
              $cgi->a({-href => href(project => undef, searchtext => undef,
                                     project_filter => $project_filter)},
                      esc_html("List all projects$limit")) . "<br />\n";
        print "</div>\n";
}
5288
# Tell whether %$project_info is missing at least one of the given @keys.
# Only the presence of a key is tested (exists), not its value.
# Returns 1 if some key is absent, and nothing (bare return) otherwise.
sub project_info_needs_filling {
        my ($project_info, @keys) = @_;

        my @absent = grep { !exists $project_info->{$_} } @keys;
        return 1 if @absent;

        return;
}
5302
# Fill in per-project details (age, description, owner, ctags, category)
# for the entries of @$projlist and return the list of processed entries.
#
# Without @wanted_keys every field is a candidate for filling; with
# @wanted_keys only the listed fields are.  A field is (re)computed only
# if it is not yet present in the project's hash.
#
# A project is left out of the returned list only when 'age' or
# 'age_string' had to be filled and git_get_last_activity() returned
# nothing for it.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   makes sure 'descr_long' and 'ctags' are filled
# * @project_list = fill_project_list_info(\@project_list)
#   makes sure all fields are filled
#
# NOTE: the hashes in @$projlist are updated in place, but no entry is
# removed from @$projlist itself
sub fill_project_list_info {
        my ($projlist, @wanted_keys) = @_;

        # identity filter when nothing specific was requested,
        # otherwise keep only the requested keys
        my %is_wanted = map { $_ => 1 } @wanted_keys;
        my $filter_set = @wanted_keys
                ? sub { return grep { $is_wanted{$_} } @_; }
                : sub { return @_; };

        my $show_ctags = gitweb_check_feature('ctags');
        my @filled;

 PROJECT:
        foreach my $pr (@$projlist) {
                # true if any of the given (and wanted) keys is still missing
                my $needs = sub {
                        return project_info_needs_filling($pr, $filter_set->(@_));
                };

                if ($needs->('age', 'age_string')) {
                        my @activity = git_get_last_activity($pr->{'path'});
                        next PROJECT unless @activity;
                        ($pr->{'age'}, $pr->{'age_string'}) = @activity;
                }

                if ($needs->('descr', 'descr_long')) {
                        my $descr = to_utf8(git_get_project_description($pr->{'path'}) || "");
                        $pr->{'descr_long'} = $descr;
                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }

                if ($needs->('owner')) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }

                if ($show_ctags && $needs->('ctags')) {
                        $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
                }

                if ($projects_list_group_categories && $needs->('category')) {
                        my $cat = git_get_project_category($pr->{'path'}) ||
                                  $project_list_default_category;
                        $pr->{'category'} = to_utf8($cat);
                }

                push @filled, $pr;
        }

        return @filled;
}
5363
# Return the projects of @$projlist sorted according to $order, which is
# one of 'project', 'descr', 'owner' (string comparison) or 'age'
# (numeric comparison).  For any other $order the list is returned in
# its original order.
sub sort_projects_list {
        my ($projlist, $order) = @_;

        # sort order name => hash key to compare and kind of comparison
        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );

        my $oi = $order_info{$order};
        return @$projlist unless defined $oi;

        my $field = $oi->{'key'};
        my $compare = ($oi->{'type'} eq 'str')
                ? sub { $_[0]->{$field} cmp $_[1]->{$field} }
                : sub { $_[0]->{$field} <=> $_[1]->{$field} };

        my @projects = sort { $compare->($a, $b) } @$projlist;
        return @projects;
}
5384
# Group the projects $projlist->[$from .. $to] by their 'category' field.
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# Returns a hash mapping category => arrayref of projects in list
# context, or a reference to that hash in scalar context.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#$projlist;
        $to = $last_idx if (!defined $to || $last_idx < $to);

        my %categories;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                my $bucket = ($categories{ $pr->{'category'} } ||= []);
                push @$bucket, $pr;
        }

        return \%categories unless wantarray;
        return %categories;
}
5401
# print the 'sort by' <th> element built by format_sort_th()
# for the given ($name, $order, $header)
sub print_sort_th {
        my ($name, $order, $header) = @_;

        print format_sort_th($name, $order, $header);
}
5407
# Return the <th> element for the column sorted by $name.
# $header is the column title and defaults to ucfirst($name).
# If $order equals $name the title is plain text; otherwise it is
# a replay link that switches the order to $name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # this column is the current sort order: no link needed
        return "<th>$header</th>\n" if ($order eq $name);

        my $link = $cgi->a({-href => href(-replay=>1, order=>$name),
                            -class => "header"}, $header);
        return "<th>" . $link . "</th>\n";
}
5424
# Print one <tr> per project for $projlist->[$from .. $to], alternating
# the "dark" and "light" row classes (starting with "dark").
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# If $check_forks is true, each row gets a leading cell with the fork
# marker.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#$projlist;
        $to = $last_idx if (!defined $to || $last_idx < $to);

        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                # fork marker: a link when there are forks, plain text otherwise
                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                my $nforks = scalar @{$pr->{'forks'}};
                                my $title = "$nforks forks";
                                if ($nforks > 0) {
                                        print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
                                                       -title => $title}, "+");
                                } else {
                                        print $cgi->span({-title => $title}, "+");
                                }
                        }
                        print "</td>\n";
                }

                # project name
                print "<td>" .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                               -class => "list"},
                              esc_html_match_hl($pr->{'path'}, $search_regexp)) .
                      "</td>\n";

                # description, with search matches highlighted if searching
                print "<td>" .
                      $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                               -class => "list",
                               -title => $pr->{'descr_long'}},
                              $search_regexp
                              ? esc_html_match_hl_chopped($pr->{'descr_long'},
                                                          $pr->{'descr'}, $search_regexp)
                              : esc_html($pr->{'descr'})) .
                      "</td>\n";

                # owner
                print "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";

                # last change
                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                print "<td class=\"". age_class($pr->{'age'}) . "\">" . $age_text . "</td>\n";

                # action links
                my @links;
                foreach my $action ("summary", "shortlog", "log", "tree") {
                        push @links,
                             $cgi->a({-href => href(project=>$pr->{'path'}, action=>$action)}, $action);
                }
                if ($pr->{'forks'}) {
                        push @links,
                             $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
                      "</tr>\n";
        }
}
5480
# Print the project list table (optionally preceded by the tag cloud).
#
# Parameters:
#   $projlist  - arrayref of project hashes
#   $order     - sort order name; defaults to $default_projects_order
#   $from, $to - window of (filtered, filled, sorted) projects to show;
#                $from defaults to 0, $to defaults to and is capped at
#                the last index
#   $extra     - if defined, printed in an additional row at the bottom
#   $no_header - if true, the row of column headers is omitted
#
# If the window is empty a "No such projects found" notice is printed
# instead of the table.
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
        # fork handling is switched off while filtering by tag or searching
        $check_forks = undef
                if ($tagfilter || $search_regexp);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        # search_projects_list pre-fills required info
        @projects = search_projects_list(\@projects,
                                         'search_regexp' => $search_regexp,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $search_regexp);
        # fill the rest
        @projects = fill_project_list_info(\@projects);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds just the window, re-indexed from 0, so
                # group all of it; applying $from/$to a second time would drop
                # or mis-select rows whenever $from > 0
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects with an empty category get no heading row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5568
# Print the 'log' view entries for $commitlist->[$from .. $to]: for each
# commit a header div, the commit/commitdiff/tree links, the authorship
# and the full log message.
#
# Parameters:
#   $commitlist - arrayref of commit hashes (empty hashes are skipped)
#   $from, $to  - window of commits to show; $from defaults to 0, $to
#                 defaults to and is capped at the last index
#   $refs       - passed to format_ref_marker() for each commit
#   $extra      - if true, printed in a trailing <div class="page_nav">
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # honour $from like the shortlog/history/tags bodies do; the loop
        # used to start at 0 unconditionally, silently ignoring $from
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                # separate statements (not part of the print above)
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5607
# Print the 'shortlog' table for $commitlist->[$from .. $to]: one row
# per commit with date, author, subject and action links.
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# If $extra is defined it is printed in an additional row at the bottom.
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#{$commitlist};
        $to = $last_idx if (!defined $to || $last_idx < $to);

        print "<table class=\"shortlog\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                # action links; snapshot links are appended only if available
                my @links = (
                        $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
                        $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree"),
                );
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links);
                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links if (defined $snapshot_links);
                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5651
# Print the 'history' table for $commitlist->[$from .. $to]: one row per
# commit with date, author, subject and links to the $ftype view and the
# commitdiff; for blobs also a "diff to current" link when the blob at
# that commit differs from $file_hash.
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# If $extra is defined it is printed in an additional row at the bottom.
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#{$commitlist};
        $to = $last_idx if (!defined $to || $to > $last_idx);

        print "<table class=\"history\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                # empty entries produce no row
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                # shortlog uses format_author_html('td', \%co, 10)
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my @links = (
                        $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype),
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
                );
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links);

                if ($ftype eq 'blob') {
                        my $blob_current = $file_hash;
                        my $blob_parent  = git_get_hash_by_path($commit, $file_name);
                        my $differs = defined $blob_current && defined $blob_parent &&
                                      $blob_current ne $blob_parent;
                        if ($differs) {
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$blob_current, hash_parent=>$blob_parent,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5711
# Print the 'tags' table for $taglist->[$from .. $to]: one row per tag
# with age, name, subject, a "tag" self link (for tag objects only) and
# links to the tagged object.
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# If $extra is defined it is printed in an additional row at the bottom.
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;

        $from = 0 unless defined $from;
        my $last_idx = $#{$taglist};
        $to = $last_idx if (!defined $to || $last_idx < $to);

        print "<table class=\"tags\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %tag = %{ $taglist->[$idx] };

                my $comment = $tag{'subject'};
                my $comment_short;
                $comment_short = chop_str($comment, 30, 5) if (defined $comment);

                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                # age cell (left empty when the age is unknown)
                my $age_cell = defined $tag{'age'} ? "<i>$tag{'age'}</i>" : "";
                print "<td>" . $age_cell . "</td>\n";

                # tag name, linking to the tagged object
                print "<td>" .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                               -class => "list name"}, esc_html($tag{'name'})) .
                      "</td>\n" .
                      "<td>";
                if (defined $comment) {
                        print format_subject_html($comment, $comment_short,
                                                  href(action=>"tag", hash=>$tag{'id'}));
                }

                # self link only for tag objects
                print "</td>\n" .
                      "<td class=\"selflink\">";
                if ($tag{'type'} eq "tag") {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                } else {
                        print "&nbsp;";
                }

                # links depending on the type of the tagged object
                my $reftype = $tag{'reftype'};
                print "</td>\n" .
                      "<td class=\"link\">" . " | " .
                      $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'})}, $reftype);
                if ($reftype eq "commit") {
                        print " | " . $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog") .
                              " | " . $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                } elsif ($reftype eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "</tr>";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5774
# Print the "heads" table: one row for every entry of @$headlist whose index
# lies in $from..$to, then (when $extra is defined) a closing row that spans
# all three columns and holds $extra.
#
# The name cell of an entry whose 'id' equals $head_at gets the
# "current_head" class.  $from defaults to 0; a missing or too large $to
# means "through the last entry of the list".
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head_at, $from, $to, $extra) = @_;
        my $last = $#{$headlist};
        $from = 0 unless defined $from;
        $to = $last if (!defined $to || $last < $to);

        print "<table class=\"heads\">\n";
        my $dark = 1; # rows alternate between the "dark" and "light" classes
        foreach my $idx ($from .. $to) {
                my %ref = %{$headlist->[$idx]};
                my $is_current = defined $head_at && $ref{'id'} eq $head_at;
                my $fullname = $ref{'fullname'};

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark ^= 1;

                my $name_cell =
                        ($is_current ? "<td class=\"current_head\">" : "<td>") .
                        $cgi->a({-href => href(action=>"shortlog", hash=>$fullname),
                                 -class => "list name"},esc_html($ref{'name'})) .
                        "</td>\n";
                my $links = join(" | ",
                        $cgi->a({-href => href(action=>"shortlog", hash=>$fullname)}, "shortlog"),
                        $cgi->a({-href => href(action=>"log", hash=>$fullname)}, "log"),
                        $cgi->a({-href => href(action=>"tree", hash=>$fullname, hash_base=>$fullname)}, "tree"));

                print "<td><i>$ref{'age'}</i></td>\n" .
                      $name_cell .
                      "<td class=\"link\">$links</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n<td colspan=\"3\">$extra</td>\n</tr>\n";
        }
        print "</table>\n";
}
5812
# Display a single remote block: a table with the URLs of the remote,
# followed by the table of its heads.
#
# Parameters:
#   $remote - name of the remote; used as the hash of the "..." link
#   $rdata  - hash ref; its 'heads', 'fetch' and 'push' entries are read
#   $limit  - optional; when defined and smaller than the number of heads,
#             a "..." link to the 'remotes' action is handed to
#             git_heads_body() as its extra row
#   $head   - handed to git_heads_body() as the id of the current head
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # $push may be undefined while $fetch is set, so check it
                # before comparing; otherwise 'eq' emits an "uninitialized
                # value" warning
                if (defined $push && $fetch eq $push) {
                        # same URL for both directions: show it only once
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        # link to the complete list, only needed when heads get cut off
        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5846
# Display a list of remote names with the respective fetch and push URLs.
#
# Parameters:
#   $remotedata - hash ref keyed by remote name; each value is a hash ref
#                 whose 'fetch' and 'push' entries, when defined, become the
#                 targets of the "fetch" and "push" links
#   $limit      - optional; when true and smaller than the number of
#                 remotes, only the first $limit remotes (sorted by name)
#                 are listed, followed by a "..." row linking to the
#                 'remotes' action
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        # truncate the sorted list to the first $limit names
        $#remotes = $limit - 1 if $limited;

        # Iterate over the list rather than testing the truth of a shifted
        # name: a remote whose name is false (e.g. "0") must not end the
        # listing early.
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # a missing URL is shown as plain text instead of a link
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
5890
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names.
#
# Parameters:
#   $remotedata - hash ref keyed by remote name
#   $limit      - optional; when true and smaller than the number of
#                 remotes, only the list of names is shown; otherwise it is
#                 passed on to git_remote_block() for each remote
#   $head       - passed on to git_remote_block()
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # Walk the remotes sorted by name, like git_remotes_list()
                # does: each() would hand them out in hash order, which is
                # not stable from one request to the next.
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
5907
# Search action for commit message, author and committer searches (chosen by
# the global $searchtype): asks parse_commits() for the matching commits and
# prints one page of results, 100 commits per page, selected by the global
# $page.
#
# %co (passed as a flattened hash) supplies the 'tree' and 'title' used for
# the page navigation and the header.
sub git_search_message {
        my %co = @_;

        # git option that selects what $searchtext is matched against
        my $greptype =
                $searchtype eq 'commit'    ? "--grep=" :
                $searchtype eq 'author'    ? "--author=" :
                $searchtype eq 'committer' ? "--committer=" :
                                             undef;
        $greptype .= $searchtext;

        my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
        # 101 commits are requested although a page shows 100: the extra one
        # tells whether there is a next page
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $match_mode);
        my $has_next = $#commitlist >= 100;

        # "first" and "prev" are links everywhere but on the first page
        my $first_prev = "first &sdot; prev";
        if ($page > 0) {
                $first_prev =
                        $cgi->a({-href => href(-replay=>1, page=>undef)},
                                "first") .
                        " &sdot; " .
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        # "next" is a link only when a further page exists
        my $next_link = '';
        if ($has_next) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        my $paging_nav = $first_prev . " &sdot; " . ($has_next ? $next_link : "next");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);
        if ($page == 0 && !@commitlist) {
                print "<p>No match.</p>\n";
        } else {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        }

        git_footer_html();
}
5957
# Search action for "pickaxe" searches: runs git-log with -S$searchtext
# (plus --pickaxe-regex when $search_use_regexp is set) and prints a table
# with one row per reported commit; each row lists links to the files
# reported for that commit.
#
# %co (passed as a flattened hash) supplies the 'tree' and 'title' used for
# the page navigation and the header.  It is then emptied and reused for the
# commit whose row is currently being printed.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                ($search_use_regexp ? '--pickaxe-regex' : ())
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $alternate = 1;
        undef %co;

        # Closes the file list cell of the commit held in %co and prints its
        # cell of links.  Needed both when the next commit starts and after
        # the last line of output.
        my $finish_commit = sub {
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # a new commit starts: finish the previous one, if any
                        $finish_commit->() if %co;

                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        # the cell opened last stays open; the file links
                        # of this commit are printed into it
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                      -class => "list subject"},
                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
                } elsif (defined $set{'to_id'}) {
                        # an all-zero id has no blob to link to
                        next if ($set{'to_id'} =~ m/^0{40}$/);

                        # Label the link with 'file' when it is set, and fall
                        # back to 'to_file', the name the link points to.
                        # NOTE(review): presumably 'file' is unset for
                        # renames and copies -- confirm against
                        # parse_difftree_raw_line().
                        my $label = defined $set{'file'} ? $set{'file'} : $set{'to_file'};
                        print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                     hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                      -class => "list"},
                                      "<span class=\"match\">" . esc_path($label) . "</span>") .
                              "<br/>\n";
                }
        }
        close $fd;

        # finish last commit
        $finish_commit->() if %co;

        print "</table>\n";

        git_footer_html();
}
6040
# Search action for file contents ("grep" search): runs git-grep for
# $searchtext on the tree $co{'tree'} and prints the matches grouped by
# file, one table row per file, with every matching line linked to its
# line in the blob view.  Reading stops once more than 1001 lines of output
# have been seen.
#
# %co (passed as a flattened hash) supplies 'tree', 'id' and 'title'.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $trimmed = 0; # set only when output was really left unread
        my $lastfile = '';
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                if ($matches++ > 1000) {
                        $trimmed = 1;
                        last;
                }
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                        # drop the leading "<tree>:" from the file name
                        $file =~ s/^\Q$co{'tree'}\E://;
                }
                if ($file ne $lastfile) {
                        # a new file starts: close the row of the previous one
                        $lastfile and print "</td></tr>\n";
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        # toggle, so that rows really alternate between dark
                        # and light (a post-increment would stay true forever)
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # wrap the matching part of the line in a "match" span
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile) {
                print "</td></tr>\n";
                if ($trimmed) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
6118
# Print the "commit_search" table: one row for every non-empty entry of
# @$commitlist whose index lies in $from..$to, then (when $extra is defined)
# a closing row holding $extra.
#
# Each row shows the commit date, author and title, followed by those lines
# of the commit message that match the global $search_regexp, with the match
# highlighted and the text around it shortened.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        my $last = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last if (!defined $to || $last < $to);

        print "<table class=\"commit_search\">\n";
        my $dark = 1; # rows alternate between the "dark" and "light" classes
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
                $dark ^= 1;

                # the title cell stays open: matching lines are printed into it
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                               -class => "list subject"},
                              chop_and_escape_str($co{'title'}, 50) . "<br/>");

                foreach my $line (@{$co{'comment'}}) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        # shorten the match first; lead and trail then share
                        # what is left of 80 characters, at most 30 each
                        $match = chop_str($match, 70, 5, 'center');
                        my $contextlen = int((80 - length($match))/2);
                        $contextlen = 30 if ($contextlen > 30);
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        ($lead, $match, $trail) =
                                (esc_html($lead), esc_html($match), esc_html($trail));

                        print "$lead<span class=\"match\">$match</span>$trail<br />";
                }

                my $links = join(" | ",
                        $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit"),
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff"),
                        $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree"));
                print "</td>\n" .
                      "<td class=\"link\">$links";
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n<td colspan=\"3\">$extra</td>\n</tr>\n";
        }
        print "</table>\n";
}
6178
6179 ## ======================================================================
6180 ## ======================================================================
6181 ## actions
6182
# Action: print the page with the list of projects.
#
# The optional 'order' input parameter must be one of none, project, descr,
# owner or age; anything else is answered with a 400 error.  A 404 error is
# raised when no project is found.
sub git_project_list {
        my $order = $input_params{'order'};
        # The pattern is anchored so that only the exact names are accepted;
        # unanchored, any value merely containing one of them (such as
        # "page") would pass.
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        # optional site specific text shown above the list
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }

        git_project_search_form($searchtext, $search_use_regexp);
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6205
# Action: print the page with the list of forks of the current project.
#
# The optional 'order' input parameter must be one of none, project, descr,
# owner or age; anything else is answered with a 400 error.  A 404 error is
# raised when no fork is found.
sub git_forks {
        my $order = $input_params{'order'};
        # The pattern is anchored so that only the exact names are accepted;
        # unanchored, any value merely containing one of them (such as
        # "page") would pass.
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        # projects are looked up under the project name without its ".git" suffix
        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6225
# Action: print the list of projects as plain text, one "path owner" pair
# per line, with both fields percent-encoded.  Raises a 404 error when no
# project is found.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                # look the owner up only when the project list did not supply it
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
                my ($path, $owner) = map {
                        my $field = $_;
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                        $field;
                } ($pr->{'path'}, $pr->{'owner'});

                print "$path $owner\n";
        }
}
6252
# Action: print the summary page of the current project.  The page holds a
# table of project metadata (description, owner, last change, repository
# URLs and, when enabled, content tags), the README.html of the project
# unless XSS prevention is on, and short lists of commits, tags, heads,
# remotes and forks; each list is printed only when it is not empty.
sub git_summary {
        my $description = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %last_change = %co ? parse_date($co{'committer_epoch'}, $co{'committer_tz'}) : ();
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata = $remote_heads ? git_get_remotes_list() : ();

        my @forklist;
        if (gitweb_check_feature('forks')) {
                # find forks of a project
                (my $filter = $project) =~ s/\.git$//;
                @forklist = git_get_projects_list($filter);
                # filter out forks of forks
                @forklist = filter_forks_from_projects_list(\@forklist)
                        if (@forklist);
        }

        # "..." link to the full listing of $action, or undef when the $count
        # entries at hand all fit into the 16 rows (0..15) shown here
        my $more_link = sub {
                my ($count, $action) = @_;
                return $count > 16
                        ? $cgi->a({-href => href(action=>$action)}, "...")
                        : undef;
        };

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($description) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $last_change{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>".format_timestamp_html(\%last_change)."</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        @url_list = map { "$_/$project" } @git_base_url_list unless @url_list;
        # only the first URL printed carries the "URL" label
        my $url_tag = "URL";
        foreach my $git_url (grep { $_ } @url_list) {
                print format_repo_url($url_tag, $git_url);
                $url_tag = "";
        }

        # Tag cloud
        if (gitweb_check_feature('ctags')) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme) {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file($readme);
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist = $head ? parse_commits($head, 17) : ();
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $more_link->(scalar @commitlist, "shortlog"));
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $more_link->(scalar @taglist, "tags"));
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $more_link->(scalar @headlist, "heads"));
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $more_link->(scalar @forklist, "forks"),
                                      'no_header');
        }

        git_footer_html();
}
6368
# Action: print the page of the tag object named by the global $hash: a
# header table with a link to the tagged object and, when the tag has an
# 'author', its authorship rows, followed by the lines of the tag message.
# Raises a 404 error when parse_tag() returns nothing.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both links of the "object" row lead to the tagged object
        my $object_href = href(action=>$tag{'type'}, hash=>$tag{'object'});
        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $cgi->a({-class => "list", -href => $object_href},
                               $tag{'object'}) . "</td>\n" .
              "<td class=\"link\">" . $cgi->a({-href => $object_href},
                                              $tag{'type'}) . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n";

        print "<div class=\"page_body\">";
        my $message = $tag{'comment'};
        foreach my $line (@$message) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6403
6404 sub git_blame_common {
6405         my $format = shift || 'porcelain';
6406         if ($format eq 'porcelain' && $input_params{'javascript'}) {
6407                 $format = 'incremental';
6408                 $action = 'blame_incremental'; # for page title etc
6409         }
6410
6411         # permissions
6412         gitweb_check_feature('blame')
6413                 or die_error(403, "Blame view not allowed");
6414
6415         # error checking
6416         die_error(400, "No file name given") unless $file_name;
6417         $hash_base ||= git_get_head_hash($project);
6418         die_error(404, "Couldn't find base commit") unless $hash_base;
6419         my %co = parse_commit($hash_base)
6420                 or die_error(404, "Commit not found");
6421         my $ftype = "blob";
6422         if (!defined $hash) {
6423                 $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
6424                         or die_error(404, "Error looking up file");
6425         } else {
6426                 $ftype = git_get_type($hash);
6427                 if ($ftype !~ "blob") {
6428                         die_error(400, "Object is not a blob");
6429                 }
6430         }
6431
6432         my $fd;
6433         if ($format eq 'incremental') {
6434                 # get file contents (as base)
6435                 open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
6436                         or die_error(500, "Open git-cat-file failed");
6437         } elsif ($format eq 'data') {
6438                 # run git-blame --incremental
6439                 open $fd, "-|", git_cmd(), "blame", "--incremental",
6440                         $hash_base, "--", $file_name
6441                         or die_error(500, "Open git-blame --incremental failed");
6442         } else {
6443                 # run git-blame --porcelain
6444                 open $fd, "-|", git_cmd(), "blame", '-p',
6445                         $hash_base, '--', $file_name
6446                         or die_error(500, "Open git-blame --porcelain failed");
6447         }
6448
6449         # incremental blame data returns early
6450         if ($format eq 'data') {
6451                 print $cgi->header(
6452                         -type=>"text/plain", -charset => "utf-8",
6453                         -status=> "200 OK");
6454                 local $| = 1; # output autoflush
6455                 while (my $line = <$fd>) {
6456                         print to_utf8($line);
6457                 }
6458                 close $fd
6459                         or print "ERROR $!\n";
6460
6461                 print 'END';
6462                 if (defined $t0 && gitweb_check_feature('timed')) {
6463                         print ' '.
6464                               tv_interval($t0, [ gettimeofday() ]).
6465                               ' '.$number_of_git_cmds;
6466                 }
6467                 print "\n";
6468
6469                 return;
6470         }
6471
6472         # page header
6473         git_header_html();
6474         my $formats_nav =
6475                 $cgi->a({-href => href(action=>"blob", -replay=>1)},
6476                         "blob") .
6477                 " | ";
6478         if ($format eq 'incremental') {
6479                 $formats_nav .=
6480                         $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
6481                                 "blame") . " (non-incremental)";
6482         } else {
6483                 $formats_nav .=
6484                         $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
6485                                 "blame") . " (incremental)";
6486         }
6487         $formats_nav .=
6488                 " | " .
6489                 $cgi->a({-href => href(action=>"history", -replay=>1)},
6490                         "history") .
6491                 " | " .
6492                 $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
6493                         "HEAD");
6494         git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
6495         git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
6496         git_print_page_path($file_name, $ftype, $hash_base);
6497
6498         # page body
6499         if ($format eq 'incremental') {
6500                 print "<noscript>\n<div class=\"error\"><center><b>\n".
6501                       "This page requires JavaScript to run.\n Use ".
6502                       $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
6503                               'this page').
6504                       " instead.\n".
6505                       "</b></center></div>\n</noscript>\n";
6506
6507                 print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
6508         }
6509
6510         print qq!<div class="page_body">\n!;
6511         print qq!<div id="progress_info">... / ...</div>\n!
6512                 if ($format eq 'incremental');
6513         print qq!<table id="blame_table" class="blame" width="100%">\n!.
6514               #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
6515               qq!<thead>\n!.
6516               qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
6517               qq!</thead>\n!.
6518               qq!<tbody>\n!;
6519
6520         my @rev_color = qw(light dark);
6521         my $num_colors = scalar(@rev_color);
6522         my $current_color = 0;
6523
6524         if ($format eq 'incremental') {
6525                 my $color_class = $rev_color[$current_color];
6526
6527                 #contents of a file
6528                 my $linenr = 0;
6529         LINE:
6530                 while (my $line = <$fd>) {
6531                         chomp $line;
6532                         $linenr++;
6533
6534                         print qq!<tr id="l$linenr" class="$color_class">!.
6535                               qq!<td class="sha1"><a href=""> </a></td>!.
6536                               qq!<td class="linenr">!.
6537                               qq!<a class="linenr" href="">$linenr</a></td>!;
6538                         print qq!<td class="pre">! . esc_html($line) . "</td>\n";
6539                         print qq!</tr>\n!;
6540                 }
6541
6542         } else { # porcelain, i.e. ordinary blame
6543                 my %metainfo = (); # saves information about commits
6544
6545                 # blame data
6546         LINE:
6547                 while (my $line = <$fd>) {
6548                         chomp $line;
6549                         # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
6550                         # no <lines in group> for subsequent lines in group of lines
6551                         my ($full_rev, $orig_lineno, $lineno, $group_size) =
6552                            ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
6553                         if (!exists $metainfo{$full_rev}) {
6554                                 $metainfo{$full_rev} = { 'nprevious' => 0 };
6555                         }
6556                         my $meta = $metainfo{$full_rev};
6557                         my $data;
6558                         while ($data = <$fd>) {
6559                                 chomp $data;
6560                                 last if ($data =~ s/^\t//); # contents of line
6561                                 if ($data =~ /^(\S+)(?: (.*))?$/) {
6562                                         $meta->{$1} = $2 unless exists $meta->{$1};
6563                                 }
6564                                 if ($data =~ /^previous /) {
6565                                         $meta->{'nprevious'}++;
6566                                 }
6567                         }
6568                         my $short_rev = substr($full_rev, 0, 8);
6569                         my $author = $meta->{'author'};
6570                         my %date =
6571                                 parse_date($meta->{'author-time'}, $meta->{'author-tz'});
6572                         my $date = $date{'iso-tz'};
6573                         if ($group_size) {
6574                                 $current_color = ($current_color + 1) % $num_colors;
6575                         }
6576                         my $tr_class = $rev_color[$current_color];
6577                         $tr_class .= ' boundary' if (exists $meta->{'boundary'});
6578                         $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
6579                         $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
6580                         print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
6581                         if ($group_size) {
6582                                 print "<td class=\"sha1\"";
6583                                 print " title=\"". esc_html($author) . ", $date\"";
6584                                 print " rowspan=\"$group_size\"" if ($group_size > 1);
6585                                 print ">";
6586                                 print $cgi->a({-href => href(action=>"commit",
6587                                                              hash=>$full_rev,
6588                                                              file_name=>$file_name)},
6589                                               esc_html($short_rev));
6590                                 if ($group_size >= 2) {
6591                                         my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
6592                                         if (@author_initials) {
6593                                                 print "<br />" .
6594                                                       esc_html(join('', @author_initials));
6595                                                 #           or join('.', ...)
6596                                         }
6597                                 }
6598                                 print "</td>\n";
6599                         }
6600                         # 'previous' <sha1 of parent commit> <filename at commit>
6601                         if (exists $meta->{'previous'} &&
6602                             $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
6603                                 $meta->{'parent'} = $1;
6604                                 $meta->{'file_parent'} = unquote($2);
6605                         }
6606                         my $linenr_commit =
6607                                 exists($meta->{'parent'}) ?
6608                                 $meta->{'parent'} : $full_rev;
6609                         my $linenr_filename =
6610                                 exists($meta->{'file_parent'}) ?
6611                                 $meta->{'file_parent'} : unquote($meta->{'filename'});
6612                         my $blamed = href(action => 'blame',
6613                                           file_name => $linenr_filename,
6614                                           hash_base => $linenr_commit);
6615                         print "<td class=\"linenr\">";
6616                         print $cgi->a({ -href => "$blamed#l$orig_lineno",
6617                                         -class => "linenr" },
6618                                       esc_html($lineno));
6619                         print "</td>";
6620                         print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
6621                         print "</tr>\n";
6622                 } # end while
6623
6624         }
6625
6626         # footer
6627         print "</tbody>\n".
6628               "</table>\n"; # class="blame"
6629         print "</div>\n";   # class="blame_body"
6630         close $fd
6631                 or print "Reading blob failed\n";
6632
6633         git_footer_html();
6634 }
6635
# 'blame' action: delegate to git_blame_common() without a format argument,
# i.e. the ordinary (non-incremental) blame page.
sub git_blame {
        return git_blame_common();
}
6639
# 'blame_incremental' action: delegate to git_blame_common() asking for the
# 'incremental' format (page skeleton that requires JavaScript to fill in).
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6643
# 'blame_data' action: delegate to git_blame_common() asking for the 'data'
# format (plain-text output of git-blame --incremental).
sub git_blame_data {
        return git_blame_common('data');
}
6647
# 'tags' action: page header, navigation bar anchored at the project's head
# commit, and the list of tags (the list body is omitted when there are none).
sub git_tags {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                           format_ref_views('tags'));
        git_print_header_div('summary', $project);

        my @tags = git_get_tags_list();
        git_tags_body(\@tags) if @tags;

        git_footer_html();
}
6660
# 'heads' action: page header, navigation bar anchored at the project's head
# commit, and the list of heads (the list body is omitted when there are none).
sub git_heads {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                           format_ref_views('heads'));
        git_print_header_div('summary', $project);

        my @heads = git_get_heads_list();
        git_heads_body(\@heads, $head_hash) if @heads;

        git_footer_html();
}
6673
# 'remotes' action, serving two views:
#  - a single remote, when a name is passed in the 'hash' input parameter
#  - the list of all remotes otherwise
# Refused with 403 unless the 'remote_heads' feature is enabled.
sub git_remotes {
        unless (gitweb_check_feature('remote_heads')) {
                die_error(403, "Remote heads view is disabled");
        }

        my $head_hash   = git_get_head_hash($project);
        my $remote_name = $input_params{'hash'};

        my $remotes = git_get_remotes_list($remote_name);
        defined $remotes
                or die_error(500, "Unable to get remote information");

        # an empty result means "nothing matched", which is a 404 in both views
        if (!%$remotes) {
                my $message = defined $remote_name
                        ? "Remote $remote_name not found"
                        : "No remotes found";
                die_error(404, $message);
        }

        git_header_html(undef, undef, -action_extra => $remote_name);
        git_print_page_nav('', '', $head_hash, undef, $head_hash,
                           format_ref_views($remote_name ? '' : 'remotes'));

        fill_remote_heads($remotes);
        if (!defined $remote_name) {
                # list of all the remotes
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotes, undef, $head_hash);
        } else {
                # single remote
                git_print_header_div('remotes', "$remote_name remote for $project");
                git_remote_block($remote_name, $remotes->{$remote_name},
                                 undef, $head_hash);
        }

        git_footer_html();
}
6706
# 'blob_plain' action: send the contents of a blob verbatim.
#
# The optional argument is a content type; it is passed on to
# blob_contenttype() together with the opened blob and $file_name, and the
# result is what gets sent (subject to the $prevent_xss rewriting below).
#
# The blob is identified by the global $hash; when that is not set it is
# looked up by $file_name in $hash_base (or in the project's head commit if
# $hash_base is empty).  Dies with 400 if neither is given, 404 if the path
# cannot be resolved, 500 if git-cat-file cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name is emitted inside a quoted-string in the Content-Disposition
        # header and may come straight from the repository: replace control
        # characters (a raw CR/LF would break the header) and backslash-escape
        # '"' and '\', the same escaping git_snapshot applies to its filename.
        $save_as =~ s/[[:cntrl:]]/?/g;
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain; likewise textual */*+xml types
        # (application/xhtml+xml, image/svg+xml, ...).  The subtype in front
        # of "+xml" has to be allowed more than one character, otherwise no
        # real-world XML media type ever matches.
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z][a-z0-9.-]*\+xml\b(.*)$! && -T $fd))) {
                # $1 is whatever followed the media type (e.g. "; charset=...")
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # slurp mode: the blob is copied to STDOUT as a single raw chunk
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6768
# 'blob' action: HTML view of a single blob.
#
# The blob is identified by the global $hash; when that is not set it is
# looked up by $file_name in $hash_base (or in the project's head commit if
# $hash_base is empty).  Depending on the detected mimetype the blob is
#  - handed over to git_blob_plain() (neither text/* nor gif/png/jpeg image,
#    and the content tests as binary),
#  - shown as an <img> pointing at the 'blob_plain' view (image/*), or
#  - printed line by line with line-number anchors, optionally run through
#    the syntax highlighter.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        # when a syntax was guessed, read the highlighter's output instead
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: empty navigation bar, hash as title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                # the URL is written into an attribute by hand, so it gets the
                # same esc_attr() treatment as the line-number links below
                print qq! src="! .
                      esc_attr(href(action=>"blob_plain", hash=>$hash,
                                    hash_base=>$hash_base, file_name=>$file_name)) .
                      qq!" />\n!;
        } else {
                my $nr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        # highlighter output is passed through sanitize();
                        # plain blob content through esc_html()
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, esc_attr(href(-replay => 1)), $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
6861
# 'tree' action: list the entries of a tree object as an HTML table.
#
# $hash_base defaults to "HEAD".  The tree is taken from the global $hash;
# when that is not set it is resolved from $file_name within $hash_base, or
# is $hash_base itself if no file name was given.  Dies with 404 when no tree
# can be determined or git-ls-tree exits with an error.
sub git_tree {
        $hash_base = "HEAD" unless defined $hash_base;
        unless (defined $hash) {
                $hash = defined $file_name
                        ? git_get_hash_by_path($hash_base, $file_name, "tree")
                        : $hash_base;
        }
        defined($hash)
                or die_error(404, "No such tree");

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        # read all NUL-terminated ls-tree records up front
        my @entries;
        {
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                chomp(@entries = <$fd>);
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav;
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history");
                        push @views_nav,
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                }
                # FIXME: Should be available when we have no hash base as well.
                my $snapshot_links = format_snapshot_links($hash);
                push @views_nav, $snapshot_links
                        if defined $snapshot_links;

                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # base is not a parseable commit: forget it, show the bare hash
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                $basedir = $file_name;
                $basedir .= '/'
                        if ($basedir ne '' && substr($basedir, -1) ne '/');
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";

        # rows alternate between the two classes, starting with "dark";
        # $alternate is used as the index and flipped after every row
        my @row_class = ('light', 'dark');
        my $alternate = 1;

        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                print "<tr class=\"$row_class[$alternate]\">\n";
                $alternate ^= 1;

                # parent directory: path without its last component,
                # undefined for the top level
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                undef $up unless $up;
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $entry (@entries) {
                my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

                print "<tr class=\"$row_class[$alternate]\">\n";
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n</div>";
        git_footer_html();
}
6971
# Build the base name used for a snapshot, "<project>-<version>".
#
# Arguments: project path and the requested hash / ref name.
# Returns the name in scalar context and the pair (name, name) in list
# context (git_snapshot uses the pair as file name and archive prefix).
sub snapshot_name {
        my ($project, $hash) = @_;

        # project part:
        #   path/to/project.git  -> project
        #   path/to/project/.git -> project
        my $name = to_utf8($project);
        $name =~ s,([^/])/*\.git$,$1,;
        $name = basename($name);
        # sanitize name
        $name =~ s/[[:cntrl:]]/?/g;

        # version part
        my $version;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # looks like a SHA-1: shorten it if it is long enough and
                # really is a prefix of the full hash, else keep it as given
                $version = $hash;
                my $full = git_get_full_hash($project, $hash);
                $version = git_get_short_hash($project, $hash)
                        if ($full =~ /^$hash/ && length($hash) > 7);
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $version = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                $version = ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!) ? $1 : $hash;
                $version .= '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $version =~ s!/!.!g;

        # name = project-version_string
        $name = "$name-$version";

        return $name unless wantarray;
        return ($name, $name);
}
7008
# 'snapshot' action: send an archive of a tree-ish produced by git-archive.
#
# The format comes from the 'snapshot_format' input parameter and defaults
# to the first entry of @snapshot_fmts.  Dies with
#   403 - snapshots are disabled, or the format is disabled / not offered
#   400 - malformed or unknown format, or the object is a blob
#   404 - the object does not exist
#   500 - the archive command could not be started
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # peel tags etc. down to the underlying object before checking its type
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
        # shell command line: git-archive, optionally piped to a compressor
        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # Start the command before any output is produced, so that a failure
        # is reported with a proper error response rather than as an error
        # page appended to an already sent "200 OK" header.
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        # the filename goes into a quoted-string: escape '"' and '\'
        $filename =~ s/(["\\])/\\$1/g;
        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                -status => '200 OK');

        binmode STDOUT, ':raw';
        {
                # Copy the archive in fixed-size records instead of slurping
                # it into memory as a list of newline-terminated "lines".
                local $/ = \65536;
                while (my $chunk = <$fd>) {
                        print $chunk;
                }
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7056
# Common driver for log-like views.
#
# Arguments:
#   $fmt_name  - name of the view, used for paging and page navigation
#   $body_subr - code ref that prints the body; called with
#                (\@commits, 0, 99, $refs, $next_link,
#                 $file_name, $file_hash, $ftype)
#   $base      - revision to start from (defaults to the project's head)
#   $parent    - if defined, the range "$parent..$base" is listed
#   $file_name - if defined, restrict to this path (with --full-history)
#   $file_hash - object id of that path, looked up if not given
#
# One page shows 100 commits; 101 are requested so that the presence of a
# next page can be detected.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0     unless defined $page;
        my $refs = git_get_references();

        my $revision = defined $parent ? "$parent..$base" : $base;
        my @path_limit = defined $file_name ? ($file_name, "--full-history") : ();
        my @commitlist =
                parse_commits($revision, 101, (100 * $page), @path_limit);

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        $ftype = git_get_type($file_hash)
                if defined $file_hash;
        die_error(500, "Unknown type of object")
                if (defined $file_name && !defined $ftype);

        my %co;
        if (defined $file_name) {
                unless (%co = parse_commit($base)) {
                        die_error(404, "Unknown commit object");
                }
        }

        # a 101st commit means there is another page
        my $have_next = $#commitlist >= 100;
        my $paging_nav = format_paging_nav($fmt_name, $page, $have_next);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # NOTE(review): gitweb_get_feature() is called in scalar context here;
        # confirm it yields the configured limit rather than an element count.
        my $patch_max = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name
            && ($patch_max < 0 || @commitlist <= $patch_max)) {
                $paging_nav .= " &sdot; " .
                        $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                "patches");
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (!defined $file_name) {
                git_print_header_div('summary', $project);
        } else {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
                git_print_page_path($file_name, $ftype, $hash_base);
        }

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
7130
# 'log' action: git_log_generic() with git_log_body as the body printer,
# starting at $hash and limited by $hash_parent.
sub git_log {
        return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
7135
# Action handler for the 'commit' view.
#
# Shows a single commit ($hash, falling back to $hash_base, then "HEAD"):
# navigation bar, header table (authorship, commit id, tree, parents),
# the commit message, and the list of changed files from git-diff-tree.
# Dies with 404 if the commit cannot be parsed or diff-tree output cannot
# be read, and with 500 if git-diff-tree cannot be started.
sub git_commit {
	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
		or die_error(404, "Unknown commit object");

	my $parent       = $co{'parent'};
	my $parents      = $co{'parents'}; # listref
	my $parent_count = @$parents;

	# link to the 'commit' view of a parent, labelled with its abbreviated id
	my $abbrev_link = sub {
		my ($id) = @_;
		return $cgi->a({-href => href(action=>"commit", hash=>$id)},
		               esc_html(substr($id, 0, 7)));
	};

	# $formats_nav has to be built before any parameter munging below
	my $formats_nav;
	if (!defined $parent) {
		# --root commitdiff
		$formats_nav = '(initial)';
	} elsif ($parent_count == 1) {
		# single parent commit
		$formats_nav = '(parent: ' . $abbrev_link->($parent) . ')';
	} else {
		# merge commit
		$formats_nav =
			'(merge: ' .
			join(' ', map { $abbrev_link->($_) } @$parents) .
			')';
	}
	if (gitweb_check_feature('patches') && $parent_count <= 1) {
		$formats_nav .= " | " .
			$cgi->a({-href => href(action=>"patch", -replay=>1)}, "patch");
	}

	# a parentless commit is diffed against the empty tree
	$parent = "--root" unless defined $parent;

	# list of changed files; merges use the combined ('-c') format
	open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
		@diff_opts,
		($parent_count <= 1 ? $parent : '-c'),
		$hash, "--"
		or die_error(500, "Open git-diff-tree failed");
	chomp(my @difftree = <$fd>);
	close $fd or die_error(404, "Reading git-diff-tree failed");

	# non-textual hash id's can be cached
	my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;

	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $co{'id'});

	git_header_html(undef, $expires);
	git_print_page_nav('commit', '',
	                   $hash, $co{'tree'}, $hash,
	                   $formats_nav);

	# the header links to the commitdiff when there is a parent to diff
	# against, and to the tree otherwise
	if (defined $co{'parent'}) {
		git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
	} else {
		git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
	}

	# object header table: authorship, commit id, tree, parents
	print qq(<div class="title_text">\n) .
	      qq(<table class="object_header">\n);
	git_print_authorship_rows(\%co);
	print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

	my $tree_id = $co{'tree'};
	print qq(<tr>) .
	      qq(<td>tree</td>) .
	      qq(<td class="sha1">) .
	      $cgi->a({-href => href(action=>"tree", hash=>$tree_id, hash_base=>$hash),
	               class => "list"}, $tree_id) .
	      qq(</td>) .
	      qq(<td class="link">) .
	      $cgi->a({-href => href(action=>"tree", hash=>$tree_id, hash_base=>$hash)},
	              "tree");
	my $snapshot_links = format_snapshot_links($hash);
	print " | " . $snapshot_links if defined $snapshot_links;
	print qq(</td>) .
	      qq(</tr>\n);

	# one row per parent, with links to the parent commit and to the diff
	# of this commit against that parent
	foreach my $par (@$parents) {
		my $id_link     = $cgi->a({-href => href(action=>"commit", hash=>$par),
		                           class => "list"}, $par);
		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit");
		my $diff_link   = $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
		print qq(<tr>) .
		      qq(<td>parent</td>) .
		      qq(<td class="sha1">) .
		      $id_link .
		      qq(</td>) .
		      qq(<td class="link">) .
		      $commit_link .
		      " | " .
		      $diff_link .
		      qq(</td>) .
		      qq(</tr>\n);
	}
	print qq(</table>) .
	      qq(</div>\n);

	# commit message
	print qq(<div class="page_body">\n);
	git_print_log($co{'comment'});
	print "</div>\n";

	# changed files
	git_difftree_body(\@difftree, $hash, @$parents);

	git_footer_html();
}
7249
# Action handler for the 'object' view.
#
# Works out the type of the requested object and redirects (302) to the
# action named after that type.  The object is identified by either
#  - hash or hash_base alone, or
#  - hash_base and file_name.
# Dies with 404 if the object (or the path within the base) cannot be
# found, 400 if neither form of identification was supplied, and 500 if
# git-ls-tree cannot be started.
sub git_object {
	my $type;

	# - hash or hash_base alone
	if ($hash || ($hash_base && !defined $file_name)) {
		my $object_id = $hash || $hash_base;

		# stderr is discarded, so a missing object yields no output at all
		open my $fd, "-|", quote_command(
			git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
			or die_error(404, "Object does not exist");
		$type = <$fd>;
		# nothing was read if the object does not exist; avoid chomp(undef)
		# (and its warning) and let the close check below report the 404
		chomp $type if defined $type;
		close $fd
			or die_error(404, "Object does not exist");

	# - hash_base and file_name
	} elsif ($hash_base && defined $file_name) {
		# drop trailing slashes before handing the path to ls-tree
		$file_name =~ s,/+$,,;

		system(git_cmd(), "cat-file", '-e', $hash_base) == 0
			or die_error(404, "Base object does not exist");

		# here errors should not happen
		open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
			or die_error(500, "Open git-ls-tree failed");
		my $line = <$fd>;
		close $fd;

		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
		unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
			die_error(404, "File or directory for given base does not exist");
		}
		$type = $2;
		$hash = $3;
	} else {
		die_error(400, "Not enough information to find object");
	}

	# the object type doubles as the name of the action to redirect to
	print $cgi->redirect(-uri => href(action=>$type, -full=>1,
	                                  hash=>$hash, hash_base=>$hash_base,
	                                  file_name=>$file_name),
	                     -status => '302 Found');
}
7296
# Action handler for the 'blobdiff' view (and, via git_blobdiff_plain,
# the 'blobdiff_plain' view).
#
# Parameter:
#   $format - 'html' (default) or 'plain'; anything else dies with 400.
#
# Needs $hash_base and $hash_parent_base, plus either $file_name or a
# full 40-hex-digit $hash from which the file name is looked up in the
# raw diff-tree output.  Dies with 400 on missing or ambiguous parameters,
# 404 if no matching diff entry exists (or the parameters were given only
# in a form this code does not handle), 500 if git cannot be started.
sub git_blobdiff {
	my $format = shift || 'html';
	my $diff_style = $input_params{'diff_style'} || 'inline';

	my $fd;
	my @difftree;
	my %diffinfo;
	my $expires;

	# preparing $fd and %diffinfo for git_patchset_body
	# new style URI
	if (defined $hash_base && defined $hash_parent_base) {
		if (defined $file_name) {
			# read raw output
			open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
				$hash_parent_base, $hash_base,
				"--", (defined $file_parent ? $file_parent : ()), $file_name
				or die_error(500, "Open git-diff-tree failed");
			@difftree = map { chomp; $_ } <$fd>;
			close $fd
				or die_error(404, "Reading git-diff-tree failed");
			@difftree
				or die_error(404, "Blob diff not found");

		} elsif (defined $hash &&
		         $hash =~ m/^[0-9a-fA-F]{40}$/) {
			# try to find filename from $hash
			# (the check is anchored: $hash is interpolated into the
			# regex below, so it must be nothing but a full object id)

			# read filtered raw output
			open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
				$hash_parent_base, $hash_base, "--"
				or die_error(500, "Open git-diff-tree failed");
			@difftree =
				# ':100644 100644 03b21826... 3b93d5e7... M	ls-files.c'
				# $hash == to_id
				grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
				map { chomp; $_ } <$fd>;
			close $fd
				or die_error(404, "Reading git-diff-tree failed");
			@difftree
				or die_error(404, "Blob diff not found");

		} else {
			die_error(400, "Missing one of the blob diff parameters");
		}

		if (@difftree > 1) {
			die_error(400, "Ambiguous blob diff specification");
		}

		# fill in whichever of the names / ids were not given explicitly
		%diffinfo = parse_difftree_raw_line($difftree[0]);
		$file_parent ||= $diffinfo{'from_file'} || $file_name;
		$file_name   ||= $diffinfo{'to_file'};

		$hash_parent ||= $diffinfo{'from_id'};
		$hash        ||= $diffinfo{'to_id'};

		# non-textual hash id's can be cached
		if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
		    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
			$expires = '+1d';
		}

		# open patch output
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			'-p', ($format eq 'html' ? "--full-index" : ()),
			$hash_parent_base, $hash_base,
			"--", (defined $file_parent ? $file_parent : ()), $file_name
			or die_error(500, "Open git-diff-tree failed");
	}

	# old/legacy style URI -- not generated anymore since 1.4.3.
	# Nothing above handled the request, so there is no diff to show.
	# die_error() is given a numeric status code, as everywhere else.
	if (!%diffinfo) {
		die_error(404, "Missing one of the blob diff parameters")
	}

	# header
	if ($format eq 'html') {
		my $formats_nav =
			$cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
			        "raw");
		$formats_nav .= diff_style_nav($diff_style);
		git_header_html(undef, $expires);
		if (defined $hash_base && (my %co = parse_commit($hash_base))) {
			git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
			git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
		} else {
			print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
			print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
		}
		if (defined $file_name) {
			git_print_page_path($file_name, "blob", $hash_base);
		} else {
			print "<div class=\"page_path\"></div>\n";
		}

	} elsif ($format eq 'plain') {
		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => 'inline; filename="' . "$file_name" . '.patch"');

		print "X-Git-Url: " . $cgi->self_url() . "\n\n";

	} else {
		die_error(400, "Unknown blobdiff format");
	}

	# patch
	if ($format eq 'html') {
		print "<div class=\"page_body\">\n";

		git_patchset_body($fd, $diff_style,
		                  [ \%diffinfo ], $hash_base, $hash_parent_base);
		close $fd;

		print "</div>\n"; # class="page_body"
		git_footer_html();

	} else {
		# patch header: replace any a/<id> and b/<id> with the file
		# names, up to and including the '+++' line ...
		while (my $line = <$fd>) {
			$line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
			$line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

			print $line;

			last if $line =~ m!^\+\+\+!;
		}
		# ... then pass the rest of the patch through untouched
		local $/ = undef;
		print <$fd>;
		close $fd;
	}
}
7431
# Action handler for the 'blobdiff_plain' view: git_blobdiff() in its
# 'plain' output format.
sub git_blobdiff_plain {
	return git_blobdiff('plain');
}
7435
# Build the navigation fragment for switching between diff styles.
#
# Parameters:
#   $diff_style  - currently selected style; a false value means 'inline'
#   $is_combined - true for combined (merge) diffs, which get no switcher
#
# Returns "" for combined diffs.  Otherwise returns one " | <entry>" per
# known style, in display order; the current style appears as plain text
# and every other style as a link replaying the request with that
# diff_style.  The result is meant to be appended to existing navigation,
# which is why it reads "| foo | bar" rather than just "foo | bar".
sub diff_style_nav {
	my ($diff_style, $is_combined) = @_;
	$diff_style ||= 'inline';

	return "" if ($is_combined);

	# [ style id, visible label ], in display order
	my @choices = (
		[ 'inline',     'inline'       ],
		[ 'sidebyside', 'side by side' ],
	);

	my @entries;
	foreach my $choice (@choices) {
		my ($style, $label) = @$choice;
		push @entries,
			$style eq $diff_style
				? $label
				: $cgi->a({-href => href(-replay=>1, diff_style => $style)}, $label);
	}

	return join '', map { " | ".$_ } @entries;
}
7456
# Action handler for the 'commitdiff' view and its plain / patch variants.
#
# Named parameters (passed as a flat key => value list):
#   -format - 'html' (default), 'plain' (raw diff with mail-like headers)
#             or 'patch' (git-format-patch output); anything else dies
#             with 400
#   -single - with -format => 'patch' and no parent given, limit the
#             output to a single patch
#
# Uses the globals $hash (falling back to $hash_base, then "HEAD") and
# $hash_parent.  Dies with 403 if patch view is requested but the
# 'patches' feature is off, 404 for an unknown commit, and 500 if the git
# command cannot be started.
sub git_commitdiff {
	my %params = @_;
	my $format = $params{-format} || 'html';
	my $diff_style = $input_params{'diff_style'} || 'inline';

	my ($patch_max) = gitweb_get_feature('patches');
	if ($format eq 'patch') {
		die_error(403, "Patch view not allowed") unless $patch_max;
	}

	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
		or die_error(404, "Unknown commit object");

	# choose format for commitdiff for merge
	if (! defined $hash_parent && @{$co{'parents'}} > 1) {
		$hash_parent = '--cc';
	}
	# we need to prepare $formats_nav before almost any parameter munging
	my $formats_nav;
	if ($format eq 'html') {
		$formats_nav =
			$cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
			        "raw");
		if ($patch_max && @{$co{'parents'}} <= 1) {
			$formats_nav .= " | " .
				$cgi->a({-href => href(action=>"patch", -replay=>1)},
				        "patch");
		}
		$formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

		if (defined $hash_parent &&
		    $hash_parent ne '-c' && $hash_parent ne '--cc') {
			# commitdiff with two commits given
			my $hash_parent_short = $hash_parent;
			if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
				$hash_parent_short = substr($hash_parent, 0, 7);
			}
			$formats_nav .=
				' (from';
			# say which parent it is, if it is one of the commit's parents
			for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
				if ($co{'parents'}[$i] eq $hash_parent) {
					$formats_nav .= ' parent ' . ($i+1);
					last;
				}
			}
			$formats_nav .= ': ' .
				$cgi->a({-href => href(-replay=>1,
				                       hash=>$hash_parent, hash_base=>undef)},
				        esc_html($hash_parent_short)) .
				')';
		} elsif (!$co{'parent'}) {
			# --root commitdiff
			$formats_nav .= ' (initial)';
		} elsif (scalar @{$co{'parents'}} == 1) {
			# single parent commit
			$formats_nav .=
				' (parent: ' .
				$cgi->a({-href => href(-replay=>1,
				                       hash=>$co{'parent'}, hash_base=>undef)},
				        esc_html(substr($co{'parent'}, 0, 7))) .
				')';
		} else {
			# merge commit: offer the other merge-diff format
			if ($hash_parent eq '--cc') {
				$formats_nav .= ' | ' .
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$hash, hash_parent=>'-c')},
					        'combined');
			} else { # $hash_parent eq '-c'
				$formats_nav .= ' | ' .
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$hash, hash_parent=>'--cc')},
					        'compact');
			}
			$formats_nav .=
				' (merge: ' .
				join(' ', map {
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$_, hash_base=>undef)},
					        esc_html(substr($_, 0, 7)));
				} @{$co{'parents'}} ) .
				')';
		}
	}

	my $hash_parent_param = $hash_parent;
	if (!defined $hash_parent_param) {
		# --cc for multiple parents, --root for parentless
		$hash_parent_param =
			@{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
	}

	# read commitdiff
	my $fd;
	my @difftree;
	if ($format eq 'html') {
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			"--no-commit-id", "--patch-with-raw", "--full-index",
			$hash_parent_param, $hash, "--"
			or die_error(500, "Open git-diff-tree failed");

		while (my $line = <$fd>) {
			chomp $line;
			# empty line ends raw part of diff-tree output
			last unless $line;
			push @difftree, scalar parse_difftree_raw_line($line);
		}

	} elsif ($format eq 'plain') {
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			'-p', $hash_parent_param, $hash, "--"
			or die_error(500, "Open git-diff-tree failed");
	} elsif ($format eq 'patch') {
		# For commit ranges, we limit the output to the number of
		# patches specified in the 'patches' feature.
		# For single commits, we limit the output to a single patch,
		# diverging from the git-format-patch default.
		my @commit_spec = ();

		# '-c' and '--cc' are merge-format switches for diff-tree ('--cc'
		# is filled in above for merge commits); they are not revisions,
		# so they must not be used as the start of a "<rev>..<rev>" range.
		my $range_start = $hash_parent;
		if (defined $range_start &&
		    ($range_start eq '-c' || $range_start eq '--cc')) {
			undef $range_start;
		}

		if ($range_start) {
			if ($patch_max > 0) {
				push @commit_spec, "-$patch_max";
			}
			push @commit_spec, '-n', "$range_start..$hash";
		} else {
			if ($params{-single}) {
				push @commit_spec, '-1';
			} else {
				if ($patch_max > 0) {
					push @commit_spec, "-$patch_max";
				}
				push @commit_spec, "-n";
			}
			push @commit_spec, '--root', $hash;
		}
		open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
			'--encoding=utf8', '--stdout', @commit_spec
			or die_error(500, "Open git-format-patch failed");
	} else {
		die_error(400, "Unknown commitdiff format");
	}

	# non-textual hash id's can be cached
	my $expires;
	if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		$expires = "+1d";
	}

	# write commit message
	if ($format eq 'html') {
		my $refs = git_get_references();
		my $ref = format_ref_marker($refs, $co{'id'});

		git_header_html(undef, $expires);
		git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
		git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
		print "<div class=\"title_text\">\n" .
		      "<table class=\"object_header\">\n";
		git_print_authorship_rows(\%co);
		print "</table>".
		      "</div>\n";
		print "<div class=\"page_body\">\n";
		# the title is already in the header; print the log only if
		# the message has more than that one line
		if (@{$co{'comment'}} > 1) {
			print "<div class=\"log\">\n";
			git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
			print "</div>\n"; # class="log"
		}

	} elsif ($format eq 'plain') {
		# NOTE(review): $refs is not read anywhere in this branch --
		# confirm whether this call is still needed
		my $refs = git_get_references("tags");
		my $tagname = git_get_rev_name_tags($hash);
		my $filename = basename($project) . "-$hash.patch";

		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => 'inline; filename="' . "$filename" . '"');
		# mail-like pseudo-headers, printed as part of the response body
		my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
		print "From: " . to_utf8($co{'author'}) . "\n";
		print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
		print "Subject: " . to_utf8($co{'title'}) . "\n";

		print "X-Git-Tag: $tagname\n" if $tagname;
		print "X-Git-Url: " . $cgi->self_url() . "\n\n";

		foreach my $line (@{$co{'comment'}}) {
			print to_utf8($line) . "\n";
		}
		print "---\n\n";
	} elsif ($format eq 'patch') {
		my $filename = basename($project) . "-$hash.patch";

		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => 'inline; filename="' . "$filename" . '"');
	}

	# write patch
	if ($format eq 'html') {
		# diff against all parents unless one specific parent was given
		my $use_parents = !defined $hash_parent ||
			$hash_parent eq '-c' || $hash_parent eq '--cc';
		git_difftree_body(\@difftree, $hash,
		                  $use_parents ? @{$co{'parents'}} : $hash_parent);
		print "<br/>\n";

		git_patchset_body($fd, $diff_style,
		                  \@difftree, $hash,
		                  $use_parents ? @{$co{'parents'}} : $hash_parent);
		close $fd;
		print "</div>\n"; # class="page_body"
		git_footer_html();

	} elsif ($format eq 'plain') {
		# headers are already sent, so a failure can only be reported inline
		local $/ = undef;
		print <$fd>;
		close $fd
			or print "Reading git-diff-tree failed\n";
	} elsif ($format eq 'patch') {
		local $/ = undef;
		print <$fd>;
		close $fd
			or print "Reading git-format-patch failed\n";
	}
}
7684
# Action handler for the 'commitdiff_plain' view: git_commitdiff() with
# -format set to 'plain'.
sub git_commitdiff_plain {
	return git_commitdiff('-format' => 'plain');
}
7688
# format-patch-style patches
#
# Action handler for the 'patch' view: git_commitdiff() with -format set
# to 'patch' and the -single flag set.
sub git_patch {
	return git_commitdiff('-format' => 'patch', '-single' => 1);
}
7693
# Action handler for the 'patches' view: git_commitdiff() with -format set
# to 'patch' and no -single flag.
sub git_patches {
	return git_commitdiff('-format' => 'patch');
}
7697
# Action handler for the 'history' view.
# Hands off to git_log_generic() with the format name 'history',
# git_history_body as the body-rendering callback, and the globals
# $hash_base, $hash_parent_base, $file_name and $hash.
sub git_history {
	return git_log_generic('history', \&git_history_body,
	                       $hash_base, $hash_parent_base, $file_name, $hash);
}
7703
# Action handler for the 'search' view.
#
# Checks that the requested kind of search ($searchtype, default 'commit')
# is enabled, fills in defaults for $hash and $page, and dispatches to the
# routine implementing that kind of search, passing it the parsed commit.
# Dies with 403 if the needed feature is disabled, 400 if there is no
# search text or the search type is unknown, 404 for an unknown commit.
sub git_search {
	$searchtype ||= 'commit';

	# check if appropriate features are enabled
	die_error(403, "Search is disabled")
		unless gitweb_check_feature('search');
	# pickaxe may take all resources of your box and run for several minutes
	# with every query - so decide by yourself how public you make this feature
	if ($searchtype eq 'pickaxe' && !gitweb_check_feature('pickaxe')) {
		die_error(403, "Pickaxe search is disabled");
	}
	# grep search might be potentially CPU-intensive, too
	if ($searchtype eq 'grep' && !gitweb_check_feature('grep')) {
		die_error(403, "Grep search is disabled");
	}

	die_error(400, "Text field is empty")
		unless defined $searchtext;

	# search from the project's head unless a starting point was given
	$hash = git_get_head_hash($project)
		unless defined $hash;
	my %co = parse_commit($hash);
	die_error(404, "Unknown commit object")
		unless %co;

	$page = 0
		unless defined $page;

	# search type => routine that performs it
	my %searcher_for = (
		'commit'    => \&git_search_message,
		'author'    => \&git_search_message,
		'committer' => \&git_search_message,
		'pickaxe'   => \&git_search_changes,
		'grep'      => \&git_search_files,
	);

	if (my $searcher = $searcher_for{$searchtype}) {
		$searcher->(%co);
	} else {
		die_error(400, "Unknown search type");
	}
}
7748
# Action handler for the 'search_help' view.
#
# Prints a static help page describing the search types.  The 'commit',
# 'author' and 'committer' entries are always shown; the 'grep' and
# 'pickaxe' entries only when the corresponding feature is enabled.
sub git_search_help {
	git_header_html();
	git_print_page_nav('','', $hash,$hash,$hash);

	# general explanation, opening of the list, and the 'commit' entry
	print <<'HELP_INTRO';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

	if (gitweb_check_feature('grep')) {
		print <<'HELP_GREP';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
	}

	print <<'HELP_PEOPLE';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

	if (gitweb_check_feature('pickaxe')) {
		print <<'HELP_PICKAXE';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
	}

	print "</dl>\n";
	git_footer_html();
}
7792
# Action handler for the 'shortlog' view.
# Hands off to git_log_generic() with the format name 'shortlog',
# git_shortlog_body as the body-rendering callback, and the global
# $hash / $hash_parent.
sub git_shortlog {
	return git_log_generic('shortlog', \&git_shortlog_body, $hash, $hash_parent);
}
7797
7798 ## ......................................................................
7799 ## feeds (RSS, Atom; OPML)
7800
# Print a web feed (RSS 2.0 or Atom) describing recent commits.
#
# Parameters:
#   $format - 'rss' or 'atom'; defaults to 'atom' when omitted or false.
#             Any other value is reported through die_error(400, ...).
#
# Request state is taken from file-level variables ($cgi, $project, $action,
# $hash, $file_name, $site_name, $logo, $favicon, ...):
#   * no $hash, no $file_name -> log of HEAD
#   * $hash only              -> log of the given branch
#   * $file_name              -> history of that file/directory
#
# Output goes to the currently selected filehandle: first the HTTP header
# (with Last-Modified when at least one commit was found), then the XML
# document.  A "304 Not Modified" header alone is printed when the client
# sent If-Modified-Since and the newest commit is not newer than that date;
# for HEAD requests only the header is printed.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                # The key is 'committer_tz' (double "t"), spelled like the other
                # committer_* keys used in this sub; a misspelled key would
                # silently pass undef as the timezone.
                %latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # Parsing the date needs an optional module; when neither
                        # is installed $since stays undefined and the full feed
                        # is sent.
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # The title is interpolated into XML element content below; its parts
        # (site name, project, ref name, file name) may contain characters that
        # are special in XML, so escape it like every other text field here.
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (defined $descr) {
                $descr = esc_html($descr);
        } else {
                # fallback description; escaped because it embeds the project name
                $descr = esc_html("$project " .
                                  ($format eq 'rss' ? 'RSS' : 'Atom') .
                                  " feed");
        }
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        # HTML page that corresponds to this feed
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        foreach my $i (0 .. $#commitlist) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files; a commit whose diff-tree cannot be
                # run or read is left out of the feed instead of aborting it
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }

                # body shared by both formats: commit message, then changed files
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        $line = esc_html($line);
                        print "$line\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        # per-file links: [D]iff, optional [B]lame, [H]istory
                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
8056
# 'rss' action: produce the feed in RSS format by delegating to git_feed().
sub git_rss {
        return git_feed('rss');
}
8060
# 'atom' action: produce the feed in Atom format by delegating to git_feed().
sub git_atom {
        return git_feed('atom');
}
8064
# Print an OPML document with one RSS <outline> per project returned by
# git_get_projects_list($project_filter, $strict_export).
#
# Reports 404 through die_error() when the project list is empty.  Projects
# for which git_get_head_hash() gives no head, or for which parse_commit()
# returns nothing, are left out of the listing.
sub git_opml {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # the suffix is added to the title only when a project filter is set
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        PROJECT:
        foreach my $entry (@projects) {
                my $proj_path = $entry->{'path'};

                my $head = git_get_head_hash($proj_path);
                next PROJECT unless defined $head;

                # $git_dir is pointed at this project before parse_commit() runs
                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next PROJECT unless %co;

                # shortened, escaped project path used for both text and title
                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print qq{<outline type="rss" text="$path" title="$path" xmlUrl="$rss" htmlUrl="$html"/>\n};
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}