gitweb: JavaScript ability to adjust time based on timezone
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
# send everything printed to STDOUT through the :utf8 output layer
21 binmode STDOUT, ':utf8';
22
# time at which the script started, as returned by gettimeofday()
23 our $t0 = [ gettimeofday() ];
# number of git commands run so far; incremented by the code that runs git
24 our $number_of_git_cmds = 0;
25
# when running under mod_perl (MOD_PERL set in the environment),
# call CGI->compile() at compile time
26 BEGIN {
27         CGI->compile() if $ENV{'MOD_PERL'};
28 }
29
# gitweb version string; ++GIT_VERSION++ looks like a placeholder that is
# filled in when gitweb is built -- TODO confirm against the build system
30 our $version = "++GIT_VERSION++";
31
our ($my_url, $my_uri, $base_url, $path_info, $home_link);

# Work out the URL-related globals for the current request:
#   $my_url    - full URL of the script
#   $my_uri    - absolute (host-less) URL of the script
#   $base_url  - base for relative URLs in gitweb ($logo, $favicon, ...);
#                needed and used only for URLs with nonempty PATH_INFO
#   $path_info - PATH_INFO from the environment (global, used later on)
#   $home_link - target of the home link on top of all pages
sub evaluate_uri {
        our ($cgi, $my_url, $my_uri, $base_url, $path_info, $home_link);

        $my_url   = $cgi->url();
        $my_uri   = $cgi->url(-absolute => 1);
        $base_url = $my_url;

        # When the script serves as DirectoryIndex, the URL lacks the name of
        # the script file and $cgi->url() does not strip PATH_INFO, so it is
        # stripped by hand here.
        #
        # In that setup $my_url is not the full script URL.  That is wanted,
        # because generated links should keep implying the script name when it
        # was not spelled out in the request, but it also means $my_url is no
        # good as a base URL.  So whenever PATH_INFO had to be stripped, the
        # base URL is built from the server base and SCRIPT_NAME instead.
        $path_info = $ENV{"PATH_INFO"};
        if ($path_info) {
                my $trailing_path_info = qr{\Q$path_info\E$};
                # $my_uri is only touched when $my_url carried the suffix
                my $stripped_both =
                        ($my_url =~ s{$trailing_path_info}{}) &&
                        ($my_uri =~ s{$trailing_path_info}{});
                if ($stripped_both && defined $ENV{'SCRIPT_NAME'}) {
                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                }
        }

        # target of the home link on top of all pages
        $home_link = $my_uri || "/";
}
67
68 # core git executable to use
69 # this can just be "git" if your webserver has a sensible PATH
70 our $GIT = "++GIT_BINDIR++/git";
71
72 # absolute fs-path which will be prepended to the project path
73 #our $projectroot = "/pub/scm";
74 our $projectroot = "++GITWEB_PROJECTROOT++";
75
76 # filesystem traversal depth limit used when building the project list;
77 # the depth is counted relative to $projectroot
78 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
79
80 # string of the home link on top of all pages
81 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
82
83 # name of your site or organization to appear in page titles
84 # replace this with something more descriptive for clearer bookmarks
85 our $site_name = "++GITWEB_SITENAME++"
86                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
87
88 # filename of html text to include at top of each page
89 our $site_header = "++GITWEB_SITE_HEADER++";
90 # html text to include at home page
91 our $home_text = "++GITWEB_HOMETEXT++";
92 # filename of html text to include at bottom of each page
93 our $site_footer = "++GITWEB_SITE_FOOTER++";
94
95 # URI of stylesheets
96 our @stylesheets = ("++GITWEB_CSS++");
97 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
98 our $stylesheet = undef;
99 # URI of GIT logo (72x27 size)
100 our $logo = "++GITWEB_LOGO++";
101 # URI of GIT favicon, assumed to be image/png type
102 our $favicon = "++GITWEB_FAVICON++";
103 # URI of gitweb.js (JavaScript code for gitweb)
104 our $javascript = "++GITWEB_JS++";
105
106 # URI and label (title) of GIT logo link
107 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
108 #our $logo_label = "git documentation";
109 our $logo_url = "http://git-scm.com/";
110 our $logo_label = "git homepage";
111
112 # source of projects list
113 our $projects_list = "++GITWEB_LIST++";
114
115 # the width (in characters) of the projects list "Description" column
116 our $projects_list_description_width = 25;
117
118 # default order of projects list
119 # valid values are none, project, descr, owner, and age
120 our $default_projects_order = "project";
121
122 # show repository only if this file exists
123 # (only effective if this variable evaluates to true)
124 our $export_ok = "++GITWEB_EXPORT_OK++";
125
126 # show repository only if this subroutine returns true
127 # when given the path to the project, for example:
128 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
129 our $export_auth_hook = undef;
130
131 # only allow viewing of repositories also shown on the overview page
132 our $strict_export = "++GITWEB_STRICT_EXPORT++";
133
134 # list of git base URLs from which a project can be fetched,
135 # i.e. the full URL of a project is "$git_base_url/$project"
136 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
137
138 # default blob_plain mimetype and default charset for text/plain blob
139 our $default_blob_plain_mimetype = 'text/plain';
140 our $default_text_plain_charset  = undef;
141
142 # file to use for guessing MIME types before trying /etc/mime.types
143 # (relative to the current git repository)
144 our $mimetypes_file = undef;
145
146 # assume this charset if a line contains non-UTF-8 characters;
147 # it should be a valid encoding (see Encode::Supported(3pm) for the list)
148 # in which every byte sequence is valid, for example
149 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
150 # could even be 'utf-8' for the old behavior)
151 our $fallback_encoding = 'latin1';
152
153 # rename detection options for git-diff and git-diff-tree
154 # - default is '-M', with the cost proportional to
155 #   (number of removed files) * (number of new files).
156 # - more costly is '-C' (which implies '-M'), with the cost proportional to
157 #   (number of changed files + number of removed files) * (number of new files)
158 # - even more costly is '-C', '--find-copies-harder' with cost
159 #   (number of files in the original tree) * (number of new files)
160 # - one might want to include '-B' option, e.g. '-B', '-M'
161 our @diff_opts = ('-M'); # taken from git_commit
162
163 # Disables features that would allow repository owners to inject script into
164 # the gitweb domain.
165 our $prevent_xss = 0;
166
167 # Path to the highlight executable to use (must be the one from
168 # http://www.andre-simon.de due to assumptions about parameters and output).
169 # Useful if highlight is not installed on your webserver's PATH.
170 # [Default: highlight]
171 our $highlight_bin = "++HIGHLIGHT_BIN++";
172
# Snapshot formats gitweb is capable of serving.  Each entry maps a format
# name to a hash with these keys:
#
#       display    - display name
#       type       - mime type
#       suffix     - filename suffix
#       format     - --format for git-archive
#       compressor - compressor command and arguments
#                    (array reference, optional)
#       disabled   - boolean (optional)
our %known_snapshot_formats = (
        tgz => {
                display    => 'tar.gz',
                type       => 'application/x-gzip',
                suffix     => '.tar.gz',
                format     => 'tar',
                compressor => ['gzip'],
        },

        tbz2 => {
                display    => 'tar.bz2',
                type       => 'application/x-bzip2',
                suffix     => '.tar.bz2',
                format     => 'tar',
                compressor => ['bzip2'],
        },

        txz => {
                display    => 'tar.xz',
                type       => 'application/x-xz',
                suffix     => '.tar.xz',
                format     => 'tar',
                compressor => ['xz'],
                disabled   => 1,
        },

        zip => {
                display => 'zip',
                type    => 'application/x-zip',
                suffix  => '.zip',
                format  => 'zip',
        },
);
212
# Old spellings of gitweb.snapshot values found in repository configuration,
# mapped to the format names used in %known_snapshot_formats.
our %known_snapshot_format_aliases = (
        gzip  => 'tgz',
        bzip2 => 'tbz2',
        xz    => 'txz',

        # backward compatibility: legacy gitweb config values are still
        # recognized as aliases, but they map to no format (undef)
        (map { $_ => undef } 'x-gzip', 'gz', 'x-bzip2', 'bz2', 'x-zip', ''),
);
225
# Icon and avatar sizes, in pixels.  If the default font sizes or
# lineheights are changed, it may be appropriate to adjust these as well
# via $GITWEB_CONFIG.
our %avatar_size = (default => 16, double => 32);
233
234 # Used to set the maximum load under which we still respond to gitweb queries.
235 # If the server load exceeds this value, a 503 error is returned instead.
236 # If gitweb cannot determine the server load, it is taken to be 0.
237 # Leave it undefined (or set to 'undef') to turn off load checking.
238 our $maxload = 300;
239
# Configuration for 'highlight' (http://www.andre-simon.de/):
# file basename => syntax name
our %highlight_basename = (
        #Program   => 'py',
        #Library   => 'py',
        SConstruct => 'py',    # SCons equivalent of Makefile
        Makefile   => 'make',
);
# match by extension: file extension => syntax name
#
# Every map() below is wrapped in parentheses on purpose.  map is a list
# operator, so without them each map would take everything that follows it
# in the list as its input (including the output of the later maps), and
# the first "identity" map would end up mapping every extension to itself
# ('h' => 'h', 'html' => 'html', ...) instead of to its syntax name.
our %highlight_ext = (
        # main extensions, defining name of syntax;
        # see files in /usr/share/highlight/langDefs/ directory
        (map { $_ => $_ }
                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make)),
        # alternate extensions, see /etc/highlight/filetypes.conf
        'h' => 'c',
        (map { $_ => 'sh'  } qw(bash zsh ksh)),
        (map { $_ => 'cpp' } qw(cxx c++ cc)),
        (map { $_ => 'php' } qw(php3 php4 php5 phps)),
        (map { $_ => 'pl'  } qw(perl pm)), # perhaps also 'cgi'
        (map { $_ => 'make'} qw(mak mk)),
        (map { $_ => 'xml' } qw(xhtml html htm)),
);
263
# Site-wide feature defaults are defined here; override them from
# $GITWEB_CONFIG as necessary.
our %feature = (
        # Layout of an entry:
        #
        #       feature => {
        #               'sub'      => feature-sub (subroutine),
        #               'override' => allow-override (boolean),
        #               'default'  => [ default options...] (array reference)}
        #
        # If a feature is overridable (allow-override has a true value), then
        # feature-sub is called with the default options as parameters; the
        # return value of feature-sub indicates whether to enable the feature.
        #
        # If there is no 'sub' key (no feature-sub), the feature cannot be
        # overridden.
        #
        # Use gitweb_get_feature(<feature>) to retrieve the <feature> value
        # (an array) or gitweb_check_feature(<feature>) to check if <feature>
        # is enabled.

        # 'blame' blob view: shows the last commit that modified each line
        # of the file.  This can be very CPU-intensive.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'blame'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'blame'}{'override'} = 1;
        # and in project config gitweb.blame = 0|1;
        blame => {
                sub      => sub { feature_bool('blame', @_) },
                override => 0,
                default  => [0],
        },

        # 'snapshot' link: provides a compressed archive of any tree.  This
        # can potentially generate high traffic if you have a large project.
        #
        # The value is a list of formats defined in %known_snapshot_formats
        # that you wish to offer.
        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'snapshot'}{'default'} = [];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'snapshot'}{'override'} = 1;
        # and in project config, a comma-separated list of formats or "none"
        # to disable.  Example: gitweb.snapshot = tbz2,zip;
        snapshot => {
                sub      => \&feature_snapshot,
                override => 0,
                default  => ['tgz'],
        },

        # Text search: lists the commits whose author, committer or commit
        # text matches a given string.  Enabled by default.
        # Project specific override is not supported.
        search => {
                override => 0,
                default  => [1],
        },

        # Grep search: lists the files in the currently selected tree that
        # contain the given string.  Enabled by default.  This can be
        # potentially CPU-intensive, of course.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'grep'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'grep'}{'override'} = 1;
        # and in project config gitweb.grep = 0|1;
        grep => {
                sub      => sub { feature_bool('grep', @_) },
                override => 0,
                default  => [1],
        },

        # Pickaxe search: lists the commits that modified a given string in
        # a file.  This can be a practical and considerably faster
        # alternative to 'blame', but it is still potentially CPU-intensive.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'pickaxe'}{'override'} = 1;
        # and in project config gitweb.pickaxe = 0|1;
        pickaxe => {
                sub      => sub { feature_bool('pickaxe', @_) },
                override => 0,
                default  => [1],
        },

        # Show the size of blobs in a 'tree' view, in a separate column,
        # similar to what 'ls -l' does.  This costs a bit of IO.
        #
        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'default'} = [0];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'show-sizes'}{'override'} = 1;
        # and in project config gitweb.showsizes = 0|1;
        'show-sizes' => {
                sub      => sub { feature_bool('showsizes', @_) },
                override => 0,
                default  => [1],
        },

        # Make gitweb use an alternative format of the URLs which can be
        # more readable and natural-looking: the project name is embedded
        # directly in the path and the query string contains the other,
        # auxiliary information.  All gitweb installations recognize URLs
        # in either format; this setting configures in which format gitweb
        # generates links.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'pathinfo'}{'default'} = [1];
        # Project specific override is not supported.
        #
        # Note that you will need to change the default location of CSS,
        # favicon, logo and possibly other files to an absolute URL.  Also,
        # if gitweb.cgi serves as your indexfile, you will need to force
        # $my_uri to contain the script name in your $GITWEB_CONFIG.
        pathinfo => {
                override => 0,
                default  => [0],
        },

        # Make gitweb consider projects in project root subdirectories to be
        # forks of existing projects.  Given project $projname.git, projects
        # matching $projname/*.git will not be shown in the main projects
        # list; instead a '+' mark will be added to $projname there and a
        # 'forks' view will be enabled for the project, listing all the
        # forks.  If the project list is taken from a file, forks have to be
        # listed after the main project.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'forks'}{'default'} = [1];
        # Project specific override is not supported.
        forks => {
                override => 0,
                default  => [0],
        },

        # Insert custom links into the action bar of all project pages.
        # This mainly lets you link to third-party scripts integrating into
        # gitweb; e.g. git-browser for graphical history representation or
        # a custom web-based repository administration interface.
        #
        # The 'default' value consists of a list of triplets in the form
        # (label, link, position), where position is the label after which
        # to insert the link, and link is a format string where %n expands
        # to the project name, %f to the project path within the filesystem,
        # %h to the current hash (h gitweb parameter) and %b to the current
        # hash base (hb gitweb parameter); %% expands to %.
        #
        # To enable system wide have in $GITWEB_CONFIG e.g.
        # $feature{'actions'}{'default'} = [('graphiclog',
        #       '/git-browser/by-commit.html?r=%n', 'summary')];
        # Project specific override is not supported.
        actions => {
                override => 0,
                default  => [],
        },

        # Allow gitweb to scan the project content tags described in ctags/
        # of the project repository, and display the popular Web 2.0-ish
        # "tag cloud" near the project list.  Note that this is something
        # COMPLETELY different from the normal Git tags.
        #
        # gitweb by itself can show existing tags, but it does not handle
        # tagging itself; you need an external application for that.
        # For an example script, check Girocco's cgi/tagproj.cgi.
        # You may want to install the HTML::TagCloud Perl module to get
        # a pretty tag cloud instead of just a list of tags.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'ctags'}{'default'} = ['path_to_tag_script'];
        # Project specific override is not supported.
        ctags => {
                override => 0,
                default  => [0],
        },

        # The maximum number of patches in a patchset generated in patch
        # view.  Set this to 0 or undef to disable patch view, or to a
        # negative number to remove any limit.
        #
        # To disable system wide have in $GITWEB_CONFIG
        # $feature{'patches'}{'default'} = [0];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'patches'}{'override'} = 1;
        # and in project config gitweb.patches = 0|n;
        # where n is the maximum number of patches allowed in a patchset.
        patches => {
                sub      => \&feature_patches,
                override => 0,
                default  => [16],
        },

        # Avatar support.  When this feature is enabled, views such as
        # shortlog or commit will display an avatar associated with the
        # email of the committer(s) and/or author(s).
        #
        # Currently available providers are gravatar and picon.
        # If an unknown provider is specified, the feature is disabled.
        #
        # Gravatar depends on Digest::MD5.
        # Picon currently relies on the indiana.edu database.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'avatar'}{'default'} = ['<provider>'];
        # where <provider> is either gravatar or picon.
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'avatar'}{'override'} = 1;
        # and in project config gitweb.avatar = <provider>;
        avatar => {
                sub      => \&feature_avatar,
                override => 0,
                default  => [''],
        },

        # Display how much time and how many git commands it took to
        # generate and display the page.  Disabled by default.
        # Project specific override is not supported.
        timed => {
                override => 0,
                default  => [0],
        },

        # Turn some links into links to actions which require JavaScript to
        # run (like 'blame_incremental').  Not enabled by default.
        # Project specific override is currently not supported.
        'javascript-actions' => {
                override => 0,
                default  => [0],
        },

        # Syntax highlighting support.  This is based on Daniel Svensson's
        # and Sham Chukoury's work in gitweb-xmms2.git.
        # It requires the 'highlight' program present in $PATH,
        # and therefore is disabled by default.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'highlight'}{'default'} = [1];
        highlight => {
                sub      => sub { feature_bool('highlight', @_) },
                override => 0,
                default  => [0],
        },

        # Display remote heads in the heads list.
        #
        # To enable system wide have in $GITWEB_CONFIG
        # $feature{'remote_heads'}{'default'} = [1];
        # To have project specific config enable override in $GITWEB_CONFIG
        # $feature{'remote_heads'}{'override'} = 1;
        # and in project config gitweb.remote_heads = 0|1;
        remote_heads => {
                sub      => sub { feature_bool('remote_heads', @_) },
                override => 0,
                default  => [0],
        },
);
508
# Return the value (a list) of the feature called $name, or nothing if
# %feature has no such entry.
#
# The site-wide defaults are returned unless the feature allows overriding
# and a project is selected ($git_dir is defined); in that case the
# feature-sub is called with the defaults and its result is returned.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $entry    = $feature{$name};
        my $sub      = $entry->{'sub'};
        my $override = $entry->{'override'};
        my @defaults = @{ $entry->{'default'} };

        # project specific override is possible only if we have project
        our $git_dir; # global variable, declared later
        return @defaults if !$override || !defined $git_dir;

        unless (defined $sub) {
                warn "feature $name is not overridable";
                return @defaults;
        }
        return $sub->(@defaults);
}
527
# Convenience wrapper that yields only the first element of a feature's
# value, which is what "is this feature enabled?" checks need.
# It lets you write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# in place of
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
        my @feature_value = gitweb_get_feature(@_);
        return (@feature_value)[0];
}
542
543
# Feature-sub for boolean features.
#
# $key is the name of the project configuration variable to read; the
# remaining arguments are the feature's default options.  The variable is
# read with git_get_project_config($key, '--bool').
#
# Returns a one-element list:
#   - the first default option when the project does not set the variable,
#   - 1 when the project value is 'true',
#   - 0 when it is 'false' or anything else.
sub feature_bool {
        my ($key, @defaults) = @_;
        my ($val) = git_get_project_config($key, '--bool');

        return ($defaults[0]) unless defined $val;
        return (1) if $val eq 'true';

        # 'false', and explicitly also any unexpected value: previously the
        # latter fell off the end of the sub and returned whatever the last
        # comparison happened to evaluate to (a false value)
        return (0);
}
556
# Feature-sub for 'snapshot': takes the default list of formats and returns
# the list of formats to offer for the current project.
sub feature_snapshot {
        my @defaults = @_;

        my ($configured) = git_get_project_config('snapshot');

        # nothing (or a false value) configured: keep the defaults
        return @defaults unless $configured;

        # "none" turns snapshots off; otherwise the value is a list of
        # formats separated by commas and/or whitespace
        my @formats;
        @formats = split(/\s*[,\s]\s*/, $configured)
                unless $configured eq 'none';
        return @formats;
}
568
# Feature-sub for 'patches': the project's gitweb.patches value (read with
# --int) wins when git_get_project_config() returns anything; otherwise the
# first default option is returned.
sub feature_patches {
        my ($default_limit) = @_;

        my @configured = (git_get_project_config('patches', '--int'));
        return @configured if @configured;

        return ($default_limit);
}
578
# Feature-sub for 'avatar': returns what git_get_project_config('avatar')
# yields for the project, falling back to the default options when that is
# an empty list.
sub feature_avatar {
        my @configured = (git_get_project_config('avatar'));

        return @configured if @configured;
        return @_;
}
584
# Tell whether $dir has a usable HEAD.
#
# A plain -e test on HEAD is fragile for repositories that were initialized
# a long time ago (i.e. HEAD is a symlink) and were then pack-ref'ed and
# pruned, so a symlink pointing into refs/heads/ is accepted as well, even
# when its target does not exist.
sub check_head_link {
        my ($dir) = @_;
        my $head = "$dir/HEAD";

        return 1 if -e $head;
        return (-l $head && readlink($head) =~ m{^refs/heads/});
}
594
# Decide whether the repository in $dir may be shown.  All of these must
# hold:
#   - $dir has a usable HEAD (check_head_link),
#   - $export_ok is unset, or the file it names exists inside $dir,
#   - $export_auth_hook is unset, or the hook returns true for $dir.
# The checks run in this order and stop at the first one that fails.
sub check_export_ok {
        my ($dir) = @_;

        my $has_head = check_head_link($dir);
        return $has_head unless $has_head;

        my $marker_ok = (!$export_ok || -e "$dir/$export_ok");
        return $marker_ok unless $marker_ok;

        return (!$export_auth_hook || $export_auth_hook->($dir));
}
601
# Normalize a list of snapshot format names:
#   - alternate names are translated via %known_snapshot_format_aliases
#     (backward compatibility),
#   - unsupported (unknown) formats are filtered out, as are formats that
#     are marked 'disabled' in %known_snapshot_formats.
# Returns the resulting list of format names.
sub filter_snapshot_fmts {
        my @fmts = @_;

        @fmts = map {
                exists $known_snapshot_format_aliases{$_} ?
                       $known_snapshot_format_aliases{$_} : $_} @fmts;

        # Legacy aliases translate to undef (they have no supported
        # counterpart).  Drop those first, so that undef is never used as
        # a hash key, which would trigger "uninitialized value" warnings.
        @fmts = grep {
                defined $_ &&
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}} @fmts;

        return @fmts;
}
614
615 # If this is set to a code reference, that code is run once per request,
616 # which allows updating configuration that changes with each request
617 # while the rest of the config file is run only once.
618 #
619 # Otherwise, if it is false then gitweb processes the config file only once;
620 # if it is true then the gitweb config file is run for each request.
621 our $per_request_config = 1;
622
our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);

# Locate and run the gitweb configuration file.
#
# The per-instance file ($GITWEB_CONFIG) is preferred; the system-wide file
# ($GITWEB_CONFIG_SYSTEM) is used only when the former does not exist.  Each
# location comes from the environment variable of the same name, falling
# back to the built-in value.  Errors raised while running the config file
# are fatal.
sub evaluate_gitweb_config {
        our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);

        $GITWEB_CONFIG        = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";

        # only the first config file that exists is run
        for my $config_file ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                next unless -e $config_file;

                do $config_file;
                # die if there are errors parsing config file
                die $@ if $@;
                last;
        }
}
636
# Get loadavg of system, to compare against $maxload.
# Currently it requires '/proc/loadavg' to be present and readable; if the
# load cannot be determined, 0 is returned, which means no load checking.
sub get_loadavg {
        # open() fails when the file is missing or unreadable, so a separate
        # existence test is not needed
        open my $fd, '<', '/proc/loadavg'
                or return 0;
        my $line = <$fd>;
        close $fd;

        # nothing could be read: treat the load as unknown rather than
        # passing undef to split()
        return 0 unless defined $line;

        # The first three columns measure CPU and IO utilization of the last one,
        # five, and 10 minute periods.  The fourth column shows the number of
        # currently running processes and the total number of processes in the m/n
        # format.  The last column displays the last process ID used.
        my @load = split(/\s+/, $line);
        return $load[0] || 0;

        # additional checks for load average should go here for things that
        # don't export /proc/loadavg
}
658
# version of the core git binary
our $git_version;

# Run "$GIT --version" and store the reported version in $git_version
# ("unknown" when the output has no "git version ..." line).  The call is
# counted in $number_of_git_cmds.
sub evaluate_git_version {
        my $version_output = qx("$GIT" --version);
        our $git_version =
                ($version_output =~ m/git version (.*)$/) ? $1 : "unknown";
        $number_of_git_cmds++;
}
665
# Reject the request through die_error() with a 503 status when load
# checking is enabled ($maxload is defined) and the current load average
# is above $maxload.
sub check_loadavg {
        die_error(503, "The load average on the server is too high")
                if defined $maxload && get_loadavg() > $maxload;
}
671
672 # ======================================================================
673 # input validation and dispatch
674
# Input parameters can come from several sources (presently, CGI and
# PATH_INFO).  They are all gathered in %input_params during validation, so
# that later users (e.g. href()) need not care where a parameter came from.

our %input_params = ();

# %input_params is keyed by the long parameter name.  The href subroutine
# also needs to turn parameters into their CGI equivalent, and since that
# is the most frequent use, the mapping is stored as long name -> CGI key
# rather than the other way round.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.
#
# The list holds (long name, CGI key) pairs, one pair per line.  The
# 'javascript' pair must stay the last entry (for manipulation from
# JavaScript).

our @cgi_param_mapping = qw(
        project            p
        action             a
        file_name          f
        file_parent        fp
        hash               h
        hash_parent        hp
        hash_base          hb
        hash_parent_base   hpb
        page               pg
        order              o
        searchtext         s
        searchtype         st
        snapshot_format    sf
        extra_options      opt
        search_use_regexp  sr
        javascript         js
);
our %cgi_param_mapping = @cgi_param_mapping;
710
# Dispatch table of the possible actions, also used for validation:
# action name => subroutine implementing it.
our %actions = (
        blame             => \&git_blame,
        blame_incremental => \&git_blame_incremental,
        blame_data        => \&git_blame_data,
        blobdiff          => \&git_blobdiff,
        blobdiff_plain    => \&git_blobdiff_plain,
        blob              => \&git_blob,
        blob_plain        => \&git_blob_plain,
        commitdiff        => \&git_commitdiff,
        commitdiff_plain  => \&git_commitdiff_plain,
        commit            => \&git_commit,
        forks             => \&git_forks,
        heads             => \&git_heads,
        history           => \&git_history,
        log               => \&git_log,
        patch             => \&git_patch,
        patches           => \&git_patches,
        remotes           => \&git_remotes,
        rss               => \&git_rss,
        atom              => \&git_atom,
        search            => \&git_search,
        search_help       => \&git_search_help,
        shortlog          => \&git_shortlog,
        summary           => \&git_summary,
        tag               => \&git_tag,
        tags              => \&git_tags,
        tree              => \&git_tree,
        snapshot          => \&git_snapshot,
        object            => \&git_object,
        # those below don't need $project
        opml              => \&git_opml,
        project_list      => \&git_project_list,
        project_index     => \&git_project_index,
);
746
# Allowed extra_options: option => list of the commands (actions) that
# accept it.
our %allowed_options = (
        '--no-merges' => ['rss', 'atom', 'log', 'shortlog', 'history'],
);
752
# Copy the CGI parameters into %input_params, keyed by long parameter name.
#
# Every value is a single value except for 'opt', which may be given more
# than once and is therefore stored as an array reference.  A list of
# multi-valued parameters would be the general solution, but for the time
# being 'opt' is the only one, so it is simply singled out.
sub evaluate_query_params {
        our $cgi;

        for my $name (keys %cgi_param_mapping) {
                my $symbol = $cgi_param_mapping{$name};

                $input_params{$name} = ($symbol eq 'opt')
                        ? [ $cgi->param($symbol) ]
                        : scalar $cgi->param($symbol);
        }
}
768
# now read PATH_INFO and update the parameter list for missing parameters
#
# The global $path_info is consumed from the left: first the project
# (the longest leading path accepted by check_head_link()), then an
# optional action name, then an optional
#   [$hash_parent_base[:$file_parent]..]$hash[:$file_name]
# specification.  Values found are stored in %input_params, never
# overwriting an entry that is already set.  Nothing is done if the
# project was given in the query string, and only the project is filled in
# if the query string already carries an action.
sub evaluate_path_info {
	return if defined $input_params{'project'};
	return if !$path_info;
	$path_info =~ s,^/+,,;
	return if !$path_info;

	# find which part of PATH_INFO is project: drop trailing path
	# components until what remains is accepted by check_head_link()
	my $project = $path_info;
	$project =~ s,/+$,,;
	while ($project && !check_head_link("$projectroot/$project")) {
		$project =~ s,/*[^/]*$,,;
	}
	return unless $project;
	$input_params{'project'} = $project;

	# do not change any parameters if an action is given using the query string
	return if $input_params{'action'};
	$path_info =~ s,^\Q$project\E/*,,;

	# next, check if we have an action
	my $action = $path_info;
	$action =~ s,/.*$,,;
	if (exists $actions{$action}) {
		# quote the name so that it is always matched literally
		$path_info =~ s,^\Q$action\E/*,,;
		$input_params{'action'} = $action;
	}

	# list of actions that want hash_base instead of hash, but can have no
	# pathname (f) parameter
	my @wants_base = (
		'tree',
		'history',
	);

	# we want to catch, among others
	# [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
	my ($parentrefname, $parentpathname, $refname, $pathname) =
		($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

	# first, analyze the 'current' part
	if (defined $pathname) {
		# we got "branch:filename" or "branch:dir/"
		# we could use git_get_type(branch:pathname), but:
		# - it needs $git_dir
		# - it does a git() call
		# - the convention of terminating directories with a slash
		#   makes it superfluous
		# - embedding the action in the PATH_INFO would make it even
		#   more superfluous
		$pathname =~ s,^/+,,;
		if (!$pathname || substr($pathname, -1) eq "/") {
			$input_params{'action'} ||= "tree";
			$pathname =~ s,/$,,;
		} else {
			# the default action depends on whether we had parent info
			# or not
			if ($parentrefname) {
				$input_params{'action'} ||= "blobdiff_plain";
			} else {
				$input_params{'action'} ||= "blob_plain";
			}
		}
		$input_params{'hash_base'} ||= $refname;
		$input_params{'file_name'} ||= $pathname;
	} elsif (defined $refname) {
		# we got "branch". In this case we have to choose if we have to
		# set hash or hash_base.
		#
		# Most of the actions without a pathname only want hash to be
		# set, except for the ones specified in @wants_base that want
		# hash_base instead. It should also be noted that hand-crafted
		# links having 'history' as an action and no pathname or hash
		# set will fail, but that happens regardless of PATH_INFO.
		if (defined $parentrefname) {
			# if there is parent let the default be 'shortlog' action
			# (for http://git.example.com/repo.git/A..B links); if there
			# is no parent, dispatch will detect type of object and set
			# action appropriately if required (if action is not set)
			$input_params{'action'} ||= "shortlog";
		}
		if ($input_params{'action'} &&
		    grep { $_ eq $input_params{'action'} } @wants_base) {
			$input_params{'hash_base'} ||= $refname;
		} else {
			$input_params{'hash'} ||= $refname;
		}
	}

	# next, handle the 'parent' part, if present
	if (defined $parentrefname) {
		# a missing pathspec defaults to the 'current' filename, allowing e.g.
		# someproject/blobdiff/oldrev..newrev:/filename
		if ($parentpathname) {
			$parentpathname =~ s,^/+,,;
			$parentpathname =~ s,/$,,;
			$input_params{'file_parent'} ||= $parentpathname;
		} else {
			$input_params{'file_parent'} ||= $input_params{'file_name'};
		}
		# we assume that hash_parent_base is wanted if a path was specified,
		# or if the action wants hash_base instead of hash; the action can
		# still be unset here (e.g. PATH_INFO of the form "A.."), so it is
		# only compared when defined
		my $current_action = $input_params{'action'};
		if (defined $input_params{'file_parent'} ||
		    (defined $current_action &&
		     grep { $_ eq $current_action } @wants_base)) {
			$input_params{'hash_parent_base'} ||= $parentrefname;
		} else {
			$input_params{'hash_parent'} ||= $parentrefname;
		}
	}

	# for the snapshot action, we allow URLs in the form
	# $project/snapshot/$hash.ext
	# where .ext determines the snapshot and gets removed from the
	# passed $refname to provide the $hash.
	#
	# To be able to tell that $refname includes the format extension, we
	# require the following two conditions to be satisfied:
	# - the hash input parameter MUST have been set from the $refname part
	#   of the URL (i.e. they must be equal)
	# - the snapshot format MUST NOT have been defined already (e.g. from
	#   CGI parameter sf)
	# It's also useless to try any matching unless $refname has a dot,
	# so we check for that too
	if (defined $input_params{'action'} &&
	    $input_params{'action'} eq 'snapshot' &&
	    defined $refname && index($refname, '.') != -1 &&
	    defined $input_params{'hash'} &&
	    $refname eq $input_params{'hash'} &&
	    !defined $input_params{'snapshot_format'}) {
		# We loop over the known snapshot formats, checking for
		# extensions. Allowed extensions are both the defined suffix
		# (which includes the initial dot already) and the snapshot
		# format key itself, with a prepended dot.
		#
		# The loop runs over keys() rather than each(): it is left
		# early via 'last', and an abandoned each() iterator would stay
		# half-advanced for the next request served by this process.
		foreach my $fmt (keys %known_snapshot_formats) {
			my $suffix = $known_snapshot_formats{$fmt}{'suffix'};
			my $hash = $refname;
			next unless $hash =~ s/(\Q$suffix\E|\Q.$fmt\E)$//;
			my $sfx = $1;
			# a valid suffix was found, so set the snapshot format
			# and reset the hash parameter
			$input_params{'snapshot_format'} = $fmt;
			$input_params{'hash'} = $hash;
			# we also set the format suffix to the one requested
			# in the URL: this way a request for e.g. .tgz returns
			# a .tgz instead of a .tar.gz
			$known_snapshot_formats{$fmt}{'suffix'} = $sfx;
			last;
		}
	}
}
919
# Validated request parameters; (re)assigned on every request by
# evaluate_and_validate_params().
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp);

# Copy the request parameters from %input_params into the package
# variables declared above, checking each value that is present.  A value
# failing its check is reported through die_error() with the HTTP status
# given at the call (400, 403 or 404).
sub evaluate_and_validate_params {
	our $action = $input_params{'action'};
	if (defined $action && !validate_action($action)) {
		die_error(400, "Invalid action parameter");
	}

	# parameters which are pathnames
	our $project = $input_params{'project'};
	if (defined $project && !validate_project($project)) {
		# clear it before reporting, so the invalid name is not used
		undef $project;
		die_error(404, "No such project");
	}

	our $file_name = $input_params{'file_name'};
	if (defined $file_name && !validate_pathname($file_name)) {
		die_error(400, "Invalid file parameter");
	}

	our $file_parent = $input_params{'file_parent'};
	if (defined $file_parent && !validate_pathname($file_parent)) {
		die_error(400, "Invalid file parent parameter");
	}

	# parameters which are refnames
	our $hash = $input_params{'hash'};
	if (defined $hash && !validate_refname($hash)) {
		die_error(400, "Invalid hash parameter");
	}

	our $hash_parent = $input_params{'hash_parent'};
	if (defined $hash_parent && !validate_refname($hash_parent)) {
		die_error(400, "Invalid hash parent parameter");
	}

	our $hash_base = $input_params{'hash_base'};
	if (defined $hash_base && !validate_refname($hash_base)) {
		die_error(400, "Invalid hash base parameter");
	}

	# extra_options is normally an array reference filled in from the CGI
	# 'opt' parameter (empty when the parameter is absent); fall back to
	# an empty list if the entry is missing altogether
	our @extra_options = @{ $input_params{'extra_options'} || [] };
	foreach my $opt (@extra_options) {
		if (not exists $allowed_options{$opt}) {
			die_error(400, "Invalid option parameter");
		}
		# an option is only acceptable together with one of the actions
		# listed for it; without any action it cannot be accepted
		if (!defined $action ||
		    !grep { $_ eq $action } @{$allowed_options{$opt}}) {
			die_error(400, "Invalid option parameter for this action");
		}
	}

	our $hash_parent_base = $input_params{'hash_parent_base'};
	if (defined $hash_parent_base && !validate_refname($hash_parent_base)) {
		die_error(400, "Invalid hash parent base parameter");
	}

	# other parameters
	our $page = $input_params{'page'};
	if (defined $page && $page =~ m/[^0-9]/) {
		die_error(400, "Invalid page parameter");
	}

	our $searchtype = $input_params{'searchtype'};
	if (defined $searchtype && $searchtype =~ m/[^a-z]/) {
		die_error(400, "Invalid searchtype parameter");
	}

	our $search_use_regexp = $input_params{'search_use_regexp'};

	our $searchtext = $input_params{'searchtext'};
	# reset explicitly: a plain 'our $search_regexp;' would keep the value
	# of the previous request when one process serves several requests
	our $search_regexp = undef;
	if (defined $searchtext) {
		if (length($searchtext) < 2) {
			die_error(403, "At least two characters are required for search parameter");
		}
		if ($search_use_regexp) {
			$search_regexp = $searchtext;
			# compile the pattern once here, so that a malformed regexp
			# is reported as a bad request instead of failing later
			if (!eval { qr/$search_regexp/; 1; }) {
				# strip the "at FILE line N" location from the message
				(my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
				# NOTE(review): the third die_error() argument is taken
				# to be pre-escaped HTML, as in handle_errors_html()
				die_error(400, "Invalid search regexp", esc_html($error));
			}
		} else {
			$search_regexp = quotemeta $searchtext;
		}
	}
}
1022
# path to the current git repository
our $git_dir;

# Point $git_dir at the repository of the requested project.  When no
# project is set, $git_dir is left untouched.
sub evaluate_git_dir {
	our $git_dir;
	if ($project) {
		$git_dir = "$projectroot/$project";
	}
}
1028
our (@snapshot_fmts, $git_avatar);

# Read the 'snapshot' and 'avatar' features and store the result in
# @snapshot_fmts and $git_avatar.
sub configure_gitweb_features {
	our (@snapshot_fmts, $git_avatar);

	# list of supported snapshot formats
	@snapshot_fmts = gitweb_get_feature('snapshot');
	@snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

	# The avatar feature must name a known provider whose dependencies
	# are available; otherwise $git_avatar is reset to the empty string.
	($git_avatar) = gitweb_get_feature('avatar');
	if ($git_avatar eq 'gravatar') {
		# gravatar needs Digest::MD5
		eval { require Digest::MD5; 1; }
			or $git_avatar = '';
	} elsif ($git_avatar ne 'picon') {
		# picon has no dependencies; anything else is unknown
		$git_avatar = '';
	}
}
1048
# custom error handler: 'die <message>' is Internal Server Error
#
# Installed through CGI::Carp::set_message(); receives the message
# already HTML escaped.
sub handle_errors_html {
	my ($escaped_msg) = @_;

	# Switch back to a plain-text message first: should die_error itself
	# fail, this handler must not be entered again (infinite loop).
	set_message("Error occured when inside die_error:\n$escaped_msg");

	# The handler set via set_message is called _after_ the HTTP headers
	# were written, so die_error must not emit them, and it must not try
	# to jump out as it does when called normally.
	die_error(undef, undef, $escaped_msg,
	          -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1063
# dispatch
#
# Choose a default for $action when the request did not name one, check
# that the action is known and has the project it needs, then call the
# subroutine registered for it in %actions.
sub dispatch {
	if (!defined $action) {
		if (defined $hash) {
			# the action is named after the type of the object
			# NOTE(review): git_get_type() is assumed to return a false
			# value when the object cannot be resolved -- confirm
			$action = git_get_type($hash);
			$action or die_error(404, "Object does not exist");
		} elsif (defined $hash_base && defined $file_name) {
			$action = git_get_type("$hash_base:$file_name");
			$action or die_error(404, "File or directory does not exist");
		} elsif (defined $project) {
			$action = 'summary';
		} else {
			$action = 'project_list';
		}
	}
	if (!defined($actions{$action})) {
		die_error(400, "Unknown action");
	}
	# only these three actions can run without a project
	if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
	    !$project) {
		die_error(400, "Project needed");
	}
	$actions{$action}->();
}
1086
# Restart the per-request bookkeeping: take a fresh timestamp into $t0
# (only if $t0 is in use, i.e. defined) and zero the git command counter.
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	if (defined $t0) {
		$t0 = [ gettimeofday() ];
	}
	$number_of_git_cmds = 0;
}
1092
our $first_request = 1;

# Serve one request: (re)load configuration as needed, collect and
# validate the parameters, then dispatch to the selected action.
sub run_request {
	reset_timer();

	evaluate_uri();

	# configuration and git version are read once, on the first request
	if ($first_request) {
		evaluate_gitweb_config();
		evaluate_git_version();
	}

	# $per_request_config is either a subroutine to run on every request,
	# or a true value asking to re-read the config on later requests
	if (ref($per_request_config) eq 'CODE') {
		$per_request_config->();
	} elsif ($per_request_config && !$first_request) {
		evaluate_gitweb_config();
	}
	check_loadavg();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list ||= $projectroot;

	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1123
# by default the request loop ends after the first request
our $is_last_request = sub { return 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
# name of the class used to create the per-request CGI object
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: request objects come from CGI::Fast and
# the request loop keeps going for up to 100 requests.
sub configure_as_fcgi {
	our ($CGI, $is_last_request);

	require CGI::Fast;
	$CGI = 'CGI::Fast';

	# let each child service 100 requests
	my $served = 0;
	$is_last_request = sub {
		$served += 1;
		return $served > 100;
	};
}
# Decide how to run from the script name and the command line:
# a name ending in ".fcgi", or the --fastcgi option, selects FastCGI;
# --nproc=N installs hooks driving an FCGI::ProcManager with N processes
# (silently ignored if that module cannot be loaded).
sub evaluate_argv {
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return unless (@ARGV);

	# handler for --nproc, called by Getopt::Long with option name and value
	my $use_proc_manager = sub {
		my ($opt_name, $n_processes) = @_;
		return unless eval { require FCGI::ProcManager; 1; };
		my $manager = FCGI::ProcManager->new({
			n_processes => $n_processes,
		});
		our $pre_listen_hook    = sub { $manager->pm_manage()        };
		our $pre_dispatch_hook  = sub { $manager->pm_pre_dispatch()  };
		our $post_dispatch_hook = sub { $manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i'      => $use_proc_manager,
	);
}
1158
# Main loop: read the command line, then create a request object and
# serve it, repeating until $is_last_request says to stop or no further
# request object can be created.  The optional hooks are called before
# listening and around each request.
sub run {
	evaluate_argv();

	$first_request = 1;
	if ($pre_listen_hook) {
		$pre_listen_hook->();
	}

 REQUEST:
	while ($cgi = $CGI->new()) {
		if ($pre_dispatch_hook) {
			$pre_dispatch_hook->();
		}

		run_request();

		if ($post_dispatch_hook) {
			$post_dispatch_hook->();
		}
		$first_request = 0;

		if ($is_last_request->()) {
			last REQUEST;
		}
	}

 DONE_GITWEB:
	1;
}
1183
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI) there is a caller
# to return to; a pure CGI script serving a single request just exits.
return if defined caller;
exit;
1194
## ======================================================================
## action links

# Build a gitweb URL from named parameters.  Parameter names are those of
# %cgi_param_mapping (project, action, hash, file_name, ...); 'project'
# defaults to the current $project.  With the 'pathinfo' feature (or
# -path_info => 1) as many parameters as possible are put into the path
# part of the URL, the remaining ones into the query string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# Returns the URL as a string.
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	# implicit -replay, must be first of implicit params
	$params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		# take over every parameter of the current request that the
		# caller did not mention
		while (my ($name, $symbol) = each %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_path_info($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot;
		# the action may legitimately be missing, so test for that first
		my $is_snapshot = defined $params{'action'} &&
		                  $params{'action'} eq 'snapshot';

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_path_info($params{'action'})
				unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
			|| $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_path_info($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# a name containing ".." stays in the query
						# string: ".." is the separator in PATH_INFO
						$href .= ":/".esc_path_info($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_path_info($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_path_info($params{'hash_base'});
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_path_info($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_path_info($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly; walking the array form of the
	# mapping keeps the order of parameters in the query string fixed
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	# final transformation: trailing spaces must be escaped (URI-encoded)
	$href =~ s/(\s+)$/CGI::escape($1)/e;

	if ($params{-anchor}) {
		$href .= "#".esc_param($params{-anchor});
	}

	return $href;
}
1327
1328
## ======================================================================
## validation, quoting/unquoting and escaping

# Return the given action name if it is a key of %actions, undef otherwise
# (also for a missing or false argument).
sub validate_action {
	my ($input) = @_;
	return undef unless $input;
	return exists $actions{$input} ? $input : undef;
}
1337
# Return the project name if it is acceptable, undef otherwise.  A project
# is acceptable when its name is a valid pathname, it is a directory below
# $projectroot, check_export_ok() accepts it and, with $strict_export set,
# project_in_list() accepts it as well.
sub validate_project {
	my ($input) = @_;
	return undef unless $input;
	return undef unless validate_pathname($input);

	my $dir = "$projectroot/$input";
	return undef unless -d $dir;
	return undef unless check_export_ok($dir);
	return undef if $strict_export && !project_in_list($input);

	return $input;
}
1349
# Return the pathname if it is safe to use, undef otherwise (also for a
# missing or false argument).
sub validate_pathname {
	my ($input) = @_;
	return undef unless $input;

	# Reject empty, '.' and '..' path elements wherever they occur: at the
	# beginning, at the end, or between slashes.  The empty element also
	# covers doubled, leading and trailing slashes.
	return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

	# no null characters
	return undef if $input =~ m!\0!;

	return $input;
}
1365
# Return the ref name if it is acceptable, undef otherwise (also for a
# missing or false argument).
sub validate_refname {
	my ($input) = @_;
	return undef unless $input;

	# textual hashes are O.K.
	return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

	# it must be correct pathname
	$input = validate_pathname($input);
	return undef unless $input;

	# restrictions on ref name according to git-check-ref-format
	return undef if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

	return $input;
}
1382
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# A string that is already in character form is returned unchanged.
# Octets that are not valid UTF-8 are decoded using $fallback_encoding
# instead.  Returns undef for an undefined argument.
sub to_utf8 {
	my $str = shift;
	return undef unless defined $str;

	# utf8::valid() cannot be used to detect UTF-8 input: it is true for
	# any byte string.  utf8::decode() itself reports whether the octets
	# were well-formed UTF-8 (and decodes them in place if so), while
	# utf8::is_utf8() guards against decoding a string a second time.
	if (utf8::is_utf8($str) || utf8::decode($str)) {
		return $str;
	} else {
		return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
	}
}
1396
# URI-escape a query parameter value.  The slash is deliberately left
# alone even though that is not strictly correct: quoted slashes look too
# horrible in bookmarks.  Spaces become '+'.  Returns undef for undef.
sub esc_param {
	my ($str) = @_;
	defined $str or return undef;

	$str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$str =~ tr/ /+/;
	return $str;
}
1406
# URI-escape a string for use in the path_info part of a URL; the quoting
# rules differ slightly from those for parameters.  Returns undef for undef.
sub esc_path_info {
	my ($str) = @_;
	defined $str or return undef;

	# path_info doesn't treat '+' as space (specially), but '?' must be escaped
	$str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

	return $str;
}
1417
# URI-escape a whole URL: characters that structure a URL (such as '?',
# '&', '=' and ';') cannot be quoted here.  Spaces become '+'.
# Returns undef for undef.
sub esc_url {
	my ($str) = @_;
	defined $str or return undef;

	$str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$str =~ tr/ /+/;
	return $str;
}
1426
# quote unsafe characters in HTML attributes
sub esc_attr {
	my @args = @_;

	# for XHTML conformance escaping '"' to '&quot;' is not enough,
	# so attributes get the same treatment as any other HTML text
	return esc_html(@args);
}
1433
# Escape a string for inclusion in HTML: convert it with to_utf8(), escape
# HTML special characters, and make control characters other than tab
# visible via quot_cec().  With the option -nbsp => 1 spaces are turned
# into non-breaking spaces.  Returns undef for undef.
sub esc_html {
	my ($str, %opts) = @_;
	return undef unless defined $str;

	$str = to_utf8($str);
	$str = $cgi->escapeHTML($str);
	$str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	# tabs are kept as they are
	$str =~ s|([[:cntrl:]])|(($1 eq "\t") ? $1 : quot_cec($1))|eg;
	return $str;
}
1449
# Escape a filename for inclusion in HTML: convert it with to_utf8(),
# escape HTML special characters, and make every control character (tab
# included) visible via quot_cec().  With the option -nbsp => 1 spaces are
# turned into non-breaking spaces.  Returns undef for undef.
sub esc_path {
	my ($str, %opts) = @_;
	return undef unless defined $str;

	$str = to_utf8($str);
	$str = $cgi->escapeHTML($str);
	$str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$str =~ s|([[:cntrl:]])|quot_cec($1)|eg;
	return $str;
}
1465
# Make control characters "printable", using character escape codes (CEC)
#
# Takes a single character, followed by options.  Characters with a
# well-known escape sequence are shown as that sequence (e.g. '\n'), any
# other as a backslash followed by two hexadecimal digits.  The result is
# wrapped in <span class="cntrl">...</span> unless -nohtml => 1 is given.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# zero-pad the hex code: a plain %2x pads with a space, which turned
	# e.g. chr(1) into '\ 1'
	my $chr = ( (exists $es{$cntrl})
		    ? $es{$cntrl}
		    : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1490
# Alternative to quot_cec: represent a control character by a numeric
# character reference into the Unicode "control pictures" block (code
# point 0x2400 plus the character code), the Unicode "printable
# representation" (PR).  The result is wrapped in
# <span class="cntrl">...</span> unless -nohtml => 1 is given.
sub quot_upr {
	my ($cntrl, %opts) = @_;

	my $entity = sprintf('&#%04d;', 0x2400+ord($cntrl));
	return $opts{-nohtml}
		? $entity
		: "<span class=\"cntrl\">$entity</span>";
}
1504
# git may return quoted and escaped filenames; undo that quoting.
#
# A name wrapped in double quotes loses the quotes, and every backslash
# sequence inside it is replaced: one to three octal digits give the
# character with that code, the letters t n r f b a e v give the matching
# control character, and any other escaped character stands for itself.
# A name that is not wrapped in double quotes is returned as it is.
sub unquote {
	my ($name) = @_;

	# translate the text that followed a single backslash
	sub unq {
		my ($esc) = @_;

		# octal char sequence
		return chr(oct($esc))
			if $esc =~ m/^[0-7]{1,3}$/;

		my %es = ( # character escape codes, aka escape sequences
			't' => "\t",   # tab            (HT, TAB)
			'n' => "\n",   # newline        (NL)
			'r' => "\r",   # return         (CR)
			'f' => "\f",   # form feed      (FF)
			'b' => "\b",   # backspace      (BS)
			'a' => "\a",   # alarm (bell)   (BEL)
			'e' => "\e",   # escape         (ESC)
			'v' => "\013", # vertical tab   (VT)
		);

		# C escape sequence if known, otherwise a quoted ordinary character
		return exists $es{$esc} ? $es{$esc} : $esc;
	}

	# nothing to do unless the whole name is quoted
	return $name
		unless $name =~ m/^"(.*)"$/;

	my $inner = $1;
	$inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $inner;
}
1540
# escape tabs (convert tabs to spaces)
#
# Each tab is replaced, left to right, by as many spaces as are needed to
# reach the next column that is a multiple of 8.
sub untabify {
	my ($text) = @_;

	my $tab_at;
	while (($tab_at = index($text, "\t")) >= 0) {
		# between 1 and 8 spaces, depending on where the tab sits
		my $width = 8 - $tab_at % 8;
		substr($text, $tab_at, 1, ' ' x $width);
	}

	return $text;
}
1554
# Count the entries returned by git_get_projects_list() whose 'path' equals
# $project; the result is 0 (false) when the list is empty or has no match.
sub project_in_list {
	my ($project) = @_;

	my @projects = git_get_projects_list();
	return 0 unless @projects;

	my $matches = grep { $_->{'path'} eq $project } @projects;
	return $matches;
}
1560
1561 ## ----------------------------------------------------------------------
1562 ## HTML aware string manipulation
1563
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Arguments: $str, $len, optional $add_len (default 10) and optional $where
# ('left', 'center' or 'right', default 'right'), which selects the part of
# the string that is replaced by the ellipsis.
# Returns the string after to_utf8(), chopped if that makes it shorter.  If
# the string cannot be split as described (for example, the part left over
# in 'center' mode is too short), it is returned unchopped.
sub chop_str {
	my $str = shift;
	my $len = shift;
	my $add_len = shift || 10;
	my $where = shift || 'right'; # 'left' | 'center' | 'right'

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# allow only $len chars, but don't cut a word if it would fit in $add_len
	# if it doesn't fit, cut it if it's still longer than the dots we would add
	# remove chopped character entities entirely

	# when chopping in the middle, distribute $len into left and right part
	# return early if chopping wouldn't make string shorter
	if ($where eq 'center') {
		return $str if ($len + 5 >= length($str)); # filler is length 5
		$len = int($len/2);
	} else {
		return $str if ($len + 4 >= length($str)); # filler is length 4
	}

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	# Every match below is checked: after a failed match $1 and $2 still
	# hold the captures of the previous successful one, and using them
	# would glue unrelated pieces together.
	if ($where eq 'left') {
		my ($lead, $body) = $str =~ m/^(.*?)($begre)$/
			or return $str;
		if (length($lead) > 4) {
			$lead = " ...";
		}
		return "$lead$body";

	} elsif ($where eq 'center') {
		my ($left, $rest) = $str =~ m/^($endre)(.*)$/
			or return $str;
		# fails when $rest is shorter than the right part we want to keep
		my ($mid, $right) = $rest =~ m/^(.*?)($begre)$/
			or return $str;
		if (length($mid) > 5) {
			$mid = " ... ";
		}
		return "$left$mid$right";

	} else {
		my ($body, $tail) = $str =~ m/^($endre)(.*)$/
			or return $str;
		if (length($tail) > 4) {
			$tail = "... ";
		}
		return "$body$tail";
	}
}
1623
# takes the same arguments as chop_str, but also wraps a <span> around the
# result with a title attribute if it does get chopped. Additionally, the
# string is HTML-escaped.
#
# The title attribute carries the full string with every control character
# replaced by '?'.
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);
	# chop_str() hands back the to_utf8() form of the string; convert the
	# original the same way so that the "was it chopped?" comparison and
	# the title attribute work on the same representation.
	$str = to_utf8($str);
	if ($chopped eq $str) {
		return esc_html($chopped);
	} else {
		$str =~ s/[[:cntrl:]]/?/g;
		return $cgi->span({-title=>$str}, esc_html($chopped));
	}
}
1638
1639 ## ----------------------------------------------------------------------
1640 ## functions returning short strings
1641
# CSS class for given age value (in seconds)
#
# "noage" for an undefined age, "age0" below two hours, "age1" below two
# days and "age2" for anything older.
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if $age < 60*60*2;
	return "age1"  if $age < 60*60*24*2;
	return "age2";
}
1656
# convert age in seconds to "nn units ago" string
#
# The largest unit of which the age holds more than two is used (a year
# counts as 365 days, a month as 365/12 days); the count is truncated to
# an integer.  Ages of two seconds or less give " right now".
sub age_string {
	my ($age) = @_;

	return int($age/60/60/24/365) . " years ago"
		if $age > 60*60*24*365*2;
	return int($age/60/60/24/(365/12)) . " months ago"
		if $age > 60*60*24*(365/12)*2;
	return int($age/60/60/24/7) . " weeks ago"
		if $age > 60*60*24*7*2;
	return int($age/60/60/24) . " days ago"
		if $age > 60*60*24*2;
	return int($age/60/60) . " hours ago"
		if $age > 60*60*2;
	return int($age/60) . " min ago"
		if $age > 60*2;
	return int($age) . " sec ago"
		if $age > 2;

	return " right now";
}
1688
# Extra file-type bit patterns (octal) used next to the Fcntl ones;
# S_IFGITLINK is what S_ISGITLINK() compares the file-type bits against.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1693
# submodule/subproject, a commit object reference
#
# True when the file-type bits of the numeric $mode equal S_IFGITLINK.
sub S_ISGITLINK {
	my ($mode) = @_;

	my $type_bits = ($mode & S_IFMT);
	return $type_bits == S_IFGITLINK;
}
1700
# convert file mode in octal to symbolic file mode string
#
# The argument is a string of octal digits.  Submodules, directories and
# symlinks each map to one fixed string; for regular files only the owner
# execute bit is looked at; everything else gives '----------'.
sub mode_str {
	my ($octal) = @_;
	my $mode = oct $octal;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
	return 'lrwxrwxrwx' if S_ISLNK($mode);

	if (S_ISREG($mode)) {
		# git cares only about the executable bit
		return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
	}

	return '----------';
}
1722
# convert file mode in octal to file type string
#
# An argument that is not made up of octal digits only is returned
# unchanged.  Otherwise the result is one of "submodule", "directory",
# "symlink", "file" or "unknown".
sub file_type {
	my ($mode) = @_;

	return $mode
		if $mode !~ m/^[0-7]+$/;

	my $bits = oct $mode;

	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT);
	return "symlink"   if S_ISLNK($bits);
	return "file"      if S_ISREG($bits);
	return "unknown";
}
1745
# convert file mode in octal to file type description string
#
# Like file_type(), except that a regular file with the owner execute bit
# set is reported as "executable".  An argument that is not made up of
# octal digits only is returned unchanged.
sub file_type_long {
	my ($mode) = @_;

	return $mode
		if $mode !~ m/^[0-7]+$/;

	my $bits = oct $mode;

	return "submodule" if S_ISGITLINK($bits);
	return "directory" if S_ISDIR($bits & S_IFMT);
	return "symlink"   if S_ISLNK($bits);

	if (S_ISREG($bits)) {
		return ($bits & S_IXUSR) ? "executable" : "file";
	}

	return "unknown";
}
1772
1773
1774 ## ----------------------------------------------------------------------
1775 ## functions returning short HTML fragments, or transforming HTML fragments
1776 ## which don't belong to other sections
1777
# format line of commit message.
#
# The line is HTML-escaped (spaces become &nbsp;), then every run of 8 to
# 40 hexadecimal digits standing on its own is turned into a link to the
# "object" action for that hash.
sub format_log_line_html {
	my ($text) = @_;

	# build the link for one hash-like word
	my $link_to_object = sub {
		my ($id) = @_;
		return $cgi->a({-href => href(action=>"object", hash=>$id),
			-class => "text"}, $id);
	};

	my $html = esc_html($text, -nbsp=>1);
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{$link_to_object->($1)}eg;

	return $html;
}
1790
# format marker of refs pointing to given object
#
# $refs maps object ids to array refs of ref names (e.g. "tags/v2.6.11" or
# "heads/next", with a trailing "^{}" on indirect refs); $id is the object
# to format.  Returns an HTML fragment, or "" when no ref points to $id.
# $refs is left unmodified.

# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	if (defined $refs->{$id}) {
		foreach my $stored_ref (@{$refs->{$id}}) {
			# Work on a copy: the loop variable is an alias for the element
			# of the caller's array, so stripping "^{}" in place would make
			# the ref look direct on any later call with the same $refs.
			my $ref = $stored_ref;

			# this code exploits the fact that non-lightweight tags are the
			# only indirect objects, and that they are the only objects for which
			# we want to use tag instead of shortlog as action
			my ($type, $name);
			my $indirect = ($ref =~ s/\^\{\}$//);
			# e.g. tags/v2.6.11 or heads/next
			if ($ref =~ m!^(.*?)s?/(.*)$!) {
				$type = $1;
				$name = $2;
			} else {
				$type = "ref";
				$name = $ref;
			}

			my $class = $type;
			$class .= " indirect" if $indirect;

			my $dest_action = "shortlog";

			if ($indirect) {
				$dest_action = "tag" unless $action eq "tag";
			} elsif ($action =~ /^(history|(short)?log)$/) {
				$dest_action = $action;
			}

			my $dest = "";
			$dest .= "refs/" unless $ref =~ m!^refs/!;
			$dest .= $ref;

			my $link = $cgi->a({
				-href => href(
					action=>$dest_action,
					hash=>$dest
				)}, $name);

			$markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
				$link . "</span>";
		}
	}

	if ($markers) {
		return ' <span class="refs">'. $markers . '</span>';
	} else {
		return "";
	}
}
1850
# format, perhaps shortened and with markers, title line
#
# Returns a link to $href with class "list subject", followed by $extra
# (if given).  When $short is shorter than $long the link shows $short and
# carries $long, with control characters replaced by '?', as its title;
# otherwise the link shows $long.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my @attrs = (-href => $href, -class => "list subject");
	my $shown = $long;

	if (length($short) < length($long)) {
		$shown = $short;
		$long =~ s/[[:cntrl:]]/?/g;
		push @attrs, -title => to_utf8($long);
	}

	return $cgi->a(+{ @attrs }, esc_html($shown)) . $extra;
}
1866
# Cache of avatar URLs, keyed by e-mail address, so that the URL for an
# address is computed only once per page.  This pays off in views that show
# the same address many times (e.g. shortlog).
# All avatar engines (picon_url and gravatar_url) share this one cache and
# may store in it whatever suits them.  Only one engine is used for any
# given page, so their entries cannot clash.
our %avatar_cache;
%avatar_cache = ();
1874
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
#
# The address is lower-cased first; the resulting URL is kept in
# %avatar_cache and reused on later calls for the same address.
sub picon_url {
	my $email = lc shift;

	return $avatar_cache{$email}
		if $avatar_cache{$email};

	my ($user, $domain) = split('@', $email);
	my $url =
		"http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
		"$domain/$user/" .
		"users+domains+unknown/up/single";

	$avatar_cache{$email} = $url;
	return $avatar_cache{$email};
}
1888
# Compute the gravatar url for a given email, if it's not in the cache already.
# Only the part of the URL before the size is cached, since that is the
# part that takes an MD5 digest to compute; the same cache entry then
# serves every requested $size.
sub gravatar_url {
	my $email = lc shift;
	my $size = shift;

	unless ($avatar_cache{$email}) {
		my $digest = Digest::MD5::md5_hex($email);
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" . $digest . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
1901
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
#
# Options: -size names an entry of %avatar_size (falling back to 'default');
# -pad_before / -pad_after put a &nbsp; before / after the image.
# Returns an <img> element, or "" when $git_avatar selects no known
# provider (or the provider yields no URL).
sub git_get_avatar {
	my ($email, %opts) = @_;

	my $pad_left  = $opts{-pad_before} ? "&nbsp;" : "";
	my $pad_right = $opts{-pad_after}  ? "&nbsp;" : "";

	$opts{-size} ||= 'default';
	my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

	# Other providers can be added by extending this chain.  If no variant
	# yields a URL, we assume avatars are completely disabled/unavailable.
	my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
		: $git_avatar eq 'picon' ? picon_url($email)
		: "";

	return "" unless $url;

	return $pad_left .
		qq{<img width="$size" class="avatar" src="} .
		esc_url($url) .
		qq{" alt="" />} .
		$pad_right;
}
1930
# Wrap $displaytext in a link that searches for commits by $author.
#
# $searchtype ('author' or 'committer') is passed on as the search type and
# picks the verb used in the link title.  When the 'search' feature is off,
# $displaytext is returned as it is.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;
	my $have_search = gitweb_check_feature('search');

	# nothing to link to without the search feature
	return $displaytext unless $have_search;

	my $performed = $searchtype eq 'author' ? "authored"
		: $searchtype eq 'committer' ? "committed"
		: "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype), class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
1953
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str).
#
# The result is <$tag class="author">...</$tag> around an author-search
# link that shows the avatar followed by the name.
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name   = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $link   = format_search_author($co->{'author_name'}, "author",
		$avatar . $name);

	return "<$tag class=\"author\">" . $link . "</$tag>";
}
1967
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# Everything after the "diff <kind> " prefix is replaced by the escaped
# file name(s) taken from $from and $to, linked where an 'href' is set.
# $diffinfo->{'nparents'} being true selects the combined-diff form (one
# name); otherwise the "a/<from> b/<to>" form is produced.
# Returns the line wrapped in <div class="diff header">.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $to->{'href'}
			? $cgi->a({-href => $to->{'href'}, -class => "path"},
				esc_path($to->{'file'}))
			: esc_path($to->{'file'}); # file was deleted (no href)

		return qq{<div class="diff header">$line</div>\n};
	}

	# "ordinary" diff
	$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
	$line .= $from->{'href'}
		? $cgi->a({-href => $from->{'href'}, -class => "path"},
			'a/' . esc_path($from->{'file'}))
		: 'a/' . esc_path($from->{'file'}); # file was added (no href)
	$line .= ' ';
	$line .= $to->{'href'}
		? $cgi->a({-href => $to->{'href'}, -class => "path"},
			'b/' . esc_path($to->{'file'}))
		: 'b/' . esc_path($to->{'file'}); # file was deleted

	return qq{<div class="diff header">$line</div>\n};
}
2003
# format extended diff header line, before patch itself
#
# $line is one extended header line; $diffinfo, $from and $to describe the
# patch it belongs to.  The function
#  - replaces the path of "copy|rename from|to" lines by a link to the file
#    (when the matching 'href' is set),
#  - appends the file type description to lines ending in a six-digit mode,
#  - rewrites "index" lines so that each hash is abbreviated to 7 characters
#    and linked; a side without 'href' is shown as seven zeros.
# Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
			esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
			esc_path($to->{'file'}));
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
			file_type_long($1) .
			')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		$line = 'index ';
		for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
			if ($from->{'href'}[$i]) {
				$line .= $cgi->a({-href=>$from->{'href'}[$i],
						-class=>"hash"},
					substr($diffinfo->{'from_id'}[$i],0,7));
			} else {
				$line .= '0' x 7;
			}
			# separator
			$line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
		}
		$line .= '..';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
				substr($diffinfo->{'to_id'},0,7));
		} else {
			$line .= '0' x 7;
		}

	# the two dots are literal, so they are escaped (a bare ".." would
	# accept any two characters between the hashes)
	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff
		my ($from_link, $to_link);
		if ($from->{'href'}) {
			$from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
				substr($diffinfo->{'from_id'},0,7));
		} else {
			$from_link = '0' x 7;
		}
		if ($to->{'href'}) {
			$to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
				substr($diffinfo->{'to_id'},0,7));
		} else {
			$to_link = '0' x 7;
		}
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2069
# format from-file/to-file diff header
#
# $from_line / $to_line are the "--- ..." and "+++ ..." lines of a patch.
# For an ordinary diff one from_file line is produced; for a combined diff
# ($diffinfo->{'nparents'} true) one is produced per parent, each with a
# numbered link to the blobdiff against that parent (@parents supplies the
# parent commit ids).  A single to_file line follows.
# File names are escaped and linked where an 'href' is available; lines
# naming /dev/null get no extra formatting.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my $result = '';

	#assert($from_line =~ m/^---/) if DEBUG;
	if (!$diffinfo->{'nparents'}) {
		# ordinary (single parent) diff
		my $line = $from_line;
		if ($line =~ m!^--- "?a/!) {
			$line = '--- a/' .
				($from->{'href'}
					? $cgi->a({-href=>$from->{'href'}, -class=>"path"},
						esc_path($from->{'file'}))
					: esc_path($from->{'file'}));
		}
		$result .= qq{<div class="diff from_file">$line</div>\n};

	} else {
		# combined diff (merge commit)
		for my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $line = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				$line = '--- ' .
					$cgi->a({-href=>href(action=>"blobdiff",
							hash_parent=>$diffinfo->{'from_id'}[$i],
							hash_parent_base=>$parents[$i],
							file_parent=>$from->{'file'}[$i],
							hash=>$diffinfo->{'to_id'},
							hash_base=>$hash,
							file_name=>$to->{'file'}),
						-class=>"path",
						-title=>"diff" . ($i+1)},
						$i+1) .
					'/' .
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
						esc_path($from->{'file'}[$i]));
			}
			$result .= qq{<div class="diff from_file">$line</div>\n};
		}
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	my $line = $to_line;
	if ($line =~ m!^\+\+\+ "?b/!) {
		$line = '+++ b/' .
			($to->{'href'}
				? $cgi->a({-href=>$to->{'href'}, -class=>"path"},
					esc_path($to->{'file'}))
				: esc_path($to->{'file'}));
	}
	$result .= qq{<div class="diff to_file">$line</div>\n};

	return $result;
}
2135
# create note for patch simplified by combined diff
#
# Produces a "diff --cc <file>" header div followed by a "Simple merge"
# div.  The file name is linked to its blob unless is_deleted($diffinfo)
# is true.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $path = is_deleted($diffinfo)
		? esc_path($diffinfo->{'to_file'})
		: $cgi->a({-href => href(action=>"blob",
					hash_base=>$hash,
					hash=>$diffinfo->{'to_id'},
					file_name=>$diffinfo->{'to_file'}),
				-class => "path"},
			esc_path($diffinfo->{'to_file'}));

	return '<div class="diff header">' . 'diff --cc ' . $path . "</div>\n" .
		'<div class="diff nodifferences">' . 'Simple merge' . "</div>\n";
}
2160
# format patch (diff) line (not to be used for diff headers)
#
# $line is one line of patch text; $from and $to are optional hash refs
# whose 'href' entries link to the two sides of the patch.  When
# $from->{'href'} is an array ref the patch is treated as a combined diff.
# Returns a <div class="diff ..."> element whose extra class (add, rem,
# chunk_header, incomplete) is derived from the leading character(s).
# With both $from and $to given, the ranges of a chunk header are linked to
# "#l<start>" anchors of the hrefs; any other line is passed to esc_html().
sub format_diff_line {
	my ($line, $from, $to) = @_;
	my $diff_class = "";

	chomp $line;

	if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
		# combined diff: look at as many leading characters as 'href' entries
		my $markers = substr($line, 0, scalar @{$from->{'href'}});
		$diff_class =
			  $line =~ m/^\@{3}/ ? " chunk_header"
			: $line =~ m/^\\/ ? " incomplete"
			: $markers =~ tr/+/+/ ? " add"
			: $markers =~ tr/-/-/ ? " rem"
			: "";
	} else {
		# assume ordinary diff: the first character decides
		my %class_for = (
			'+'  => " add",
			'-'  => " rem",
			'@'  => " chunk_header",
			"\\" => " incomplete",
		);
		my $marker = substr($line, 0, 1);
		$diff_class = $class_for{$marker}
			if exists $class_for{$marker};
	}

	$line = untabify($line);
	my $div_open = "<div class=\"diff$diff_class\">";

	if ($from && $to && $line =~ m/^\@{2} /) {
		# chunk header of an ordinary diff; the line counts are not needed
		my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
			$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

		$from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
				-class=>"list"}, $from_text)
			if $from->{'href'};
		$to_text = $cgi->a({-href=>"$to->{'href'}#l$to_start",
				-class=>"list"}, $to_text)
			if $to->{'href'};

		return $div_open .
			"<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
			"<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>" .
			"</div>\n";
	}

	if ($from && $to && $line =~ m/^\@{3}/) {
		# chunk header of a combined diff
		my ($ats, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

		my @range_text = split(' ', $ranges);
		my @range_start;
		foreach my $range (@range_text) {
			# drop the leading sign and keep what precedes the comma; the
			# trailing 0 is what is used when nothing follows the sign
			my ($start) = (split(',', substr($range, 1)), 0);
			push @range_start, $start;
		}

		# the last range is the one linked to $to, the others to $from
		my $to_text  = pop @range_text;
		my $to_start = pop @range_start;

		my $info = "<span class=\"chunk_info\">$ats ";
		foreach my $i (0 .. $#range_text) {
			$info .= $from->{'href'}[$i]
				? $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
						-class=>"list"}, $range_text[$i])
				: $range_text[$i];
			$info .= " ";
		}
		$info .= $to->{'href'}
			? $cgi->a({-href=>"$to->{'href'}#l$to_start",
					-class=>"list"}, $to_text)
			: $to_text;
		$info .= " $ats</span>";

		return $div_open . $info .
			"<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>" .
			"</div>\n";
	}

	return $div_open . esc_html($line, -nbsp=>1) . "</div>\n";
}
2249
# Returns the snapshot link(s) for the tree/commit given by $hash, or undef
# when no snapshot format is enabled:
#   one format   => "_snapshot_" (format name shown in the link's tooltip)
#   many formats => "snapshot (_tbz2_ _zip_)" (one link per format name)
sub format_snapshot_links {
	my ($hash) = @_;

	# URL of the snapshot of $hash in the given format
	my $snapshot_url = sub {
		my ($fmt) = @_;
		return href(action=>"snapshot", hash=>$hash, snapshot_format=>$fmt);
	};

	# no formats configured
	return undef unless @snapshot_fmts;

	if (@snapshot_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		my $fmt = $snapshot_fmts[0];
		return $cgi->a({
			-href  => $snapshot_url->($fmt),
			-title => "in format: $known_snapshot_formats{$fmt}{'display'}",
		}, "snapshot");
	}

	# A parenthesized list of links bearing format names,
	# e.g. "snapshot (_tar.gz_ _zip_)"
	my @links = map {
		$cgi->a({ -href => $snapshot_url->($_) },
		        $known_snapshot_formats{$_}{'display'})
	} @snapshot_fmts;
	return "snapshot (" . join(' ', @links) . ")";
}
2284
2285 ## ......................................................................
2286 ## functions returning values to be passed, perhaps after some
2287 ## transformation, to other functions; e.g. returning arguments to href()
2288
# Returns a key/value list suitable for passing to href() to build the URL
# of the feed matching the current view; the -title key carries a
# description of the link.  The optional argument is the feed format
# (default 'Atom'); its lowercased name becomes the action.
# Returns nothing when there is no current project or when the current
# action has no specific feed.
sub get_feed_info {
	my $format = shift || 'Atom';

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branch refs use the 'refs/heads/' prefix (full name) to differentiate
	# them from tag links; this also makes it possible to detect branch
	# links.  $hash_base takes precedence over $hash.
	my $branch;
	foreach my $ref ($hash_base, $hash) {
		next unless defined $ref;
		if ($ref =~ m!^refs/heads/(.*)$!) {
			$branch = $1;
			last;
		}
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} else {
		$type = defined $branch ? "log of $branch" : 'log';
	}

	return (
		action      => lc($format),
		-title      => $type,
		'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
		'file_name' => $file_name,
	);
}
2324
2325 ## ----------------------------------------------------------------------
2326 ## git utility subroutines, invoking git commands
2327
# Returns, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Every call is counted in
# $number_of_git_cmds.
sub git_cmd {
	++$number_of_git_cmds;
	return ($GIT, "--git-dir=$git_dir");
}
2333
# Quote the given arguments for passing them to the shell: every argument
# is wrapped in single quotes, and embedded ' and ! characters are moved
# outside the quotes and backslash-escaped.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $arg (@_) {
		# work on a copy, @_ aliases the caller's variables
		(my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$escaped'";
	}
	return join(' ', @quoted);
}
2342
# Get the hash that HEAD of the given project resolves to
# (see git_get_hash for the return value).
sub git_get_head_hash {
	my ($project) = @_;
	return git_get_full_hash($project, 'HEAD');
}
2347
# Resolve a revision of a project to its full hash; all arguments
# (project, revision, extra rev-parse options) go to git_get_hash unchanged.
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2351
# Like git_get_full_hash, but asks rev-parse for an abbreviated hash by
# appending the '--short=7' option to the arguments.
sub git_get_short_hash {
	my @args = @_;
	push @args, '--short=7';
	return git_get_hash(@args);
}
2355
# Run 'git rev-parse --verify -q [options] <hash>' in the repository of
# $project (relative to $projectroot) and return the first line of its
# output, chomped; undef if the command could not be started or printed
# nothing.
# The global $git_dir is pointed at the project for the duration of the
# call and restored afterwards, but only if it was defined on entry.
sub git_get_hash {
	my ($project, $hash, @options) = @_;

	my $saved_git_dir = $git_dir;
	$git_dir = "$projectroot/$project";

	my $result;
	my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
	if (open my $fd, '-|', @cmd) {
		$result = <$fd>;
		chomp $result if defined $result;
		close $fd;
	}

	$git_dir = $saved_git_dir if defined $saved_git_dir;
	return $result;
}
2372
# Get the type of the given object, i.e. the chomped first line printed by
# 'git cat-file -t <hash>'.  Returns nothing if the command cannot be
# started or if closing the pipe reports a failure.
sub git_get_type {
	my ($hash) = @_;

	my @cmd = (git_cmd(), "cat-file", '-t', $hash);
	open my $fd, "-|", @cmd
		or return;
	my $type = <$fd>;
	close $fd
		or return;

	chomp $type;
	return $type;
}
2383
# repository configuration: %config holds the parsed configuration and
# $config_file remembers which config file it was read from (see
# git_get_project_config, which fills both)
our %config;
our $config_file = '';
2387
# Add $value under $key in the hash referenced by $hash.
# A key seen for the first time stores the value directly (not as
# [ <value> ]); further values for the same key turn the entry into an
# anonymous array holding all values in the order they were added.
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key}) {
		if (ref $hash->{$key}) {
			# already multi-valued: append
			push @{ $hash->{$key} }, $value;
		} else {
			# second value: promote scalar to array
			$hash->{$key} = [ $hash->{$key}, $value ];
		}
	} else {
		$hash->{$key} = $value;
	}
}
2401
# Return a hash with the configuration of the current git project, as
# printed by 'git config -z -l'.  Keys are the full variable names;
# variables occurring more than once hold an array reference (see
# hash_set_multi), and a variable given without a value maps to undef.
# The optional argument is a regexp (as a string) limiting the result to
# matching sections, e.g. 'gitweb'.
# Returns nothing if the git command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compile the section filter once per call.  The /o modifier used here
	# previously compiled it once per *process*, so in a persistent
	# interpreter (e.g. mod_perl) a later call with a different section
	# would silently keep filtering on the first one.
	my $key_filter = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	# 'git config -z' terminates each entry with NUL ...
	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# ... and separates the key from its value with a newline
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $key_filter || $key =~ $key_filter);
	}
	close $fh;

	return %config;
}
2424
# Convert a config value to a Perl boolean.
# True: no value at all, a number other than 0, 'true' and 'yes' (any
# case); surrounding whitespace is ignored.
# Everything else is treated as false (never as an error).
sub config_to_bool {
	my ($val) = @_;

	# variable present without a value: "section.key"
	defined $val
		or return 1;

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	# section.key = 1
	my $nonzero_number = ($val =~ /^\d+$/ && $val);
	# section.key = true
	return $nonzero_number || ($val =~ /^(?:true|yes)$/i);
}
2440
# Convert a config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (any case) causes the value
# to be multiplied by 1024, 1048576, or 1073741824.  Surrounding
# whitespace is stripped; a value without such a suffix is returned as is.
sub config_to_int {
	my ($val) = @_;

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	my %multiplier = (
		'k' =>       1024,
		'm' =>    1048576,
		'g' => 1073741824,
	);
	if ($val =~ /^([0-9]*)([kmg])$/i) {
		return $1 * $multiplier{lc $2};
	}
	return $val;
}
2460
# Convert a config value to an array reference, if needed: a reference is
# returned unchanged, a defined scalar is wrapped as [ <value> ], and an
# undefined value gives a reference to an empty array.
sub config_to_multi {
	my ($val) = @_;

	return $val     if ref($val);
	return [ $val ] if defined($val);
	return [];
}
2467
# Return the value of configuration variable gitweb.$key of the current
# project ($git_dir); $key may be given with or without the 'gitweb.'
# prefix.  $type may be 'bool' or 'int' (optionally prefixed with '--'):
#   'bool' => 'true' or 'false', as a string
#   'int'  => number with any k/m/g suffix applied (see config_to_int)
# Any other or no type gives the value as stored in %config.
# Returns nothing if $git_dir is not set, the key is empty or contains
# non-word characters, or the variable does not exist.
# The parsed 'gitweb' section is cached in %config and re-read only when
# $git_dir/config differs from $config_file.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);

	# type sanity check: unknown types are treated like no type
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# get config, unless it is already cached for this repository
	my $wanted_file = "$git_dir/config";
	if (!defined $config_file || $config_file ne $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $name = "gitweb.$key";
	return unless exists $config{$name};

	# ensure given type
	return $config{$name} unless defined $type;
	if ($type eq 'bool') {
		# backward compatibility: 'git config --bool' returns true/false
		return (config_to_bool($config{$name}) ? 'true' : 'false');
	}
	# only 'int' is left after the type sanity check
	return config_to_int($config{$name});
}
2506
# Get the hash of the entry at the given path in the given tree-ish.
#   $base - tree-ish (ref) to look in
#   $path - path of the entry; trailing slashes are ignored
#   $type - optional; when given, the entry must be of this type
#           (the type column printed by 'git ls-tree')
# Returns the hash, or undef if $path is empty, nothing exists at $path,
# the type does not match, closing the pipe reports a failure, or the
# ls-tree output cannot be parsed.  Dies via die_error() if git-ls-tree
# cannot be started.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift || return undef;
	my $type = shift;

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# Capture into lexicals and check that the match succeeded; reading
	# $2 and $3 after an unchecked match yields undefined or stale values
	# when the line has an unexpected format.
	my ($entry_type, $entry_hash) =
		($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/)
		or return undef;

	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2533
# Get the path of the entry with the given hash in the given tree-ish (ref);
# used to get the 'from' filename for combined diff (merge commit) for
# renames.  The whole tree is listed recursively (including trees
# themselves) and the path of the first entry with that hash is returned.
# Returns nothing if $base or $hash is empty, undef if git-ls-tree cannot
# be started or no entry matches.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# 'git ls-tree -z' terminates entries with NUL
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
		# \Q..\E: $hash is matched literally, never as a pattern.
		# /s and \z: with -z a path may contain newlines, which '.'
		# and '$' would otherwise fail to match across.
		if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
			my $path = $1;
			close $fd;
			return $path;
		}
	}
	close $fd;
	return undef;
}
2557
2558 ## ......................................................................
2559 ## git utility functions, directly accessing git repository
2560
# Return the description of the project at $path (relative to
# $projectroot): the chomped first line of its 'description' file, or, if
# that file cannot be opened, the 'description' config variable.
# Side effect: points the global $git_dir at the project.
sub git_get_project_description {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	if (open my $fd, '<', "$git_dir/description") {
		my $descr = <$fd>;
		close $fd;
		chomp $descr if defined $descr;
		return $descr;
	}
	return git_get_project_config('description');
}
2574
# Return a hash reference mapping each content tag of the project at $path
# to the chomped first line of its file in the project's 'ctags'
# directory.  The hash is empty if that directory cannot be opened;
# entries that are not plain files or cannot be opened are skipped.
# Side effect: points the global $git_dir at the project.
sub git_get_project_ctags {
	my ($path) = @_;
	my %ctags;

	$git_dir = "$projectroot/$path";
	my $ctags_dir = "$git_dir/ctags";

	opendir my $dh, $ctags_dir
		or return \%ctags;
	my @entries = readdir($dh);
	closedir $dh;

	foreach my $entry (@entries) {
		my $file = "$ctags_dir/$entry";
		next unless -f $file;
		open my $ct, '<', $file or next;
		my $val = <$ct>;
		chomp $val;
		close $ct;

		# tag name is the file name without its directory part
		(my $ctag = $file) =~ s#.*/##;
		$ctags{$ctag} = $val;
	}
	return \%ctags;
}
2593
# Build the tag cloud data from $ctags, a hash reference mapping tag names
# to counts.  Tags differing only in case are merged under their
# lowercased name: counts are summed, and the spelling with the highest
# individual count is kept as the display name ('topname').
# Returns an HTML::TagCloud object when that module can be loaded,
# otherwise a reference to the merged hash
# ({ <lc tag> => { count, topcount, topname } }).
sub git_populate_project_tagcloud {
	my ($ctags) = @_;

	# First, merge different-cased tags; tags vote on casing
	my %ctags_lc;
	foreach my $tag (keys %$ctags) {
		my $weight = $ctags->{$tag};
		my $merged = ($ctags_lc{lc $tag} ||= {});
		$merged->{count} += $weight;
		if (!$merged->{topcount} || $merged->{topcount} < $weight) {
			$merged->{topcount} = $weight;
			$merged->{topname} = $tag;
		}
	}

	# without HTML::TagCloud the caller gets the merged data as is
	return \%ctags_lc
		unless eval { require HTML::TagCloud; 1; };

	my $cloud = HTML::TagCloud->new;
	foreach my $tag_lc (sort keys %ctags_lc) {
		my $entry = $ctags_lc{$tag_lc};
		# Pad the title with spaces so that the cloud looks
		# less crammed.
		my $title = $entry->{topname};
		$title =~ s/ /&nbsp;/g;
		$title =~ s/^/&nbsp;/g;
		$title =~ s/$/&nbsp;/g;
		$cloud->add($title, "$home_link?by_tag=$tag_lc", $entry->{count});
	}
	return $cloud;
}
2625
# Return the HTML for a tag cloud limited to $count tags.
# $cloud is what git_populate_project_tagcloud returned: either an
# HTML::TagCloud object, which renders itself, or a hash reference
# { <lc tag> => { count, topname, ... } }, which is rendered as a centered,
# comma-separated list of links to "$home_link?by_tag=<tag>".
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;
	# (a leftover debugging print to STDERR was removed here: it wrote a
	# line to the web server's error log on every call)
	if (ref $cloud eq 'HTML::TagCloud') {
		return $cloud->html_and_css($count);
	} else {
		# NOTE(review): this sorts by ascending count, so the $count tags
		# shown are the ones with the smallest counts -- confirm intent
		my @tags = sort { $cloud->{$a}->{count} <=> $cloud->{$b}->{count} } keys %$cloud;
		return '<p align="center">' . join (', ', map {
			$cgi->a({-href=>"$home_link?by_tag=$_"}, $cloud->{$_}->{topname})
		} splice(@tags, 0, $count)) . '</p>';
	}
}
2638
# Return the clone URLs of the project at $path (relative to
# $projectroot): the chomped lines of its 'cloneurl' file, or, if that
# file cannot be opened, the value(s) of the 'url' config variable.
# Returns a list in list context and an array reference otherwise.
# Side effect: points the global $git_dir at the project.
sub git_get_project_url_list {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	my $urls;
	if (open my $fd, '<', "$git_dir/cloneurl") {
		my @lines = <$fd>;
		close $fd;
		chomp @lines;
		$urls = \@lines;
	} else {
		$urls = config_to_multi(git_get_project_config('url'));
	}

	return wantarray ? @$urls : $urls;
}
2652
# Return the list of exported projects as hash references with a 'path'
# key (and an 'owner' key when read from a file).
# If $projects_list is a directory it is scanned (following symlinks, at
# most $project_maxdepth levels deep) for directories accepted by
# check_export_ok(); if it is a file, the projects are read from it, one
# url-encoded "<path> <owner>" pair per line.
# The optional $filter (a trailing '.git' is ignored) limits the result
# to projects below "$filter/", i.e. to forks of that project.  Without a
# filter, and with the 'forks' feature enabled, projects read from a file
# that look like forks of a project listed earlier in it are left out.
sub git_get_projects_list {
	my ($filter) = @_;
	my @projects;

	$filter ||= '';
	$filter =~ s/\.git$//;

	my $check_forks = gitweb_check_feature('forks');

	# true if $candidate has the form "$parent/<something>.git"
	my $is_fork_of = sub {
		my ($candidate, $parent) = @_;
		my $parent_len = length($parent);
		return 0 if substr($candidate, 0, $parent_len) ne $parent;
		return (substr($candidate, $parent_len) =~ /^\/.*\.git$/) ? 1 : 0;
	};

	if (-d $projects_list) {
		# search in directory
		my $top = $projects_list;
		$top .= "/$filter" if $filter;
		# remove the trailing "/"
		$top =~ s!/+$!!;
		my $top_len   = length($top);
		my $top_depth = ($top =~ tr!/!!);

		my $wanted = sub {
			# global variables
			our $project_maxdepth;
			our $projectroot;
			# skip project-list toplevel, if we get it.
			return if (m!^[/.]$!);
			# only directories can be git repositories
			return unless (-d $_);
			# don't traverse too deep (Find is super slow on os x)
			my $depth = ($File::Find::name =~ tr!/!!) - $top_depth;
			if ($depth > $project_maxdepth) {
				$File::Find::prune = 1;
				return;
			}

			my $subdir = substr($File::Find::name, $top_len + 1);
			# we check related file in $projectroot
			my $path = ($filter ? "$filter/" : '') . $subdir;
			if (check_export_ok("$projectroot/$path")) {
				push @projects, { path => $path };
				# no need to look for repositories inside a repository
				$File::Find::prune = 1;
			}
		};

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => $wanted,
		}, $top);

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'

		# paths (without '.git') of the projects accepted so far;
		# later entries below one of them are considered forks
		my %seen_parent;
		open my $fd, '<', $projects_list or return;
	PROJECT:
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			$path  = unescape($path);
			$owner = unescape($owner);
			next PROJECT unless defined $path;

			if ($filter ne '') {
				# looking for forks of $filter only
				next PROJECT unless $is_fork_of->($path, $filter);
			} elsif ($check_forks) {
				foreach my $parent (keys %seen_parent) {
					# is a fork, don't include it in the list
					next PROJECT if $is_fork_of->($path, $parent);
				}
			}

			next PROJECT unless check_export_ok("$projectroot/$path");

			push @projects, {
				path => $path,
				owner => to_utf8($owner),
			};
			(my $forks_path = $path) =~ s/\.git$//;
			$seen_parent{$forks_path}++;
		}
		close $fd;
	}
	return @projects;
}
2755
# Cache of project owners read from $projects_list, as a hash reference
# { <project path> => <owner> }; undef until the file has been looked at.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from $projects_list, if that is a plain
# file; does nothing if the cache has already been filled.  The cache is
# left empty when $projects_list is not a file or cannot be opened.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	return unless (-f $projects_list);

	# the file may be unreadable even though it exists; do not read from
	# an unopened handle in that case
	open(my $fd, '<', $projects_list)
		or return;
	while (my $line = <$fd>) {
		chomp $line;
		my ($pr, $ow) = split ' ', $line;
		# blank lines carry no project; skipping them avoids an
		# undefined hash key
		next unless defined $pr;
		$pr = unescape($pr);
		$ow = unescape($ow);
		$gitweb_project_owner->{$pr} = to_utf8($ow);
	}
	close $fd;
	return;
}
2778
# Return the owner of the given project, trying in this order: the owner
# listed for it in the projects list file, the 'owner' config variable of
# the repository, and the result of get_file_owner() on the repository
# directory.  Returns undef if no project is given.
# Side effect: points the global $git_dir at the project.
sub git_get_project_owner {
	my ($project) = @_;

	return undef unless $project;
	$git_dir = "$projectroot/$project";

	# fill the owner cache on first use
	git_get_project_list_from_file()
		unless defined $gitweb_project_owner;

	my $owner;
	$owner = $gitweb_project_owner->{$project}
		if exists $gitweb_project_owner->{$project};
	$owner = git_get_project_config('owner')
		unless defined $owner;
	$owner = get_file_owner("$git_dir")
		unless defined $owner;

	return $owner;
}
2802
# Return (<age in seconds>, <age as string>) of the most recent commit,
# by committer date, on any branch (refs/heads) of the project at $path.
# Returns nothing if git-for-each-ref cannot be started or closing the
# pipe reports a failure, and (undef, undef) if its output does not end in
# "<epoch> <timezone>".
# Side effect: points the global $git_dir at the project.
sub git_get_last_activity {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	my @cmd = (git_cmd(), 'for-each-ref',
	           '--format=%(committer)',
	           '--sort=-committerdate',
	           '--count=1',
	           'refs/heads');
	open(my $fd, "-|", @cmd) or return;
	my $most_recent = <$fd>;
	close $fd or return;

	return (undef, undef)
		unless (defined $most_recent &&
		        $most_recent =~ / (\d+) [-+][01]\d\d\d$/);

	my $timestamp = $1;
	my $age = time - $timestamp;
	return ($age, age_string($age));
}
2823
# Return the remotes of the current repository as a hash (a hash reference
# in scalar context) of the form
#   <remote> => { 'heads' => undef, <fetch|push> => <url>, ... }
# where 'heads' is a placeholder to be filled in by fill_remote_heads().
# If $wanted is given, only the remote of that name is returned.
# Returns nothing if 'git remote' cannot be started or fails.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote
# URL if it's not defined), and we cannot use 'git remote show' because that
# would try to make a network roundtrip. So the only way to find out whether
# that particular remote is defined is to walk the list provided by 'git
# remote -v' and pick out the lines for the remote we want.
sub git_get_remotes_list {
	my $wanted = shift;
	my %remotes = ();

	# check open() itself; the lexical handle is not a reliable indicator
	# of success
	open my $fd, '-|' , git_cmd(), 'remote', '-v'
		or return;
	while (my $remote = <$fd>) {
		chomp $remote;
		# "<name>\t<url> (<fetch|push>)": strip everything after the name.
		# Lines in any other format are skipped, so that $1 and $2 are
		# only ever read after a successful match.
		$remote =~ s!\t(.*?)\s+\((\w+)\)$!!
			or next;
		my ($url, $key) = ($1, $2);
		next if $wanted and not $remote eq $wanted;

		# explicit undef: "'heads' => ()" is an odd-sized list, which
		# gives the same hash but triggers a warning
		$remotes{$remote} ||= { 'heads' => undef };
		$remotes{$remote}{$key} = $url;
	}
	close $fd or return;
	return wantarray ? %remotes : \%remotes;
}
2848
# Takes a reference to a hash of remotes (as returned by
# git_get_remotes_list) and fills it in place: the 'heads' entry of each
# remote is set to an array reference with the heads, as returned by
# git_get_heads_list, whose name starts with "<remote>/".
# Note that the "<remote>/" prefix is stripped from the 'name' of each
# head as a side effect of selecting it.
sub fill_remote_heads {
	my $remotes = shift;
	my @heads = map { "remotes/$_" } keys %$remotes;
	my @remoteheads = git_get_heads_list(undef, @heads);
	foreach my $remote (keys %$remotes) {
		# \Q..\E: match the remote name literally; names may contain
		# characters that are special in a regexp, such as '.' or '+'
		$remotes->{$remote}{'heads'} = [ grep {
			$_->{'name'} =~ s!^\Q$remote\E/!!
			} @remoteheads ];
	}
}
2861
# Return a hash reference mapping object ids to an array reference of the
# names (without the leading 'refs/') of the refs pointing at them, as
# listed by 'git show-ref --dereference'.  The optional $type (e.g.
# 'heads') limits the listing to refs below "refs/$type".
# Returns nothing if the command cannot be started or fails.
sub git_get_references {
	my $type = shift || "";
	my %refs;

	# use -- <pattern> if $type
	my @pattern = $type ? ("--", "refs/$type") : ();

	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
		or return;

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
		push @{ $refs{$1} }, $2;
	}
	close $fd or return;
	return \%refs;
}
2884
# Return the tag-based name that 'git name-rev --tags' gives to $hash
# (the part after 'tags/'), or undef if $hash is empty or the output has
# any other form.  Returns nothing if the command cannot be started.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	my @cmd = (git_cmd(), "name-rev", "--tags", $hash);
	open my $fd, "-|", @cmd
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# the fallback catches also '$hash undefined' output
	return ($name_rev =~ m|^$hash tags/(.*)$|) ? $1 : undef;
}
2900
2901 ## ----------------------------------------------------------------------
2902 ## parse to hash functions
2903
# Break the timestamp $epoch (seconds since the epoch) down into a hash of
# ready-to-print pieces.  $tz is the timezone it was recorded in, as
# "+hhmm" or "-hhmm" (default "-0000").
# UTC based keys:      hour, minute, mday, day, month, rfc2822,
#                      mday-time, iso-8601
# timezone based keys: hour_local, minute_local, tz_local, iso-tz
sub parse_date {
	my $epoch = shift;
	my $tz = shift || "-0000";

	my @months = qw(Jan Feb Mar Apr May Jun Jul Aug Sep Oct Nov Dec);
	my @days = qw(Sun Mon Tue Wed Thu Fri Sat);

	# the timestamp in UTC
	my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
	my %date = (
		'hour'      => $hour,
		'minute'    => $min,
		'mday'      => $mday,
		'day'       => $days[$wday],
		'month'     => $months[$mon],
		'rfc2822'   => sprintf("%s, %d %s %4d %02d:%02d:%02d +0000",
		                       $days[$wday], $mday, $months[$mon],
		                       1900+$year, $hour, $min, $sec),
		'mday-time' => sprintf("%d %s %02d:%02d",
		                       $mday, $months[$mon], $hour, $min),
		'iso-8601'  => sprintf("%04d-%02d-%02dT%02d:%02d:%02dZ",
		                       1900+$year, 1+$mon, $mday, $hour, $min, $sec),
	);

	# the same moment as wall-clock time in timezone $tz: shift the epoch
	# by the timezone offset and break it down as if it were UTC
	my ($tz_sign, $tz_hour, $tz_min) =
		($tz =~ m/^([-+])(\d\d)(\d\d)$/);
	my $offset = (($tz_hour*60) + $tz_min)*60;
	$offset = -$offset if ($tz_sign eq '-');
	($sec, $min, $hour, $mday, $mon, $year) = gmtime($epoch + $offset);

	@date{'hour_local', 'minute_local', 'tz_local'} = ($hour, $min, $tz);
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$year, $mon+1, $mday,
	                          $hour, $min, $sec, $tz);
	return %date;
}
2937
# Parse the tag object $tag_id, as printed by 'git cat-file tag', into a
# hash with the keys
#   id, object, type, name,
#   author, author_epoch, author_tz, author_name, author_email (from the
#   'tagger' line; author_email only if the tagger has the form
#   "name <email>"),
#   comment (array reference with the lines following the header).
# Returns nothing if the command cannot be started or fails, or if the
# object has no 'tag' line.
sub parse_tag {
	my ($tag_id) = @_;
	my %tag;
	my @comment;

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
	$tag{'id'} = $tag_id;

	# header lines, up to the first empty line or the start of a
	# "--BEGIN" block
	while (my $line = <$fd>) {
		chomp $line;
		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
			next;
		}
		if ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
			next;
		}
		if ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
			next;
		}
		if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@tag{'author_name', 'author_email'} = ($1, $2);
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
			next;
		}
		if ($line =~ m/--BEGIN/) {
			# this line already belongs to the comment
			push @comment, $line;
			last;
		}
		last if ($line eq "");
	}

	# everything that is left is the comment
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag;
}
2978
# Parse one record of "git rev-list --header" output into a commit hash.
#
# Parameters:
#   $commit_text - one NUL-terminated record: a first line holding the commit
#                  id (optionally followed by parent ids), the raw commit
#                  headers, an empty line, and the message with every line
#                  indented by four spaces
#   $withparents - when defined, parents are taken only from the first line
#                  and "parent" header lines are ignored
#
# Returns (as a list) a hash with the keys id, tree, parents, parent,
# author, author_epoch, author_tz, author_name, author_email (and the same
# for committer), title, title_short, comment, age, age_string,
# age_string_date and age_string_age.  Returns an empty list when the record
# is empty, does not start with an object id, or has no "tree" header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;

        # the commit headers end at the first empty line, which is false and
        # therefore terminates the loop (after having been shifted off)
        while (my $line = shift @commit_lines) {
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^(author|committer) (.*) ([0-9]+) (.*)$/) {
                        # author and committer lines share one layout:
                        # "<role> <name> <<email>> <epoch> <timezone>"
                        my ($role, $ident, $epoch, $tz) = ($1, $2, $3, $4);
                        $co{$role} = to_utf8($ident);
                        $co{"${role}_epoch"} = $epoch;
                        $co{"${role}_tz"} = $tz;
                        if ($co{$role} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{"${role}_name"}  = $1;
                                $co{"${role}_email"} = $2;
                        } else {
                                $co{"${role}_name"} = $co{$role};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        }
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # remove the four spaces of indentation added to every message line
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }

        foreach my $line (@commit_lines) {
                next if $line eq "";

                # foreach aliases the array elements, so shorten a copy:
                # editing $line itself would also rewrite $co{'comment'}
                my $title = $line;
                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        if (length($title) > 50) {
                                $title =~ s/(http|rsync):\/\///;
                        }
                        if (length($title) > 50) {
                                $title =~ s/(master|www|rsync)\.//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/kernel.org:?//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/\/pub\/scm//;
                        }
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        $co{'comment'} = \@commit_lines;

        # a record without a parsable committer line has no epoch; fall back
        # to 0 instead of doing arithmetic on undef
        my $committer_epoch = $co{'committer_epoch'} || 0;
        my $age = time - $committer_epoch;
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($committer_epoch);
        my $date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        # commits older than two weeks show the date first, the age second
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = $date;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = $date;
        }
        return %co;
}
3076
# Read and parse a single commit, identified by $commit_id, using
# "git rev-list --parents --header --max-count=1".
# Returns the hash built by parse_commit_text(); the hash is empty when
# rev-list printed nothing or the record could not be parsed.
sub parse_commit {
        my ($commit_id) = @_;
        my %co;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--",
                or die_error(500, "Open git-rev-list failed");
        # read in scalar context: a list-context <$fd> placed directly in the
        # argument list disappears on empty output, which would shift the
        # "with parents" flag into the $commit_text position
        my $commit_text = <$fd>;
        close $fd;

        %co = parse_commit_text($commit_text, 1)
                if defined $commit_text;

        return %co;
}
3095
# Run "git rev-list --header" starting at $commit_id and parse every record.
# $maxcount defaults to 1 and $skip to 0; $filename, when true, limits the
# walk to that path; @args are passed through to rev-list.
# Returns the list of commit hash references (an array reference in scalar
# context).
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount = 1 unless $maxcount;
        $skip = 0 unless $skip;

        # records are NUL-terminated
        local $/ = "\0";

        my @path_limit = $filename ? ($filename) : ();
        my @rev_list = (
                git_cmd(), "rev-list",
                "--header",
                @args,
                "--max-count=" . $maxcount,
                "--skip=" . $skip,
                @extra_options,
                $commit_id,
                "--",
                @path_limit,
        );

        open my $fd, "-|", @rev_list
                or die_error(500, "Open git-rev-list failed");
        my @cos;
        while (my $record = <$fd>) {
                # one hash per record, even if the record failed to parse
                my %parsed = parse_commit_text($record);
                push @cos, \%parsed;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3123
# parse line of git-diff-tree "raw" output
#
# Three line shapes are recognized; anything else yields an empty result:
#   ':<from mode> <to mode> <from id> <to id> <status>[<score>]\t<path(s)>'
#   '::<modes...> <ids...> <status letters>\t<path>'   (combined diff)
#   '<40 hex digits>'                                  (commit id)
# Returns the parsed fields as a hash, or as a hash reference in scalar
# context.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if (my @raw = $line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                my $paths = pop @raw;
                @res{qw(from_mode to_mode from_id to_id status similarity)} = @raw;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        ($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif (my @combined = $line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
                my ($colons, $modes, $ids, $statuses, $path) = @combined;
                $res{'nparents'}  = length($colons);
                # the last mode and the last id belong to the result
                my @modes = split(' ', $modes);
                $res{'to_mode'} = pop @modes;
                $res{'from_mode'} = \@modes;
                my @ids = split(' ', $ids);
                $res{'to_id'} = pop @ids;
                $res{'from_id'} = \@ids;
                $res{'status'} = [ split('', $statuses) ];
                $res{'to_file'} = unquote($path);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif (my ($commit_id) = $line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $commit_id;
        }

        return wantarray ? %res : \%res;
}
3162
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
#
# A hash reference is handed back untouched (it is already parsed, or was
# generated by hand); everything else goes through parse_difftree_raw_line().
sub parsed_difftree_line {
        my $line_or_ref = shift;

        return ref($line_or_ref) eq "HASH"
                ? $line_or_ref
                : parse_difftree_raw_line($line_or_ref);
}
3175
# parse line of git-ls-tree output
#
# Parameters:
#   $line - one entry as printed by git-ls-tree
#   %opts - '-l' => true if the line carries a size column (ls-tree -l),
#           '-z' => true if names are verbatim (ls-tree -z); otherwise the
#                   name is passed through unquote()
#
# Returns a hash (hash reference in scalar context) with the keys mode,
# type, hash, name and, with '-l', size.  A line that does not have the
# expected layout yields an empty hash instead of fields filled from the
# captures of some earlier, unrelated regex match.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        my (@keys, @fields);
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                @keys = qw(mode type hash size);
                @fields = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                @keys = qw(mode type hash);
                @fields = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;
        }

        # an empty @fields means the match failed
        if (@fields) {
                # the name is always the last captured field
                my $name = pop @fields;
                @res{@keys} = @fields;
                $res{'name'} = $opts{'-z'} ? $name : unquote($name);
        }

        return wantarray ? %res : \%res;
}
3211
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# Fills %$from and %$to with the keys 'file' and 'href' describing the
# pre-image and post-image of $diffinfo (a parsed diff-tree line).  For a
# combined diff (nparents set) the $from values are array references with
# one entry per parent in @parents.  'href' is left out (or undef, per
# parent) where the file does not exist on that side.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                if (!exists $diffinfo->{'from_file'}) {
                        fill_from_file_info($diffinfo, @parents);
                }
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the result name where no per-parent
                        # name is recorded
                        my $parent_file = $diffinfo->{'from_file'}[$i];
                        $parent_file = $diffinfo->{'to_file'}
                                unless defined $parent_file;
                        $from->{'file'}[$i] = $parent_file;

                        my $parent_href;
                        if ($diffinfo->{'status'}[$i] ne "A") { # not new (added) file
                                $parent_href = href(action=>"blob",
                                                    hash_base=>$parents[$i],
                                                    hash=>$diffinfo->{'from_id'}[$i],
                                                    file_name=>$from->{'file'}[$i]);
                        }
                        $from->{'href'}[$i] = $parent_href;
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                delete $to->{'href'};
        } else { # file exists in result
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3257
3258 ## ......................................................................
3259 ## parse to array of hashes functions
3260
# List refs below refs/<class> for every class in @classes (default:
# 'heads'), most recently committed first, using git-for-each-ref.
# When $limit is true, at most $limit+1 refs are requested.
# Each entry is a hash reference with the keys fullname, name, id, title,
# epoch and age.  Returns the list (array reference in scalar context), or
# nothing if git could not be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;

        my @count = $limit ? ('--count='.($limit+1)) : ();
        my @for_each_ref = (
                git_cmd(), 'for-each-ref',
                @count, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                map { "refs/$_" } @classes
        );

        open my $fd, '-|', @for_each_ref
                or return;
        my @headslist;
        while (my $line = <$fd>) {
                chomp $line;
                # "<id> <refname> <subject>" NUL "<committer> <epoch> <tz>"
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($id, $fullname, $subject) = split(' ', $refinfo, 3);
                my (undef, $epoch) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my $shortname = $fullname;
                $shortname =~ s!^refs/(?:head|remote)s/!!;

                my $age = "unknown";
                if ($epoch) {
                        $age = age_string(time - $epoch);
                }

                push @headslist, {
                        'fullname' => $fullname,
                        'name'     => $shortname,
                        'id'       => $id,
                        'title'    => $subject || '(no commit message)',
                        'epoch'    => $epoch,
                        'age'      => $age,
                };
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3299
# List refs below refs/tags, newest creator date first, using
# git-for-each-ref.  When $limit is true, at most $limit+1 refs are
# requested.
# Each entry is a hash reference with the keys fullname, type, id, name,
# reftype and refid; tag objects also get subject, and tags and commits get
# epoch and age.  Returns the list (array reference in scalar context), or
# nothing if git could not be started.
sub git_get_tags_list {
        my $limit = shift;

        my @count = $limit ? ('--count='.($limit+1)) : ();
        my @for_each_ref = (
                git_cmd(), 'for-each-ref',
                @count, '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
        );

        open my $fd, '-|', @for_each_ref
                or return;
        my @tagslist;
        while (my $line = <$fd>) {
                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $fullname, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my (undef, $epoch) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my $shortname = $fullname;
                $shortname =~ s!^refs/tags/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'type'     => $type,
                        'id'       => $id,
                        'name'     => $shortname,
                );

                if ($type eq "tag") {
                        # tag object: record what it points at
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # otherwise the ref refers to the object itself
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = "unknown";
                        if ($epoch) {
                                $ref_item{'age'} = age_string(time - $epoch);
                        }
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3348
3349 ## ----------------------------------------------------------------------
3350 ## filesystem-related functions
3351
# Return the owner of $path as recorded in the GECOS field of the password
# database, cut at the first ',' or ';' and converted with to_utf8().
# Returns undef when $path cannot be stat()ed or its uid has no GECOS entry.
# ("return undef" rather than a bare return is kept so that the result is a
# single value in list context too, as before.)
sub get_file_owner {
        my $path = shift;

        # element 4 of stat() is the owner's numeric uid
        my $st_uid = (stat($path))[4];
        # stat() failed: without this guard getpwuid(undef) would treat the
        # uid as 0 and report that account as the owner
        return undef unless defined $st_uid;

        # element 6 of getpwuid() is the GECOS field
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3364
# Print the contents of $filename to the selected output handle, passing
# each line through to_utf8().
# Callers are expected to have checked that the file exists; should it
# nevertheless fail to open, nothing is printed.
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        # print line by line instead of slurping the whole file first
        while (my $line = <$fd>) {
                print to_utf8($line);
        }
        close $fd;
}
3373
3374 ## ......................................................................
3375 ## mimetype related functions
3376
# Look up the MIME type for $filename's extension in the mime.types-style
# file $mimemap: one type per line, followed by tab(s) and a
# whitespace-separated list of extensions; lines starting with '#' are
# comments.  When an extension is listed more than once the last entry wins.
# Returns undef when the file is unreadable, $filename has no extension, or
# the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # use the match result instead of $1: after a failed match $1 would
        # still hold a capture from some earlier regex
        my ($ext) = $filename =~ /\.([^.]*)$/
                or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # a lexical line variable keeps the caller's $_ intact
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, $exts) = split(/\t+/, $line);
                next unless defined $exts;
                foreach my $known_ext (split(/\s+/, $exts)) {
                        $mimemap{$known_ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$ext};
}
3399
# Guess the MIME type of $filename from its extension: first from the
# configured $mimetypes_file (if set), then from /etc/mime.types.
# Returns undef for names without a dot or when no type is found.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # a relative path is relative to the project
                my $map_file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $map_file);
        }
        if (!$mime) {
                $mime = mimetype_guess_file($filename, '/etc/mime.types');
        }
        return $mime;
}
3416
# Determine the MIME type of a blob read from $fd, optionally named
# $filename.  The extension lookup of mimetype_guess() is tried first; then
# the -T text test on $fd; then a few built-in image extensions.
# Without $fd the configured $default_blob_plain_mimetype is returned.
sub blob_mimetype {
        my $fd = shift;
        my $filename = shift;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;

        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;

        return 'application/octet-stream';
}
3443
# Build the Content-Type value for a blob: $type if given, otherwise the
# result of blob_mimetype($fd, $file_name).  For 'text/plain' the configured
# $default_text_plain_charset, when defined, is appended as charset.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        my $add_charset =
                $type eq 'text/plain' && defined $default_text_plain_charset;
        return $type unless $add_charset;
        return $type . "; charset=$default_text_plain_charset";
}
3454
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Parameters:
#   $highlight - true if highlighting is enabled
#   $mimetype  - not used by the lookup
#   $file_name - name of the file; a trailing '.in' is ignored
# The basename is looked up in %highlight_basename first, then its
# extension in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # take the extension from the match result rather than from $1:
        # for a name without a dot the match fails and $1 would still hold
        # a capture from some earlier, unrelated regex
        my ($ext) = $basename =~ /\.([^.]*)$/;
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3471
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# With highlighting enabled and a defined $syntax, $fd is closed and
# reopened on a shell pipeline that feeds "git cat-file blob $hash" into
# $highlight_bin.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        if (!$highlight || !defined $syntax) {
                return $fd;
        }

        close $fd;
        my $cat_blob = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $highlighter = quote_command($highlight_bin).
                          " --replace-tabs=8 --fragment --syntax $syntax";
        # the trailing "|" makes open() read from the pipeline's output
        open $fd, "$cat_blob | $highlighter |"
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3485
3486 ## ======================================================================
3487 ## functions printing HTML: header, footer, error page
3488
# Build the page title: the site name, then (as far as each is defined)
# " - <project>", "/<action>" and " - <file name>".  For the "tree" action a
# file name that does not end in "/" gets one appended.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        }

        return $title;
}
3506
# Print the <link rel="alternate"> elements for the page head.
# With a project selected: for each of RSS and Atom one link to the feed
# described by get_feed_info() and one to its "--no-merges" variant.
# Without a project: links to the plain-text project index and the OPML
# list of project feeds.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my $title = esc_attr("$project - $href_params{'-title'} - $format feed");

                        # Work on a per-format copy of the parameters: the
                        # '--no-merges' option added for the second link must
                        # not carry over into the plain link of the next
                        # format.
                        my %params = (%href_params, 'action' => $type);
                        my $plain_href = href(%params);
                        my $no_merges_href = href(%params, 'extra_options' => '--no-merges');

                        my @links = (
                                [ $title, $plain_href ],
                                [ $title . ' (no merges)', $no_merges_href ],
                        );
                        foreach my $link (@links) {
                                my ($link_title, $link_href) = @$link;
                                print "<link ".
                                      "rel=\"alternate\" ".
                                      "title=\"$link_title\" ".
                                      "href=\"$link_href\" ".
                                      "type=\"application/$type+xml\" ".
                                      "/>\n";
                        }
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3551
# Print the HTTP header (unless the '-no_http_header' option is set) and
# the opening part of the page: XML prolog, <head>, optional site header
# file, the page_header navigation line and, for a project with the search
# feature enabled, the search form.
#
# Parameters:
#   $status  - HTTP status line, default "200 OK"
#   $expires - passed as -expires to the HTTP header
#   %opts    - '-no_http_header' suppresses the HTTP header;
#              '-action_extra' is printed after the action, which is then
#              rendered as a link
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();

        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');
        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;
        my $content_type = $wants_xhtml ? 'application/xhtml+xml' : 'text/html';

        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }
        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        if ($ENV{'PATH_INFO'}) {
                print "<base href=\"".esc_url($base_url)."\" />\n";
        }
        # print out each stylesheet that exist, providing backwards capability
        # for those people who defined $stylesheet in a config file
        my @css = defined $stylesheet ? ($stylesheet) : grep { $_ } @stylesheets;
        foreach my $css_url (@css) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($css_url).'"/>'."\n";
        }
        if ($status eq '200 OK') {
                print_feed_meta();
        }
        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
        }

        print "</head>\n" .
              "<body>\n";

        if (defined $site_header && -f $site_header) {
                insert_file($site_header);
        }

        # navigation line: logo, home link, project, action
        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $cgi->img({-src => esc_url($logo),
                                         -width => 72, -height => 27,
                                         -alt => "git",
                                         -class => "logo"}));
        }
        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                my $have_extra = defined $opts{-action_extra};
                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        # the action becomes a link only when something follows it
                        my $action_print = $action;
                        $action_print = $cgi->a({-href => href(action=>$action)},
                                $action)
                                if $have_extra;
                        print " / $action_print";
                }
                print " / $opts{-action_extra}" if $have_extra;
                print "\n";
        }
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                $searchtext = "" unless defined $searchtext;

                # search from the most specific revision known
                my $search_hash =
                        defined $hash_base ? $hash_base :
                        defined $hash      ? $hash :
                                             "HEAD";

                my $form_action = $my_uri;
                my $use_pathinfo = gitweb_check_feature('pathinfo');
                if ($use_pathinfo) {
                        $form_action .= "/".esc_url($project);
                }

                my $form_head = $cgi->startform(-method => "get", -action => $form_action);
                $form_head .= "<div class=\"search\">\n";
                # with path_info URLs the project is part of the form action
                $form_head .= $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n"
                        unless $use_pathinfo;
                $form_head .= $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n";
                $form_head .= $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n";
                $form_head .= $cgi->popup_menu(-name => 'st', -default => 'commit',
                                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']);
                $form_head .= $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?"));
                $form_head .= " search:\n";

                my $form_tail = $cgi->textfield(-name => "s", -value => $searchtext) . "\n";
                $form_tail .= "<span title=\"Extended regular expression\">";
                $form_tail .= $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                             -checked => $search_use_regexp);
                $form_tail .= "</span>";
                $form_tail .= "</div>";
                $form_tail .= $cgi->end_form() . "\n";

                print $form_head, $form_tail;
        }
}
3678
# Print the closing part of the page: the page_footer block with the
# project description and feed links (or OPML/TXT links when no project is
# selected), optional timing information, the optional site footer file,
# the JavaScript includes, and the closing </body></html> tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # no feed info for this page: mark the links as generic
                $feed_class .= ' generic' unless %href_params;
                $href_params{'-title'} ||= 'log';

                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                my $elapsed = tv_interval($t0, [ gettimeofday() ]);
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      $elapsed.
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;

        my $script;
        if (defined $action &&
            $action eq 'blame_incremental') {
                my $blame_data_url = href(action=>"blame_data", -replay=>1);
                my $base_url_here = href();
                $script = qq!startBlame("!. $blame_data_url .qq!",\n!.
                          qq!           "!. $base_url_here .qq!");\n!;
        } else {
                my $fix_links = gitweb_check_feature('javascript-actions')
                        ? qq!       fixLinks();\n!
                        : '';
                $script = qq!window.onload = function () {\n!.
                          $fix_links.
                          # last parameter to onloadTZSetup must be CSS class used by format_timestamp_html
                          qq!       onloadTZSetup('local', 'gitweb_tz', 'datetime');\n!.
                          qq!};\n!;
        }
        print qq!<script type="text/javascript">\n!.
              $script.
              qq!</script>\n!;

        print "</body>\n" .
              "</html>";
}
3749
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
#
# Prints a complete error page (header, body with "<status> - <message>",
# footer) and then jumps to the DONE_GITWEB label, unless the
# '-error_handler' option is true.  The status defaults to 500 and the
# message to "Internal Server Error".  The message is passed through
# esc_html(); the detailed description is printed as given.  Any options
# following the description are also forwarded to git_header_html().
#
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
sub die_error {
	my ($status, $error, $extra, %opts) = @_;
	$status ||= 500;
	$error = esc_html($error) || "Internal Server Error";

	# full HTTP status line for every status code listed above
	my %http_responses = (
		400 => '400 Bad Request',
		403 => '403 Forbidden',
		404 => '404 Not Found',
		500 => '500 Internal Server Error',
		503 => '503 Service Unavailable',
	);
	git_header_html($http_responses{$status}, undef, %opts);

	print "<div class=\"page_body\">\n" .
	      "<br /><br />\n" .
	      "$status - $error\n" .
	      "<br />\n";
	print "<hr />\n$extra\n" if defined $extra;
	print "</div>\n";

	git_footer_html();
	# leave request processing right away, except when called as error handler
	goto DONE_GITWEB
		unless ($opts{'-error_handler'});
}
3793
3794 ## ----------------------------------------------------------------------
3795 ## functions printing or outputting HTML: navigation
3796
# Print the navigation bar (div of class "page_nav"): the standard views
# plus any entries configured through the 'actions' feature, separated
# by " | ", followed by a second line holding $extra.
# $current  - name of the current view; printed as plain text, not a link
# $suppress - if true, name of a standard view to leave out
# $head     - if defined, 'hash' for the 'commit' and 'commitdiff' links
#             (and for 'shortlog' / 'log' when $current is one of tree,
#             log, shortlog, commit, commitdiff, search)
# $treehead - if defined, 'hash' for the 'tree' link
# $treebase - if defined, 'hash_base' for the 'tree' link
# $extra    - HTML for the second line (pager or formats), default ''
sub git_print_page_nav {
	my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
	$extra = '' unless defined $extra; # pager or formats

	my @navs = grep { !$suppress || $_ ne $suppress }
	           qw(summary shortlog log commit commitdiff tree);

	# href() parameters of each view, keyed by view name
	my %arg;
	$arg{$_} = { action => $_ } foreach @navs;
	if (defined $head) {
		my @with_head = qw(commit commitdiff);
		if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
			push @with_head, qw(shortlog log);
		}
		$arg{$_}{'hash'} = $head foreach @with_head;
	}

	$arg{'tree'}{'hash'} = $treehead if defined $treehead;
	$arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

	# %-escapes that may be used in the link of a configured action
	my %repl = (
		'%' => '%',
		'n' => $project,         # project name
		'f' => $git_dir,         # project path within filesystem
		'h' => $treehead || '',  # current hash ('h' parameter)
		'b' => $treebase || '',  # hash base ('hb' parameter)
	);
	# configured actions come as (label, link, position) triplets
	my @actions = gitweb_get_feature('actions');
	while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
		# put the new entry right after the view it is positioned at
		my @with_action;
		foreach my $nav (@navs) {
			push @with_action, $nav;
			push @with_action, $label if $nav eq $pos;
		}
		@navs = @with_action;
		# expand %-escapes in the link
		$link =~ s/%([%nfhb])/$repl{$1}/g;
		$arg{$label}{'_href'} = $link;
	}

	my @entries;
	foreach my $nav (@navs) {
		if ($nav eq $current) {
			push @entries, $nav;
			next;
		}
		# configured actions carry a ready-made link, views go through href()
		push @entries,
			$cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
	}

	print "<div class=\"page_nav\">\n" . join(" | ", @entries);
	print "<br/>\n$extra<br/>\n" .
	      "</div>\n";
}
3846
# Returns a submenu for the navigation of the refs views (tags, heads,
# remotes): the view names joined by " | ", each of them a link except
# for the current view, which is plain text.  The remotes view is listed
# only if the 'remote_heads' feature is enabled.
sub format_ref_views {
	my ($current) = @_;

	my @ref_views = ('tags', 'heads');
	if (gitweb_check_feature('remote_heads')) {
		push @ref_views, 'remotes';
	}

	my @items;
	foreach my $view (@ref_views) {
		push @items, ($view eq $current
			? $view
			: $cgi->a({-href => href(action=>$view)}, $view));
	}
	return join(" | ", @items);
}
3859
# Returns the HTML of a "first / prev / next" pager, its entries separated
# by " &sdot; ".  "first" and "prev" are links only when $page > 0, and
# "next" is a link only when $has_next_link is true; otherwise the entry
# is plain text.  Links replay the current request with another 'page'.
# $action is accepted but not used here.
sub format_paging_nav {
	my ($action, $page, $has_next_link) = @_;

	my @entries;
	if ($page > 0) {
		push @entries,
			$cgi->a({-href => href(-replay=>1, page=>undef)}, "first"),
			$cgi->a({-href => href(-replay=>1, page=>$page-1),
			         -accesskey => "p", -title => "Alt-p"}, "prev");
	} else {
		push @entries, "first", "prev";
	}

	if ($has_next_link) {
		push @entries,
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
	} else {
		push @entries, "next";
	}

	return join(" &sdot; ", @entries);
}
3885
3886 ## ......................................................................
3887 ## functions printing or outputting HTML: div
3888
# Print a div of class "header" holding a single link of class "title".
# The link leads to view $action, with 'hash' and 'hash_base' parameters
# added only when $hash / $hash_base are true.  The link text is $title,
# or $action if $title is false.
sub git_print_header_div {
	my ($action, $title, $hash, $hash_base) = @_;

	my %args = (
		'action' => $action,
		($hash      ? ('hash'      => $hash)      : ()),
		($hash_base ? ('hash_base' => $hash_base) : ()),
	);
	my $text = $title ? $title : $action;

	print "<div class=\"header\">\n" .
	      $cgi->a({-href => href(%args), -class => "title"}, $text) .
	      "\n</div>\n";
}
3902
# Returns a table row of class "metadata_url" with two cells: $name and
# $url.  Both values are inserted as given, without any escaping.
sub format_repo_url {
	my ($name, $url) = @_;

	return join('',
		'<tr class="metadata_url">',
		"<td>$name</td>",
		"<td>$url</td>",
		"</tr>\n");
}
3907
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The next parameter is the content, handled according to what ref() says:
#   'CODE'                - called, with all following parameters as arguments
#   'SCALAR'              - the referenced string is output after html escaping
#   'GLOB' / 'IO::Handle' - everything read from the handle is output
#   not a reference       - output as-is, if defined
# Content of any other kind is silently ignored.
sub git_print_section {
	my $div_args    = ref($_[0]) eq 'HASH'  ? shift : undef;
	my $header_args = ref($_[0]) eq 'ARRAY' ? shift : undef;
	my $content     = shift;

	print $cgi->start_div($div_args);
	git_print_header_div(@$header_args);

	my $kind = ref($content);
	if ($kind eq 'CODE') {
		$content->(@_);
	} elsif ($kind eq 'SCALAR') {
		print esc_html($$content);
	} elsif ($kind eq 'GLOB' || $kind eq 'IO::Handle') {
		print <$content>;
	} elsif (!$kind && defined($content)) {
		print $content;
	}

	print $cgi->end_div;
}
3945
# Returns HTML for a timestamp: the 'rfc2822' date wrapped in a span of
# class "datetime", followed by "(HH:MM TZ)" built from 'hour_local',
# 'minute_local' and 'tz_local'.  When the local hour is less than 6,
# the HH:MM part is additionally wrapped in a span of class "atnight".
# $date is a hash reference providing the keys named above.
sub format_timestamp_html {
	my $date = shift;

	my $localtime_format = $date->{'hour_local'} < 6
		? '(<span class="atnight">%02d:%02d</span> %s)'
		: '(%02d:%02d %s)';

	return join(' ',
		'<span class="datetime">' . $date->{'rfc2822'} . '</span>',
		sprintf($localtime_format,
		        @{$date}{qw(hour_local minute_local tz_local)}));
}
3960
# Outputs the author name and date in long form, inside an element of
# class "author_date": the author name (via format_search_author), the
# author date in square brackets and the author's avatar.
# $co   - commit hash reference; its author_name, author_epoch, author_tz
#         and author_email entries are used
# %opts - -tag => name of the enclosing element (defaults to 'div')
sub git_print_authorship {
	my ($co, %opts) = @_;
	my $tag = $opts{-tag} || 'div';
	my $author = $co->{'author_name'};
	my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

	my $who    = format_search_author($author, "author", esc_html($author));
	my $when   = format_timestamp_html(\%ad);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

	print "<$tag class=\"author_date\">$who [$when]$avatar</$tag>\n";
}
3975
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
# Two rows are printed per person: the first holds the role, the name and
# email, and the avatar (in a cell spanning both rows), the second the
# timestamp.
sub git_print_authorship_rows {
	my ($co, @people) = @_;
	@people = ('author', 'committer') unless @people;

	foreach my $who (@people) {
		my ($name, $email) = @{$co}{"${who}_name", "${who}_email"};
		my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

		my $identity =
			format_search_author($name, $who, esc_html($name)) . " " .
			format_search_author($email, $who, esc_html("<" . $email . ">"));
		my $avatar = git_get_avatar($email, -size => 'double');
		my $stamp  = format_timestamp_html(\%wd);

		print "<tr><td>$who</td><td>$identity</td>" .
		      "<td rowspan=\"2\">$avatar</td></tr>\n" .
		      "<tr><td></td><td>$stamp</td></tr>\n";
	}
}
4003
# Print the "page_path" div: a link to the tree root ("[project]"),
# then one 'tree' link per directory leading to $name, then the basename.
# $name - path of the object; if undefined only the root link is printed
# $type - 'blob': the basename links to the 'blob_plain' view,
#         'tree': the basename links to the 'tree' view (followed by " / "),
#         anything else (or undefined): the basename is printed as text
# $hb   - passed as 'hash_base' to every generated link
sub git_print_page_path {
	my $name = shift;
	my $type = shift;
	my $hb = shift;


	print "<div class=\"page_path\">";
	print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
	              -title => 'tree root'}, to_utf8("[$project]"));
	print " / ";
	if (defined $name) {
		my @dirname = split '/', $name;
		my $basename = pop @dirname;
		my $fullname = '';

		# each directory links to the path accumulated so far
		foreach my $dir (@dirname) {
			$fullname .= ($fullname ? '/' : '') . $dir;
			print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
			                             hash_base=>$hb),
			              -title => $fullname}, esc_path($dir));
			print " / ";
		}
		# The basename links use $name (the path we were asked to show)
		# and not the global $file_name, so that the link target always
		# agrees with the link text and title.
		if (defined $type && $type eq 'blob') {
			print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
			                             hash_base=>$hb),
			              -title => $name}, esc_path($basename));
		} elsif (defined $type && $type eq 'tree') {
			print $cgi->a({-href => href(action=>"tree", file_name=>$name,
			                             hash_base=>$hb),
			              -title => $name}, esc_path($basename));
			print " / ";
		} else {
			print esc_path($basename);
		}
	}
	print "<br/></div>\n";
}
4041
# Print the lines of a commit message as HTML, each followed by "<br/>".
# Signoff-like lines (Signed-off-by, Acked-by, Cc) are wrapped in a span
# of class "signoff"; runs of empty lines are collapsed into one, and
# empty lines directly after a printed signoff line are dropped.
# $log  - array reference with the message lines; NOTE that it is modified
#         in place: the title (on request) and leading empty lines are
#         shifted off
# %opts - -remove_title     => drop the first line of $log
#         -remove_signoff   => do not print signoff-like lines
#         -final_empty_line => end the output with a single empty line
sub git_print_log {
	my $log = shift;
	my %opts = @_;

	if ($opts{'-remove_title'}) {
		# remove title, i.e. first line of log
		shift @$log;
	}
	# remove leading empty lines
	while (defined $log->[0] && $log->[0] eq "") {
		shift @$log;
	}

	# print log
	my $signoff = 0; # last printed line was a signoff line
	my $empty = 0;   # last printed line was an empty line
	foreach my $line (@$log) {
		if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
			# A removed signoff line leaves no trace in the output, so it
			# must not change how surrounding empty lines are collapsed.
			if (! $opts{'-remove_signoff'}) {
				print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
				$signoff = 1;
				$empty = 0;
			}
			next;
		}

		# print only one empty line
		# do not print empty line after signoff
		if ($line eq "") {
			next if ($empty || $signoff);
			$empty = 1;
		} else {
			# only real content ends the "just after signoff" state;
			# resetting it earlier would make the check above useless
			$empty = 0;
			$signoff = 0;
		}

		print format_log_line_html($line) . "<br/>\n";
	}

	if ($opts{'-final_empty_line'}) {
		# end with single empty line
		print "<br/>\n" unless $empty;
	}
}
4090
# Return link target (what link points to): the complete output of
# "git cat-file blob $hash", read in one piece.
# Returns nothing if the command could not be started, or if closing
# the pipe to it reports failure.
sub git_get_link_target {
	my $hash = shift;

	# read link
	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or return;
	# with the input record separator undefined, one read gets everything
	my $link_target = do { local $/; <$fd> };
	close $fd
		or return;

	return $link_target;
}
4108
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# $link_target - content of the symbolic link
# $basedir     - directory containing the link, relative to the top tree;
#                undefined or empty for a link in the top tree itself
#
# Empty and '.' path components are dropped and '..' components are
# resolved; a '..' which would lead above the top tree makes the function
# return nothing.
sub normalize_link_target {
	my ($link_target, $basedir) = @_;

	# absolute symlinks (beginning with '/') cannot be normalized
	return if (substr($link_target, 0, 1) eq '/');

	# normalize link target to path from top (root) tree (dir);
	# test $basedir as a string, so that a directory named '0' counts
	my $path = (defined $basedir && $basedir ne '')
		? $basedir . '/' . $link_target
		: $link_target; # we are in top (root) tree (dir)

	# remove //, /./, and /../
	my @path_parts;
	foreach my $part (split('/', $path)) {
		# discard '.' and ''; a plain truth test would also discard
		# a path component named '0'
		next if ($part eq '' || $part eq '.');
		# handle '..'
		if ($part eq '..') {
			# link leads outside repository (outside top dir)
			return unless @path_parts;
			pop @path_parts;
		} else {
			push @path_parts, $part;
		}
	}

	return join('/', @path_parts);
}
4148
# print tree entry (row of git_tree), but without encompassing <tr> element
#
# $t          - hash reference describing the entry; its 'mode', 'type',
#               'hash' and 'name' values are used, and 'size' if that key
#               exists
# $basedir    - prefix put directly in front of the entry name to build
#               the 'file_name' parameter of links
# $hash_base  - if defined, passed as 'hash_base' to the links; 'history'
#               links are generated only in that case
# $have_blame - if true, blob entries get a 'blame' link
sub git_print_tree_entry {
	my ($t, $basedir, $hash_base, $have_blame) = @_;

	my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
	my $type = $t->{'type'};

	# The format of a table row is: mode list link.  Where mode is
	# the mode of the entry, list is the name of the entry, an href,
	# and link is the action links of the entry.

	print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
	print "<td class=\"size\">$t->{'size'}</td>\n" if exists $t->{'size'};

	if ($type eq "blob") {
		print "<td class=\"list\">" .
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>"$basedir$t->{'name'}", %base_key),
			        -class => "list"}, esc_path($t->{'name'}));
		# for a symbolic link, also show where it points to
		if (S_ISLNK(oct $t->{'mode'})) {
			my $link_target = git_get_link_target($t->{'hash'});
			if ($link_target) {
				my $norm_target = normalize_link_target($link_target, $basedir);
				# the target is a link only if it could be normalized
				print " -> " . (defined $norm_target
					? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
					                         file_name=>$norm_target),
					           -title => $norm_target}, esc_path($link_target))
					: esc_path($link_target));
			}
		}
		print "</td>\n";

		my @links = (
			$cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
			                       file_name=>"$basedir$t->{'name'}", %base_key)},
			        "blob"),
		);
		if ($have_blame) {
			push @links,
				$cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
				                       file_name=>"$basedir$t->{'name'}", %base_key)},
				        "blame");
		}
		if (defined $hash_base) {
			push @links,
				$cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
				                       hash=>$t->{'hash'}, file_name=>"$basedir$t->{'name'}")},
				        "history");
		}
		push @links,
			$cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
			                       file_name=>"$basedir$t->{'name'}")},
			        "raw");
		print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

	} elsif ($type eq "tree") {
		print "<td class=\"list\">";
		print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
		                             file_name=>"$basedir$t->{'name'}",
		                             %base_key)},
		              esc_path($t->{'name'}));
		print "</td>\n";

		my @links = (
			$cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
			                       file_name=>"$basedir$t->{'name'}",
			                       %base_key)},
			        "tree"),
		);
		if (defined $hash_base) {
			push @links,
				$cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
				                       file_name=>"$basedir$t->{'name'}")},
				        "history");
		}
		print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

	} else {
		# unknown object: we can only present history for it
		# (this includes 'commit' object, i.e. submodule support)
		print "<td class=\"list\">" .
		      esc_path($t->{'name'}) .
		      "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"history",
		                             hash_base=>$hash_base,
		                             file_name=>"$basedir$t->{'name'}")},
		              "history")
			if defined $hash_base;
		print "</td>\n";
	}
}
4241
4242 ## ......................................................................
4243 ## functions printing large fragments of HTML
4244
# get pre-image filenames for merge (combined) diff
#
# Sets $diff->{'from_file'} to an array with one entry per parent
# ($diff->{'nparents'} of them).  An entry is filled in, by calling
# git_get_path_by_hash() with the matching parent and 'from_id', only
# where the status for that parent is 'R' or 'C'; all other entries are
# left undefined.  Returns $diff.
sub fill_from_file_info {
	my ($diff, @parents) = @_;

	my $last = $diff->{'nparents'} - 1;

	# start from an empty list, already extended to its final size
	$diff->{'from_file'} = [ ];
	$diff->{'from_file'}[$last] = undef;

	foreach my $i (0 .. $last) {
		my $status = $diff->{'status'}[$i];
		next unless ($status eq 'R' || $status eq 'C');
		$diff->{'from_file'}[$i] =
			git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
	}

	return $diff;
}
4261
# is current raw difftree line of file deletion
# True if 'to_id' of the parsed line ($diffinfo) consists of 40 zeros.
sub is_deleted {
	my ($diffinfo) = @_;

	my $null_id = '0' x 40;
	return $diffinfo->{'to_id'} eq $null_id;
}
4268
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# True only if both are defined and have the same 'to_file'.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	my $both_defined = defined($diffinfo) && defined($patchinfo);
	return $both_defined
		&& $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4279
4280
4281 sub git_difftree_body {
4282         my ($difftree, $hash, @parents) = @_;
4283         my ($parent) = $parents[0];
4284         my $have_blame = gitweb_check_feature('blame');
4285         print "<div class=\"list_head\">\n";
4286         if ($#{$difftree} > 10) {
4287                 print(($#{$difftree} + 1) . " files changed:\n");
4288         }
4289         print "</div>\n";
4290
4291         print "<table class=\"" .
4292               (@parents > 1 ? "combined " : "") .
4293               "diff_tree\">\n";
4294
4295         # header only for combined diff in 'commitdiff' view
4296         my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
4297         if ($has_header) {
4298                 # table header
4299                 print "<thead><tr>\n" .
4300                        "<th></th><th></th>\n"; # filename, patchN link
4301                 for (my $i = 0; $i < @parents; $i++) {
4302                         my $par = $parents[$i];
4303                         print "<th>" .
4304                               $cgi->a({-href => href(action=>"commitdiff",
4305                                                      hash=>$hash, hash_parent=>$par),
4306                                        -title => 'commitdiff to parent number ' .
4307                                                   ($i+1) . ': ' . substr($par,0,7)},
4308                                       $i+1) .
4309                               "&nbsp;</th>\n";
4310                 }
4311                 print "</tr></thead>\n<tbody>\n";
4312         }
4313
4314         my $alternate = 1;
4315         my $patchno = 0;
4316         foreach my $line (@{$difftree}) {
4317                 my $diff = parsed_difftree_line($line);
4318
4319                 if ($alternate) {
4320                         print "<tr class=\"dark\">\n";
4321                 } else {
4322                         print "<tr class=\"light\">\n";
4323                 }
4324                 $alternate ^= 1;
4325
4326                 if (exists $diff->{'nparents'}) { # combined diff
4327
4328                         fill_from_file_info($diff, @parents)
4329                                 unless exists $diff->{'from_file'};
4330
4331                         if (!is_deleted($diff)) {
4332                                 # file exists in the result (child) commit
4333                                 print "<td>" .
4334                                       $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4335                                                              file_name=>$diff->{'to_file'},
4336                                                              hash_base=>$hash),
4337                                               -class => "list"}, esc_path($diff->{'to_file'})) .
4338                                       "</td>\n";
4339                         } else {
4340                                 print "<td>" .
4341                                       esc_path($diff->{'to_file'}) .
4342                                       "</td>\n";
4343                         }
4344
4345                         if ($action eq 'commitdiff') {
4346                                 # link to patch
4347                                 $patchno++;
4348                                 print "<td class=\"link\">" .
4349                                       $cgi->a({-href => href(-anchor=>"patch$patchno")},
4350                                               "patch") .
4351                                       " | " .
4352                                       "</td>\n";
4353                         }
4354
4355                         my $has_history = 0;
4356                         my $not_deleted = 0;
4357                         for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
4358                                 my $hash_parent = $parents[$i];
4359                                 my $from_hash = $diff->{'from_id'}[$i];
4360                                 my $from_path = $diff->{'from_file'}[$i];
4361                                 my $status = $diff->{'status'}[$i];
4362
4363                                 $has_history ||= ($status ne 'A');
4364                                 $not_deleted ||= ($status ne 'D');
4365
4366                                 if ($status eq 'A') {
4367                                         print "<td  class=\"link\" align=\"right\"> | </td>\n";
4368                                 } elsif ($status eq 'D') {
4369                                         print "<td class=\"link\">" .
4370                                               $cgi->a({-href => href(action=>"blob",
4371                                                                      hash_base=>$hash,
4372                                                                      hash=>$from_hash,
4373                                                                      file_name=>$from_path)},
4374                                                       "blob" . ($i+1)) .
4375                                               " | </td>\n";
4376                                 } else {
4377                                         if ($diff->{'to_id'} eq $from_hash) {
4378                                                 print "<td class=\"link nochange\">";
4379                                         } else {
4380                                                 print "<td class=\"link\">";
4381                                         }
4382                                         print $cgi->a({-href => href(action=>"blobdiff",
4383                                                                      hash=>$diff->{'to_id'},
4384                                                                      hash_parent=>$from_hash,
4385                                                                      hash_base=>$hash,
4386                                                                      hash_parent_base=>$hash_parent,
4387                                                                      file_name=>$diff->{'to_file'},
4388                                                                      file_parent=>$from_path)},
4389                                                       "diff" . ($i+1)) .
4390                                               " | </td>\n";
4391                                 }
4392                         }
4393
4394                         print "<td class=\"link\">";
4395                         if ($not_deleted) {
4396                                 print $cgi->a({-href => href(action=>"blob",
4397                                                              hash=>$diff->{'to_id'},
4398                                                              file_name=>$diff->{'to_file'},
4399                                                              hash_base=>$hash)},
4400                                               "blob");
4401                                 print " | " if ($has_history);
4402                         }
4403                         if ($has_history) {
4404                                 print $cgi->a({-href => href(action=>"history",
4405                                                              file_name=>$diff->{'to_file'},
4406                                                              hash_base=>$hash)},
4407                                               "history");
4408                         }
4409                         print "</td>\n";
4410
4411                         print "</tr>\n";
4412                         next; # instead of 'else' clause, to avoid extra indent
4413                 }
4414                 # else ordinary diff
4415
4416                 my ($to_mode_oct, $to_mode_str, $to_file_type);
4417                 my ($from_mode_oct, $from_mode_str, $from_file_type);
4418                 if ($diff->{'to_mode'} ne ('0' x 6)) {
4419                         $to_mode_oct = oct $diff->{'to_mode'};
4420                         if (S_ISREG($to_mode_oct)) { # only for regular file
4421                                 $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
4422                         }
4423                         $to_file_type = file_type($diff->{'to_mode'});
4424                 }
4425                 if ($diff->{'from_mode'} ne ('0' x 6)) {
4426                         $from_mode_oct = oct $diff->{'from_mode'};
4427                         if (S_ISREG($from_mode_oct)) { # only for regular file
4428                                 $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
4429                         }
4430                         $from_file_type = file_type($diff->{'from_mode'});
4431                 }
4432
4433                 if ($diff->{'status'} eq "A") { # created
4434                         my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
4435                         $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
4436                         $mode_chng   .= "]</span>";
4437                         print "<td>";
4438                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4439                                                      hash_base=>$hash, file_name=>$diff->{'file'}),
4440                                       -class => "list"}, esc_path($diff->{'file'}));
4441                         print "</td>\n";
4442                         print "<td>$mode_chng</td>\n";
4443                         print "<td class=\"link\">";
4444                         if ($action eq 'commitdiff') {
4445                                 # link to patch
4446                                 $patchno++;
4447                                 print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4448                                               "patch") .
4449                                       " | ";
4450                         }
4451                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4452                                                      hash_base=>$hash, file_name=>$diff->{'file'})},
4453                                       "blob");
4454                         print "</td>\n";
4455
4456                 } elsif ($diff->{'status'} eq "D") { # deleted
4457                         my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
4458                         print "<td>";
4459                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4460                                                      hash_base=>$parent, file_name=>$diff->{'file'}),
4461                                        -class => "list"}, esc_path($diff->{'file'}));
4462                         print "</td>\n";
4463                         print "<td>$mode_chng</td>\n";
4464                         print "<td class=\"link\">";
4465                         if ($action eq 'commitdiff') {
4466                                 # link to patch
4467                                 $patchno++;
4468                                 print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4469                                               "patch") .
4470                                       " | ";
4471                         }
4472                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4473                                                      hash_base=>$parent, file_name=>$diff->{'file'})},
4474                                       "blob") . " | ";
4475                         if ($have_blame) {
4476                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
4477                                                              file_name=>$diff->{'file'})},
4478                                               "blame") . " | ";
4479                         }
4480                         print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
4481                                                      file_name=>$diff->{'file'})},
4482                                       "history");
4483                         print "</td>\n";
4484
4485                 } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
4486                         my $mode_chnge = "";
4487                         if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4488                                 $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
4489                                 if ($from_file_type ne $to_file_type) {
4490                                         $mode_chnge .= " from $from_file_type to $to_file_type";
4491                                 }
4492                                 if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
4493                                         if ($from_mode_str && $to_mode_str) {
4494                                                 $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
4495                                         } elsif ($to_mode_str) {
4496                                                 $mode_chnge .= " mode: $to_mode_str";
4497                                         }
4498                                 }
4499                                 $mode_chnge .= "]</span>\n";
4500                         }
4501                         print "<td>";
4502                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4503                                                      hash_base=>$hash, file_name=>$diff->{'file'}),
4504                                       -class => "list"}, esc_path($diff->{'file'}));
4505                         print "</td>\n";
4506                         print "<td>$mode_chnge</td>\n";
4507                         print "<td class=\"link\">";
4508                         if ($action eq 'commitdiff') {
4509                                 # link to patch
4510                                 $patchno++;
4511                                 print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4512                                               "patch") .
4513                                       " | ";
4514                         } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4515                                 # "commit" view and modified file (not only mode changed)
4516                                 print $cgi->a({-href => href(action=>"blobdiff",
4517                                                              hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4518                                                              hash_base=>$hash, hash_parent_base=>$parent,
4519                                                              file_name=>$diff->{'file'})},
4520                                               "diff") .
4521                                       " | ";
4522                         }
4523                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4524                                                      hash_base=>$hash, file_name=>$diff->{'file'})},
4525                                        "blob") . " | ";
4526                         if ($have_blame) {
4527                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4528                                                              file_name=>$diff->{'file'})},
4529                                               "blame") . " | ";
4530                         }
4531                         print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4532                                                      file_name=>$diff->{'file'})},
4533                                       "history");
4534                         print "</td>\n";
4535
4536                 } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
4537                         my %status_name = ('R' => 'moved', 'C' => 'copied');
4538                         my $nstatus = $status_name{$diff->{'status'}};
4539                         my $mode_chng = "";
4540                         if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4541                                 # mode also for directories, so we cannot use $to_mode_str
4542                                 $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
4543                         }
4544                         print "<td>" .
4545                               $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
4546                                                      hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
4547                                       -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
4548                               "<td><span class=\"file_status $nstatus\">[$nstatus from " .
4549                               $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
4550                                                      hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
4551                                       -class => "list"}, esc_path($diff->{'from_file'})) .
4552                               " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
4553                               "<td class=\"link\">";
4554                         if ($action eq 'commitdiff') {
4555                                 # link to patch
4556                                 $patchno++;
4557                                 print $cgi->a({-href => href(-anchor=>"patch$patchno")},
4558                                               "patch") .
4559                                       " | ";
4560                         } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4561                                 # "commit" view and modified file (not only pure rename or copy)
4562                                 print $cgi->a({-href => href(action=>"blobdiff",
4563                                                              hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4564                                                              hash_base=>$hash, hash_parent_base=>$parent,
4565                                                              file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
4566                                               "diff") .
4567                                       " | ";
4568                         }
4569                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4570                                                      hash_base=>$parent, file_name=>$diff->{'to_file'})},
4571                                       "blob") . " | ";
4572                         if ($have_blame) {
4573                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4574                                                              file_name=>$diff->{'to_file'})},
4575                                               "blame") . " | ";
4576                         }
4577                         print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4578                                                     file_name=>$diff->{'to_file'})},
4579                                       "history");
4580                         print "</td>\n";
4581
4582                 } # we should not encounter Unmerged (U) or Unknown (X) status
4583                 print "</tr>\n";
4584         }
4585         print "</tbody>" if $has_header;
4586         print "</table>\n";
4587 }
4588
# Read "git diff" output (plain or combined) from filehandle $fd and print
# it as HTML inside <div class="patchset">, one <div class="patch"> per patch.
#
# Parameters:
#   $fd           - filehandle the patchset is read from, line by line
#   $difftree     - reference to array of raw difftree lines; entries are
#                   handed to parsed_difftree_line() as patches are matched
#   $hash         - accepted for the callers' sake; not used in this sub
#   @hash_parents - parent ids; more than one turns on combined-diff handling
#
# The first patch belonging to raw difftree entry number N (counting from 0)
# gets id="patch<N+1>"; further patches for the same entry (split patches)
# get class "patch cont" and no id.
sub git_patchset_body {
        my ($fd, $difftree, $hash, @hash_parents) = @_;

        my $is_combined = (@hash_parents > 1);
        my $patch_idx = 0;
        my $patch_number = 0;
        my $patch_line;
        my $diffinfo;
        my $to_name;
        my (%from, %to);

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        # each iteration starts with $patch_line holding a "diff ..." header;
        # at end of input $patch_line is undef and the loop ends
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # 'last' does not run the 'continue' block below,
                        # so the patch <div> has to be closed here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                $patch_line = <$fd>;
                if (!defined $patch_line) {
                        # input ended right after the "---" line, so there is
                        # no "+++" line to pair it with: close the patch <div>
                        # instead of chomp-ing and formatting an undefined value
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        print format_diff_line($patch_line, \%from, \%to);
                }

        } continue {
                # reached via 'next PATCH' or by falling off the loop body
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
4739
4740 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4741
# Fills in list info (age, description, owner, forks, ctags) for each
# project in @$projlist and returns the list of projects for which
# git_get_last_activity() returned something; the others are left out
# of the returned list.
# NOTE: the project hashes in @$projlist are modified in place, but no
# entries are removed from @$projlist itself
sub fill_project_list_info {
        my ($projlist, $check_forks) = @_;
        my $show_ctags = gitweb_check_feature('ctags');
        my @filled;

        foreach my $pr (@$projlist) {
                # no activity info: project is not included in the result
                my @activity = git_get_last_activity($pr->{'path'});
                next unless @activity;
                ($pr->{'age'}, $pr->{'age_string'}) = @activity;

                # description and owner are looked up only when not already set
                unless (defined $pr->{'descr'}) {
                        my $long_descr = git_get_project_description($pr->{'path'}) || "";
                        $long_descr = to_utf8($long_descr);
                        $pr->{'descr_long'} = $long_descr;
                        $pr->{'descr'} = chop_str($long_descr, $projects_list_description_width, 5);
                }
                unless (defined $pr->{'owner'}) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }

                if ($check_forks) {
                        # "<name>.git" has forks if directory "<name>" exists
                        # under $projectroot
                        my $pname = $pr->{'path'};
                        my $has_fork_dir = ($pname =~ s/\.git$//)
                                && ($pname !~ /\/$/)
                                && (-d "$projectroot/$pname");
                        $pr->{'forks'} = $has_fork_dir ? "-d $projectroot/$pname" : 0;
                }

                if ($show_ctags) {
                        $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
                }

                push @filled, $pr;
        }

        return @filled;
}
4782
# print the 'sort by' <th> element produced by format_sort_th();
# takes the same arguments: column name, current order, header text
sub print_sort_th {
        my ($name, $order, $header) = @_;
        print format_sort_th($name, $order, $header);
}
4788
# return 'sort by' <th> element for column $name as a string;
# $header is the text shown, defaulting to ucfirst($name).
# If $order is $name, the header is plain text, otherwise it is
# a replay link which selects sorting by $name
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # already sorted by this column: no link needed
        return "<th>$header</th>\n" if ($order eq $name);

        return "<th>" .
               $cgi->a({-href => href(-replay=>1, order=>$name),
                        -class => "header"}, $header) .
               "</th>\n";
}
4805
# Print table (class "project_list") of projects from @$projlist.
#
# Parameters:
#   $projlist  - reference to array of project hashes, filled in by
#                fill_project_list_info()
#   $order     - sort order: 'project', 'descr', 'owner' or 'age';
#                $default_projects_order is used when it is false
#   $from, $to - range of indices (after sorting) of projects to show;
#                default to 0 and to the index of the last project
#   $extra     - if defined, printed in an additional row at the bottom
#   $no_header - if true, row with column headers is not printed
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;

        my $check_forks = gitweb_check_feature('forks');
        my @projects = fill_project_list_info($projlist, $check_forks);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects unless (defined $to && $to <= $#projects);

        # which field of project hash to sort by, and how to compare it
        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );
        my $sort_by = $order_info{$order};
        if ($sort_by->{'type'} eq 'str') {
                my $field = $sort_by->{'key'};
                @projects = sort { $a->{$field} cmp $b->{$field} } @projects;
        } else {
                my $field = $sort_by->{'key'};
                @projects = sort { $a->{$field} <=> $b->{$field} } @projects;
        }

        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                # sum up tag counts over all projects for the tag cloud
                my %tag_count;
                foreach my $proj (@projects) {
                        my @tags = keys %{$proj->{'ctags'}};
                        foreach my $tag (@tags) {
                                $tag_count{$tag} += $proj->{'ctags'}->{$tag};
                        }
                }
                my $cloud = git_populate_project_tagcloud(\%tag_count);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        if (!$no_header) {
                print "<tr>\n";
                print "<th></th>\n" if $check_forks;
                foreach my $column (['project', 'Project'],
                                    ['descr',   'Description'],
                                    ['owner',   'Owner'],
                                    ['age',     'Last Change']) {
                        my ($name, $title) = @$column;
                        print_sort_th($name, $order, $title);
                }
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        my $dark_row = 1;
        my $tagfilter = $cgi->param('by_tag');
        foreach my $idx ($from .. $to) {
                my $pr = $projects[$idx];

                # skip projects which do not carry the selected tag
                if ($tagfilter && $show_ctags) {
                        next unless grep { lc $_ eq lc $tagfilter } keys %{$pr->{'ctags'}};
                }
                # skip projects where neither path nor description match search
                next if ($searchtext &&
                         $pr->{'path'} !~ /$searchtext/ &&
                         $pr->{'descr_long'} !~ /$searchtext/);
                # Weed out forks or non-matching entries of search
                if ($check_forks) {
                        my $forkbase = $project || '';
                        $forkbase =~ s#\.git$#/#;
                        $forkbase = "^$forkbase" if $forkbase;
                        next if (!$searchtext && !$tagfilter && $show_ctags &&
                                 $pr->{'path'} =~ m#$forkbase.*/.*#); # regexp-safe
                }

                # rows alternate between "dark" and "light", starting with "dark"
                my $row_start = $dark_row ? "<tr class=\"dark\">\n" : "<tr class=\"light\">\n";
                print $row_start;
                $dark_row = !$dark_row;

                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                print "<!-- $pr->{'forks'} -->\n";
                                print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "+");
                        }
                        print "</td>\n";
                }

                # project name, description and owner cells
                my $name_cell =
                        "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                          -class => "list"}, esc_html($pr->{'path'})) . "</td>\n";
                my $descr_cell =
                        "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                          -class => "list", -title => $pr->{'descr_long'}},
                                          esc_html($pr->{'descr'})) . "</td>\n";
                my $owner_cell =
                        "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";
                print "$name_cell$descr_cell$owner_cell";

                # age cell, followed by cell with links to project views
                my $age_class = age_class($pr->{'age'});
                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                my @links;
                foreach my $view (qw(summary shortlog log tree)) {
                        push @links, scalar($cgi->a({-href => href(project=>$pr->{'path'}, action=>$view)}, $view));
                }
                if ($pr->{'forks'}) {
                        push @links, scalar($cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks"));
                }
                print "<td class=\"". $age_class . "\">" .
                      $age_text . "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links) .
                      "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n";
                print "<td></td>\n" if $check_forks;
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4912
# Print body of "log" view: for each commit from @$commitlist with index
# in the $from..$to range a header div, links to other views of the commit,
# authorship info and the full commit message.
#
# Parameters:
#   $commitlist - reference to array of commit hashes; keys read directly
#                 here are 'id', 'age_string', 'title' and 'comment'
#   $from       - index of first commit to print; 0 if not defined
#   $to         - index of last commit to print; index of the last element
#                 of @$commitlist if not defined or past the end of list
#   $refs       - passed to format_ref_marker() for each commit
#   $extra      - if true, printed inside "page_nav" div after the commits
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from (like git_shortlog_body and git_history_body do),
        # and not always at the beginning of the list
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n"; # class="title_text"

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
4951
# Print table (class "shortlog") with one row for each commit from
# @$commitlist with index in the $from..$to range: date, author,
# subject and links to other views of the commit.
#   $from  - index of first commit to show; 0 if not defined
#   $to    - index of last commit to show; index of the last element of
#            @$commitlist if not defined or past the end of list
#   $refs  - passed to format_ref_marker() for each commit
#   $extra - if defined, printed in an additional row spanning 4 columns
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        my $last_idx = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last_idx unless (defined $to && $to <= $last_idx);

        print "<table class=\"shortlog\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between "dark" and "light", starting with "dark"
                my $row_start = $dark_row ? "<tr class=\"dark\">\n" : "<tr class=\"light\">\n";
                print $row_start;
                $dark_row = !$dark_row;

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                my $date_cell = "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n";
                print "" . $date_cell . format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                # links to other views of this commit
                my @links = (
                        scalar($cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit")),
                        scalar($cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff")),
                        scalar($cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree")),
                );
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links);
                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links if (defined $snapshot_links);
                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
4995
# Print table (class "history") with one row for each non-empty commit
# from @$commitlist with index in the $from..$to range.
#   $from, $to - range of indices to show; default to 0 and to the index
#                of the last element of @$commitlist
#   $refs      - passed to format_ref_marker() for each commit
#   $extra     - if defined, printed in an additional row spanning 4 columns
#   $file_name - pathname the history is shown for
#   $file_hash - compared against the blob found at $file_name in each
#                commit, to decide whether to show "diff to current" link
#   $ftype     - used both as action and as text of the first link;
#                'blob' additionally enables the "diff to current" link
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        my $last_idx = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last_idx if (!defined $to || $last_idx < $to);

        print "<table class=\"history\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;
                my $commit = $co{'id'};

                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between "dark" and "light", starting with "dark"
                my $row_start = $dark_row ? "<tr class=\"dark\">\n" : "<tr class=\"light\">\n";
                print $row_start;
                $dark_row = !$dark_row;

                my $date_cell = "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n";
        # shortlog:   format_author_html('td', \%co, 10)
                print "" . $date_cell . format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my @links = (
                        scalar($cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype)),
                        scalar($cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff")),
                );
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links);

                if ($ftype eq 'blob') {
                        # blob at $file_name as of this commit
                        my $blob_in_commit = git_get_hash_by_path($commit, $file_name);
                        my $differs = (defined $file_hash && defined $blob_in_commit &&
                                       $file_hash ne $blob_in_commit);
                        if ($differs) {
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$file_hash, hash_parent=>$blob_in_commit,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5055
# Print the "tags" table: one row for each entry of
# $taglist->[$from .. $to], followed by an optional $extra row.
#
#   $taglist   - array ref of tag entries (hash refs); the keys read here
#                are 'subject', 'age', 'name', 'id', 'type', 'reftype',
#                'refid' and 'fullname'
#   $from, $to - index range to show; $from defaults to 0, and $to is
#                clamped to the last index of $taglist
#   $extra     - optional HTML put in a trailing row spanning 5 columns
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;

	my $last_index = $#{$taglist};
	$from = 0 if !defined $from;
	$to = $last_index if (!defined $to || $last_index < $to);

	# rows alternate dark/light, starting with dark
	my @row_class = ('dark', 'light');
	my $nrows = 0;

	print qq{<table class="tags">\n};
	foreach my $idx ($from .. $to) {
		my %tag = %{$taglist->[$idx]};
		my $reftype = $tag{'reftype'};

		my $comment = $tag{'subject'};
		my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

		my $class = $row_class[$nrows % 2];
		$nrows++;
		print qq{<tr class="$class">\n};

		# age column stays empty when the age is not known
		print defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n" : "<td></td>\n";

		# tag name, linking to the object the tag refers to
		my $name_link = $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'}),
		                         -class => "list name"}, esc_html($tag{'name'}));
		print "<td>" . $name_link . "</td>\n<td>";

		if (defined $comment) {
			print format_subject_html($comment, $comment_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}

		# only entries of type "tag" get a link to the tag object itself
		print qq{</td>\n<td class="selflink">};
		print(($tag{'type'} eq "tag")
		      ? $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag")
		      : "&nbsp;");

		print qq{</td>\n<td class="link"> | } .
		      $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'})}, $reftype);
		if ($reftype eq "commit") {
			foreach my $view ("shortlog", "log") {
				print " | " . $cgi->a({-href => href(action=>$view, hash=>$tag{'fullname'})}, $view);
			}
		} elsif ($reftype eq "blob") {
			print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		print "</td>\n</tr>";
	}

	print qq{<tr>\n<td colspan="5">$extra</td>\n</tr>\n} if defined $extra;
	print "</table>\n";
}
5118
# Print the "heads" table: one row for each entry of
# $headlist->[$from .. $to], followed by an optional $extra row.
#
#   $headlist  - array ref of head entries (hash refs); the keys read here
#                are 'id', 'name', 'fullname' and 'age'
#   $head      - id of the current head; the row whose 'id' equals it gets
#                the "current_head" class.  May be undef, in which case no
#                row is marked.
#   $from, $to - index range to show; $from defaults to 0, and $to is
#                clamped to the last index of $headlist
#   $extra     - optional HTML put in a trailing row spanning 3 columns
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

	print "<table class=\"heads\">\n";
	my $alternate = 1;
	for (my $i = $from; $i <= $to; $i++) {
		my $entry = $headlist->[$i];
		my %ref = %$entry;
		# check definedness first: comparing against an undefined $head
		# would emit an "uninitialized value" warning for every row
		my $curr = defined $head && $ref{'id'} eq $head;
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td><i>$ref{'age'}</i></td>\n" .
		      ($curr ? "<td class=\"current_head\">" : "<td>") .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
		               -class => "list name"},esc_html($ref{'name'})) .
		      "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
		      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
		      "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5156
# Display a single remote block: a small table with the remote's URL(s),
# followed by the table of its heads.
#
#   $remote - remote name, used for the "..." link to the 'remotes' view
#   $rdata  - hash ref with 'heads' (array ref of head entries) and the
#             optional 'fetch' and 'push' URLs
#   $limit  - optional; passed to git_heads_body() as the last index to
#             show, and when it is below the number of heads a "..." link
#             is added as the extra row
#   $head   - passed through to git_heads_body()
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# $push may be undefined here (see the check below), so test it
		# before comparing to avoid an "uninitialized value" warning
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	# link to the full list of this remote's heads, only when truncated
	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
5190
# Display a list of remote names with the respective fetch and push URLs
#
#   $remotedata - hash ref: remote name => hash ref with optional 'fetch'
#                 and 'push' URLs
#   $limit      - optional maximum number of remotes to list; when there
#                 are more, the list is cut and a "..." link to the
#                 'remotes' view is appended
#
# Remotes are listed in sorted name order.
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	# keep only the first $limit names
	$#remotes = $limit - 1 if $limited;

	# iterate with foreach rather than "while (shift ...)": the latter
	# tests the name for truth, so a remote called "0" would end the loop
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# a URL that is not configured is shown as plain text
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
5234
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
#   $remotedata - hash ref: remote name => per-remote data (hash ref)
#   $limit      - optional; when set and smaller than the number of
#                 remotes, only the name list is shown.  Otherwise it is
#                 passed on to git_remote_block().
#   $head       - passed through to git_remote_block()
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;
	if ($limit and $limit < keys %$remotedata) {
		git_remotes_list($remotedata, $limit);
	} else {
		fill_remote_heads($remotedata);
		# Walk the remotes in sorted name order, like git_remotes_list()
		# does: the order produced by each() is unspecified, so the
		# sections could change places from one request to the next.
		foreach my $remote (sort keys %$remotedata) {
			my $rdata = $remotedata->{$remote};
			git_print_section({-class=>"remote", -id=>$remote},
				["remotes", $remote, $remote], sub {
					git_remote_block($remote, $rdata, $limit, $head);
				});
		}
	}
}
5251
# Print the "commit_search" table: one row for every non-empty commit in
# $commitlist->[$from .. $to], listing the lines of its comment that match
# the search, followed by an optional $extra row.
#
#   $commitlist - array ref of parsed commits (hash refs)
#   $from, $to  - index range to show; $from defaults to 0, and $to is
#                 clamped to the last index of $commitlist
#   $extra      - optional HTML put in a trailing row spanning 3 columns
#
# Uses global variables $cgi and $search_regexp.
sub git_search_grep_body {
	my ($commitlist, $from, $to, $extra) = @_;

	my $last_index = $#{$commitlist};
	$from = 0 if !defined $from;
	$to = $last_index if (!defined $to || $last_index < $to);

	# rows alternate dark/light, starting with dark; skipped (empty)
	# commits do not advance the alternation
	my @row_class = ('dark', 'light');
	my $nrows = 0;

	print qq{<table class="commit_search">\n};
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;

		my $class = $row_class[$nrows % 2];
		$nrows++;
		print qq{<tr class="$class">\n};

		my $age_cell = qq{<td title="$co{'age_string_age'}"><i>$co{'age_string_date'}</i></td>\n};
		my $author_cell = format_author_html('td', \%co, 15, 5);
		my $subject_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
		                            -class => "list subject"},
		                           chop_and_escape_str($co{'title'}, 50) . "<br/>");
		print $age_cell . $author_cell . "<td>" . $subject_link;

		# show each matching comment line, with the match highlighted
		# and some shortened context on both sides
		my $comment = $co{'comment'};
		foreach my $line (@$comment) {
			next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
			my ($lead, $match, $trail) = ($1, $2, $3);

			$match = chop_str($match, 70, 5, 'center');
			# split what is left of 80 columns between both sides,
			# but never more than 30 per side
			my $contextlen = int((80 - length($match))/2);
			if ($contextlen > 30) {
				$contextlen = 30;
			}
			$lead  = chop_str($lead,  $contextlen, 10, 'left');
			$trail = chop_str($trail, $contextlen, 10, 'right');

			$lead  = esc_html($lead);
			$match = esc_html($match);
			$trail = esc_html($trail);

			print $lead . qq{<span class="match">} . $match . "</span>" . $trail . "<br />";
		}

		my $commit_link =
			$cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit");
		my $commitdiff_link =
			$cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff");
		my $tree_link =
			$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
		print qq{</td>\n<td class="link">} .
		      $commit_link . " | " . $commitdiff_link . " | " . $tree_link;
		print "</td>\n</tr>\n";
	}

	print qq{<tr>\n<td colspan="3">$extra</td>\n</tr>\n} if defined $extra;
	print "</table>\n";
}
5311
5312 ## ======================================================================
5313 ## ======================================================================
5314 ## actions
5315
# Print the page listing all projects: the optional $home_text file, a
# project search form, and the project table.
#
# Reads the 'order' input parameter; fails with 400 when it is not one of
# the known sort orders, and with 404 when there are no projects.
sub git_project_list {
	my $order = $input_params{'order'};
	# The pattern is anchored so that the whole value has to be one of the
	# known orders; unanchored, any string merely containing one of them
	# (e.g. "xagex") would pass the check.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list();
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}
	print $cgi->startform(-method => "get") .
	      "<p class=\"projsearch\">Search:\n" .
	      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
	      "</p>" .
	      $cgi->end_form() . "\n";
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5341
# Print the page listing the forks of the current $project.
#
# Reads the 'order' input parameter; fails with 400 when it is not one of
# the known sort orders, and with 404 when no forks are found.
sub git_forks {
	my $order = $input_params{'order'};
	# The pattern is anchored so that the whole value has to be one of the
	# known orders; unanchored, any string merely containing one of them
	# (e.g. "xagex") would pass the check.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	git_print_header_div('summary', "$project forks");
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5359
# Print a plain-text project index: one "<path> <owner>" line for each
# project returned by git_get_projects_list(), with both fields
# percent-encoded.  A missing owner is looked up and stored in the entry.
sub git_project_index {
	my @projects = git_get_projects_list($project);

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	foreach my $pr (@projects) {
		$pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
			unless exists $pr->{'owner'};

		my ($path, $owner) = ($pr->{'path'}, $pr->{'owner'});
		# the loop variable aliases $path and $owner in turn, so both
		# copies are encoded in place
		foreach my $field ($path, $owner) {
			# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
			$field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
			$field =~ s/ /\+/g;
		}

		print "$path $owner\n";
	}
}
5383
# Print the summary page of the current $project: a metadata table
# (description, owner, last change, repository URLs, optional content
# tags), the optional README.html, and short lists of recent commits,
# tags, heads, remotes and forks, each with a "..." link when it has more
# entries than are shown.
sub git_summary {
	# index of the last entry shown in each of the short lists (0..15)
	my $last_shown = 15;

	my $descr = git_get_project_description($project) || "none";
	my %co = parse_commit("HEAD");
	my %cd;
	%cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
	my $head = $co{'id'};
	my $show_remotes = gitweb_check_feature('remote_heads');

	my $owner = git_get_project_owner($project);

	my $refs = git_get_references();
	# These get_*_list functions return one more to allow us to see if
	# there are more ...
	my @taglist  = git_get_tags_list($last_shown + 1);
	my @headlist = git_get_heads_list($last_shown + 1);
	my %remotedata;
	%remotedata = git_get_remotes_list() if $show_remotes;
	my @forklist;
	@forklist = git_get_projects_list($project) if gitweb_check_feature('forks');

	# "..." link to the full view named $action, or undef when the list
	# has no entries beyond the shown ones.  Always yields exactly one
	# value, so it can be used directly inside an argument list.
	my $more_link = sub {
		my ($list, $action) = @_;
		return $#{$list} <= $last_shown
			? undef
			: $cgi->a({-href => href(action=>$action)}, "...");
	};

	git_header_html();
	git_print_page_nav('summary','', $head);

	print qq{<div class="title">&nbsp;</div>\n};
	print qq{<table class="projects_list">\n};
	foreach my $row (['desc', 'description', $descr],
	                 ['owner', 'owner', $owner]) {
		my ($id, $label, $value) = @$row;
		print qq{<tr id="metadata_$id"><td>$label</td><td>} .
		      esc_html($value) . "</td></tr>\n";
	}
	if (defined $cd{'rfc2822'}) {
		my $last_change = format_timestamp_html(\%cd);
		print qq{<tr id="metadata_lchange"><td>last change</td><td>} .
		      $last_change . "</td></tr>\n";
	}

	# use per project git URL list in $projectroot/$project/cloneurl
	# or make project git URL from git base URL and project name
	my @url_list = git_get_project_url_list($project);
	if (!@url_list) {
		@url_list = map { "$_/$project" } @git_base_url_list;
	}
	# only the first URL row carries the "URL" label
	my $url_label = "URL";
	foreach my $git_url (grep { $_ } @url_list) {
		print format_repo_url($url_label, $git_url);
		$url_label = "";
	}

	# Tag cloud
	my $ctags_action = gitweb_check_feature('ctags');
	if ($ctags_action) {
		my $ctags = git_get_project_ctags($project);
		my $cloud = git_populate_project_tagcloud($ctags);
		my $next_cell = "</td>\n<td>";

		print qq{<tr id="metadata_ctags"><td>Content tags:<br />};
		# the "Add" form goes into the second cell when there are no
		# tags yet, and stays in the first cell otherwise
		my $has_ctags = %$ctags ? 1 : 0;
		print $next_cell if !$has_ctags;
		print qq{<form action="$ctags_action" method="post"><input type="hidden" name="p" value="$project" />Add: <input type="text" name="t" size="8" /></form>};
		print $next_cell if $has_ctags;
		print git_show_project_tagcloud($cloud, 48);
		print "</td></tr>";
	}

	print "</table>\n";

	# If XSS prevention is on, we don't include README.html.
	# TODO: Allow a readme in some safe format.
	my $readme = "$projectroot/$project/README.html";
	if (!$prevent_xss && -s $readme) {
		print qq{<div class="title">readme</div>\n<div class="readme">\n};
		insert_file($readme);
		print "\n</div>\n"; # class="readme"
	}

	# we need to request one more than 16 (0..15) to check if
	# those 16 are all
	my @commitlist;
	@commitlist = parse_commits($head, $last_shown + 2) if $head;
	if (@commitlist) {
		git_print_header_div('shortlog');
		git_shortlog_body(\@commitlist, 0, $last_shown, $refs,
		                  $more_link->(\@commitlist, "shortlog"));
	}

	if (@taglist) {
		git_print_header_div('tags');
		git_tags_body(\@taglist, 0, $last_shown,
		              $more_link->(\@taglist, "tags"));
	}

	if (@headlist) {
		git_print_header_div('heads');
		git_heads_body(\@headlist, $head, 0, $last_shown,
		               $more_link->(\@headlist, "heads"));
	}

	if (%remotedata) {
		git_print_header_div('remotes');
		git_remotes_body(\%remotedata, 15, $head);
	}

	if (@forklist) {
		git_print_header_div('forks');
		git_project_list_body(\@forklist, 'age', 0, $last_shown,
		                      $more_link->(\@forklist, "forks"),
		                      'no_header');
	}

	git_footer_html();
}
5492
# Print the page for the tag object $hash: a header table linking to the
# tagged object, the authorship rows when the tag has an author, and the
# tag message.  Fails with 404 when parse_tag() returns nothing.
sub git_tag {
	my %tag = parse_tag($hash);
	die_error(404, "Unknown tag object") unless %tag;

	my $head = git_get_head_hash($project);
	git_header_html();
	git_print_page_nav('','', $head,undef,$head);
	git_print_header_div('commit', esc_html($tag{'name'}), $hash);

	# the tagged object is linked twice: once by its id, once by its type
	my $object_link =
		$cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
		        $tag{'object'});
	my $type_link =
		$cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
		        $tag{'type'});

	print qq{<div class="title_text">\n} .
	      qq{<table class="object_header">\n} .
	      "<tr>\n" .
	      "<td>object</td>\n" .
	      "<td>" . $object_link . "</td>\n" .
	      qq{<td class="link">} . $type_link . "</td>\n" .
	      "</tr>\n";
	git_print_authorship_rows(\%tag, 'author') if defined($tag{'author'});
	print "</table>\n\n</div>\n";

	# tag message, one escaped line per <br/>
	print qq{<div class="page_body">};
	foreach my $line (@{$tag{'comment'}}) {
		chomp $line;
		print esc_html($line, -nbsp=>1) . "<br/>\n";
	}
	print "</div>\n";
	git_footer_html();
}
5527
5528 sub git_blame_common {
5529         my $format = shift || 'porcelain';
5530         if ($format eq 'porcelain' && $cgi->param('js')) {
5531                 $format = 'incremental';
5532                 $action = 'blame_incremental'; # for page title etc
5533         }
5534
5535         # permissions
5536         gitweb_check_feature('blame')
5537                 or die_error(403, "Blame view not allowed");
5538
5539         # error checking
5540         die_error(400, "No file name given") unless $file_name;
5541         $hash_base ||= git_get_head_hash($project);
5542         die_error(404, "Couldn't find base commit") unless $hash_base;
5543         my %co = parse_commit($hash_base)
5544                 or die_error(404, "Commit not found");
5545         my $ftype = "blob";
5546         if (!defined $hash) {
5547                 $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
5548                         or die_error(404, "Error looking up file");
5549         } else {
5550                 $ftype = git_get_type($hash);
5551                 if ($ftype !~ "blob") {
5552                         die_error(400, "Object is not a blob");
5553                 }
5554         }
5555
5556         my $fd;
5557         if ($format eq 'incremental') {
5558                 # get file contents (as base)
5559                 open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
5560                         or die_error(500, "Open git-cat-file failed");
5561         } elsif ($format eq 'data') {
5562                 # run git-blame --incremental
5563                 open $fd, "-|", git_cmd(), "blame", "--incremental",
5564                         $hash_base, "--", $file_name
5565                         or die_error(500, "Open git-blame --incremental failed");
5566         } else {
5567                 # run git-blame --porcelain
5568                 open $fd, "-|", git_cmd(), "blame", '-p',
5569                         $hash_base, '--', $file_name
5570                         or die_error(500, "Open git-blame --porcelain failed");
5571         }
5572
5573         # incremental blame data returns early
5574         if ($format eq 'data') {
5575                 print $cgi->header(
5576                         -type=>"text/plain", -charset => "utf-8",
5577                         -status=> "200 OK");
5578                 local $| = 1; # output autoflush
5579                 print while <$fd>;
5580                 close $fd
5581                         or print "ERROR $!\n";
5582
5583                 print 'END';
5584                 if (defined $t0 && gitweb_check_feature('timed')) {
5585                         print ' '.
5586                               tv_interval($t0, [ gettimeofday() ]).
5587                               ' '.$number_of_git_cmds;
5588                 }
5589                 print "\n";
5590
5591                 return;
5592         }
5593
5594         # page header
5595         git_header_html();
5596         my $formats_nav =
5597                 $cgi->a({-href => href(action=>"blob", -replay=>1)},
5598                         "blob") .
5599                 " | ";
5600         if ($format eq 'incremental') {
5601                 $formats_nav .=
5602                         $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
5603                                 "blame") . " (non-incremental)";
5604         } else {
5605                 $formats_nav .=
5606                         $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
5607                                 "blame") . " (incremental)";
5608         }
5609         $formats_nav .=
5610                 " | " .
5611                 $cgi->a({-href => href(action=>"history", -replay=>1)},
5612                         "history") .
5613                 " | " .
5614                 $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
5615                         "HEAD");
5616         git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
5617         git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
5618         git_print_page_path($file_name, $ftype, $hash_base);
5619
5620         # page body
5621         if ($format eq 'incremental') {
5622                 print "<noscript>\n<div class=\"error\"><center><b>\n".
5623                       "This page requires JavaScript to run.\n Use ".
5624                       $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
5625                               'this page').
5626                       " instead.\n".
5627                       "</b></center></div>\n</noscript>\n";
5628
5629                 print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
5630         }
5631
5632         print qq!<div class="page_body">\n!;
5633         print qq!<div id="progress_info">... / ...</div>\n!
5634                 if ($format eq 'incremental');
5635         print qq!<table id="blame_table" class="blame" width="100%">\n!.
5636               #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
5637               qq!<thead>\n!.
5638               qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
5639               qq!</thead>\n!.
5640               qq!<tbody>\n!;
5641
5642         my @rev_color = qw(light dark);
5643         my $num_colors = scalar(@rev_color);
5644         my $current_color = 0;
5645
5646         if ($format eq 'incremental') {
5647                 my $color_class = $rev_color[$current_color];
5648
5649                 #contents of a file
5650                 my $linenr = 0;
5651         LINE:
5652                 while (my $line = <$fd>) {
5653                         chomp $line;
5654                         $linenr++;
5655
5656                         print qq!<tr id="l$linenr" class="$color_class">!.
5657                               qq!<td class="sha1"><a href=""> </a></td>!.
5658                               qq!<td class="linenr">!.
5659                               qq!<a class="linenr" href="">$linenr</a></td>!;
5660                         print qq!<td class="pre">! . esc_html($line) . "</td>\n";
5661                         print qq!</tr>\n!;
5662                 }
5663
5664         } else { # porcelain, i.e. ordinary blame
5665                 my %metainfo = (); # saves information about commits
5666
5667                 # blame data
5668         LINE:
5669                 while (my $line = <$fd>) {
5670                         chomp $line;
5671                         # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
5672                         # no <lines in group> for subsequent lines in group of lines
5673                         my ($full_rev, $orig_lineno, $lineno, $group_size) =
5674                            ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
5675                         if (!exists $metainfo{$full_rev}) {
5676                                 $metainfo{$full_rev} = { 'nprevious' => 0 };
5677                         }
5678                         my $meta = $metainfo{$full_rev};
5679                         my $data;
5680                         while ($data = <$fd>) {
5681                                 chomp $data;
5682                                 last if ($data =~ s/^\t//); # contents of line
5683                                 if ($data =~ /^(\S+)(?: (.*))?$/) {
5684                                         $meta->{$1} = $2 unless exists $meta->{$1};
5685                                 }
5686                                 if ($data =~ /^previous /) {
5687                                         $meta->{'nprevious'}++;
5688                                 }
5689                         }
5690                         my $short_rev = substr($full_rev, 0, 8);
5691                         my $author = $meta->{'author'};
5692                         my %date =
5693                                 parse_date($meta->{'author-time'}, $meta->{'author-tz'});
5694                         my $date = $date{'iso-tz'};
5695                         if ($group_size) {
5696                                 $current_color = ($current_color + 1) % $num_colors;
5697                         }
5698                         my $tr_class = $rev_color[$current_color];
5699                         $tr_class .= ' boundary' if (exists $meta->{'boundary'});
5700                         $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
5701                         $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
5702                         print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
5703                         if ($group_size) {
5704                                 print "<td class=\"sha1\"";
5705                                 print " title=\"". esc_html($author) . ", $date\"";
5706                                 print " rowspan=\"$group_size\"" if ($group_size > 1);
5707                                 print ">";
5708                                 print $cgi->a({-href => href(action=>"commit",
5709                                                              hash=>$full_rev,
5710                                                              file_name=>$file_name)},
5711                                               esc_html($short_rev));
5712                                 if ($group_size >= 2) {
5713                                         my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
5714                                         if (@author_initials) {
5715                                                 print "<br />" .
5716                                                       esc_html(join('', @author_initials));
5717                                                 #           or join('.', ...)
5718                                         }
5719                                 }
5720                                 print "</td>\n";
5721                         }
5722                         # 'previous' <sha1 of parent commit> <filename at commit>
5723                         if (exists $meta->{'previous'} &&
5724                             $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
5725                                 $meta->{'parent'} = $1;
5726                                 $meta->{'file_parent'} = unquote($2);
5727                         }
5728                         my $linenr_commit =
5729                                 exists($meta->{'parent'}) ?
5730                                 $meta->{'parent'} : $full_rev;
5731                         my $linenr_filename =
5732                                 exists($meta->{'file_parent'}) ?
5733                                 $meta->{'file_parent'} : unquote($meta->{'filename'});
5734                         my $blamed = href(action => 'blame',
5735                                           file_name => $linenr_filename,
5736                                           hash_base => $linenr_commit);
5737                         print "<td class=\"linenr\">";
5738                         print $cgi->a({ -href => "$blamed#l$orig_lineno",
5739                                         -class => "linenr" },
5740                                       esc_html($lineno));
5741                         print "</td>";
5742                         print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
5743                         print "</tr>\n";
5744                 } # end while
5745
5746         }
5747
5748         # footer
5749         print "</tbody>\n".
5750               "</table>\n"; # class="blame"
5751         print "</div>\n";   # class="blame_body"
5752         close $fd
5753                 or print "Reading blob failed\n";
5754
5755         git_footer_html();
5756 }
5757
# Action handler for the 'blame' view: calls git_blame_common()
# without a format argument.
sub git_blame {
	return git_blame_common();
}
5761
# Action handler for the 'blame_incremental' view: calls
# git_blame_common() with the 'incremental' format.
sub git_blame_incremental {
	return git_blame_common('incremental');
}
5765
# Action handler for the 'blame_data' view: calls git_blame_common()
# with the 'data' format.
sub git_blame_data {
	return git_blame_common('data');
}
5769
# Action handler for the 'tags' view: prints the page header and
# navigation, the tags table (only when the project has tags), and
# the page footer.
sub git_tags {
	my $head_hash = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('', '', $head_hash, undef, $head_hash,
	                   format_ref_views('tags'));
	git_print_header_div('summary', $project);

	my @tags = git_get_tags_list();
	git_tags_body(\@tags) if @tags;

	git_footer_html();
}
5782
# Action handler for the 'heads' view: prints the page header and
# navigation, the heads table (only when the project has heads), and
# the page footer.  The HEAD hash is passed on to git_heads_body().
sub git_heads {
	my $head_hash = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('', '', $head_hash, undef, $head_hash,
	                   format_ref_views('heads'));
	git_print_header_div('summary', $project);

	my @heads = git_get_heads_list();
	git_heads_body(\@heads, $head_hash) if @heads;

	git_footer_html();
}
5795
# Action handler for the 'remotes' view.  Serves two pages: the view of
# a single remote (when the 'hash' input parameter names one) and the
# list of all remotes (when it is not given).
#
# Fails with 403 when the 'remote_heads' feature is off, 500 when remote
# information cannot be obtained, and 404 when nothing was found.
sub git_remotes {
	unless (gitweb_check_feature('remote_heads')) {
		die_error(403, "Remote heads view is disabled");
	}

	my $head_hash   = git_get_head_hash($project);
	my $remote_name = $input_params{'hash'};

	my $remotes = git_get_remotes_list($remote_name);
	defined $remotes
		or die_error(500, "Unable to get remote information");

	if (!%$remotes) {
		my $message = defined $remote_name
			? "Remote $remote_name not found"
			: "No remotes found";
		die_error(404, $message);
	}

	git_header_html(undef, undef, -action_extra => $remote_name);
	# in the single-remote view no entry of the ref views is "current"
	my $current_view = $remote_name ? '' : 'remotes';
	git_print_page_nav('', '', $head_hash, undef, $head_hash,
	                   format_ref_views($current_view));

	fill_remote_heads($remotes);
	if (defined $remote_name) {
		git_print_header_div('remotes', "$remote_name remote for $project");
		git_remote_block($remote_name, $remotes->{$remote_name},
		                 undef, $head_hash);
	} else {
		git_print_header_div('summary', "$project remotes");
		git_remotes_body($remotes, undef, $head_hash);
	}

	git_footer_html();
}
5828
# Serve the raw contents of a blob ('blob_plain' action).
#
# The optional first argument is a content type; it is handed to
# blob_contenttype() together with the open pipe and the file name, and
# the value returned from there is what ends up in the HTTP header.
#
# The blob is taken from the global $hash.  When $hash is not set it is
# looked up by $file_name in $hash_base (or in the project's HEAD when
# $hash_base is false); a missing file name is a 400 error, a file that
# cannot be found is a 404 error.
sub git_blob_plain {
	my $type = shift;
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Open git-cat-file blob '$hash' failed");

	# content-type (can include charset)
	$type = blob_contenttype($fd, $file_name, $type);

	# "save as" filename, even when no $file_name is given
	my $save_as = "$hash";
	if (defined $file_name) {
		$save_as = $file_name;
	} elsif ($type =~ m/^text\//) {
		$save_as .= '.txt';
	}
	# The name goes into a quoted string in the header below, so double
	# quotes and backslashes in it have to be backslash-escaped (the same
	# escaping git_snapshot applies to its file name).
	$save_as =~ s/(["\\])/\\$1/g;

	# With XSS prevention on, blobs of all types except a few known safe
	# ones are served with "Content-Disposition: attachment" to make sure
	# they don't run in our security domain.  For certain image types,
	# blob view writes an <img> tag referring to blob_plain view, and we
	# want to be sure not to break that by serving the image as an
	# attachment (though Firefox 3 doesn't seem to care).
	#
	# $type may carry parameters after the media type (e.g. a charset),
	# so the safe media type must be allowed to be followed by ' ' or ';'
	# and not only by the end of the string.
	my $sandbox = $prevent_xss &&
		$type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

	print $cgi->header(
		-type => $type,
		-expires => $expires,
		-content_disposition =>
			($sandbox ? 'attachment' : 'inline')
			. '; filename="' . $save_as . '"');
	# slurp the whole blob and write it out without any encoding layer
	local $/ = undef;
	binmode STDOUT, ':raw';
	print <$fd>;
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
5881
# Action handler for the 'blob' view: show a blob as an HTML page.
#
# The blob is taken from the global $hash, or looked up by $file_name in
# $hash_base (or the project's HEAD) when $hash is not set.  Depending
# on the mimetype reported by blob_mimetype():
#  - gif/png/jpeg images are shown via an <img> tag whose source is the
#    'blob_plain' view of the same blob;
#  - content that is neither text/* nor one of those images and that
#    tests as binary (-B) is handed over to git_blob_plain();
#  - everything else is printed line by line, each line with a numbered
#    anchor ("l<N>"), optionally run through the syntax highlighter.
sub git_blob {
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	my $have_blame = gitweb_check_feature('blame');
	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Couldn't cat $file_name, $hash");
	my $mimetype = blob_mimetype($fd, $file_name);
	# use 'blob_plain' (aka 'raw') view for files that cannot be displayed
	if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
		close $fd;
		return git_blob_plain($mimetype);
	}
	# we can have blame only for text/* mimetype
	$have_blame &&= ($mimetype =~ m!^text/!);

	my $highlight = gitweb_check_feature('highlight');
	my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
	# when a syntax was guessed, read from the highlighter's output instead
	$fd = run_highlighter($fd, $highlight, $syntax)
		if $syntax;

	git_header_html(undef, $expires);
	my $formats_nav = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		if (defined $file_name) {
			if ($have_blame) {
				$formats_nav .=
					$cgi->a({-href => href(action=>"blame", -replay=>1)},
					        "blame") .
					" | ";
			}
			$formats_nav .=
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history") .
				" | " .
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw") .
				" | " .
				$cgi->a({-href => href(action=>"blob",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		} else {
			$formats_nav .=
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw");
		}
		git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
		git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
	} else {
		# no usable commit context: empty navigation, blob id as the title
		print "<div class=\"page_nav\">\n" .
		      "<br/><br/></div>\n" .
		      "<div class=\"title\">".esc_html($hash)."</div>\n";
	}
	git_print_page_path($file_name, "blob", $hash_base);
	print "<div class=\"page_body\">\n";
	if ($mimetype =~ m!^image/!) {
		print qq!<img type="!.esc_attr($mimetype).qq!"!;
		if ($file_name) {
			print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
		}
		# the URL is an attribute value too, so escape it like the others
		print qq! src="! .
		      esc_attr(href(action=>"blob_plain", hash=>$hash,
		                    hash_base=>$hash_base, file_name=>$file_name)) .
		      qq!" />\n!;
	} else {
		# The link target of the line numbers is the same for every line;
		# build and escape it once instead of once per line.
		my $self_link = esc_attr(href(-replay => 1));
		my $nr;
		while (my $line = <$fd>) {
			chomp $line;
			$nr++;
			$line = untabify($line);
			# highlighter output is printed as is; plain text is escaped
			printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
			       $nr, $self_link, $nr, $nr, $syntax ? $line : esc_html($line, -nbsp=>1);
		}
	}
	close $fd
		or print "Reading blob failed.\n";
	print "</div>";
	git_footer_html();
}
5973
# Action handler for the 'tree' view: list the entries of a tree object.
#
# $hash_base defaults to "HEAD".  When $hash is not set, the tree is
# looked up by $file_name in $hash_base, or is $hash_base itself when no
# file name was given.  A tree that cannot be determined or read is a
# 404 error.  Rows alternate between the "dark" and "light" classes,
# and a ".." row is added first when there is a parent directory.
sub git_tree {
	$hash_base = "HEAD" unless defined $hash_base;
	if (!defined $hash) {
		$hash = defined $file_name
			? git_get_hash_by_path($hash_base, $file_name, "tree")
			: $hash_base;
	}
	defined($hash)
		or die_error(404, "No such tree");

	my $show_sizes = gitweb_check_feature('show-sizes');
	my $have_blame = gitweb_check_feature('blame');

	# read the NUL-separated output of git-ls-tree, one entry per record
	my @entries = ();
	{
		local $/ = "\0";
		open my $fd, "-|", git_cmd(), "ls-tree", '-z',
			($show_sizes ? '-l' : ()), @extra_options, $hash
			or die_error(500, "Open git-ls-tree failed");
		@entries = <$fd>;
		chomp @entries;
		close $fd
			or die_error(404, "Reading tree failed");
	}

	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $hash_base);
	git_header_html();
	my $basedir = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		my @views_nav = ();
		if (defined $file_name) {
			push @views_nav,
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history"),
				$cgi->a({-href => href(action=>"tree",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		}
		my $snapshot_links = format_snapshot_links($hash);
		# FIXME: Should be available when we have no hash base as well.
		push @views_nav, $snapshot_links
			if defined $snapshot_links;
		git_print_page_nav('tree','', $hash_base, undef, undef,
		                   join(' | ', @views_nav));
		git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
	} else {
		# $hash_base does not parse as a commit: forget it and show
		# just the tree id as the title
		undef $hash_base;
		print "<div class=\"page_nav\">\n";
		print "<br/><br/></div>\n";
		print "<div class=\"title\">".esc_html($hash)."</div>\n";
	}
	if (defined $file_name) {
		$basedir = $file_name;
		$basedir .= '/'
			if ($basedir ne '' && substr($basedir, -1) ne '/');
		git_print_page_path($file_name, 'tree', $hash_base);
	}
	print "<div class=\"page_body\">\n";
	print "<table class=\"tree\">\n";
	my $alternate = 1;
	# '..' (top directory) link if possible
	if (defined $hash_base &&
	    defined $file_name && $file_name =~ m![^/]+$!) {
		my $row_class = $alternate ? 'dark' : 'light';
		print "<tr class=\"$row_class\">\n";
		$alternate ^= 1;

		# strip the last path component; an empty result means the
		# parent is the top tree, which is addressed without a file name
		my $up = $file_name;
		$up =~ s!/?[^/]+$!!;
		$up = undef if !$up;
		# based on git_print_tree_entry
		print '<td class="mode">' . mode_str('040000') . "</td>\n";
		if ($show_sizes) {
			print '<td class="size">&nbsp;</td>'."\n";
		}
		print '<td class="list">';
		print $cgi->a({-href => href(action=>"tree",
		                             hash_base=>$hash_base,
		                             file_name=>$up)},
		              "..");
		print "</td>\n";
		print "<td class=\"link\"></td>\n";

		print "</tr>\n";
	}
	foreach my $entry (@entries) {
		my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

		my $row_class = $alternate ? 'dark' : 'light';
		print "<tr class=\"$row_class\">\n";
		$alternate ^= 1;

		git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

		print "</tr>\n";
	}
	print "</table>\n" .
	      "</div>";
	git_footer_html();
}
6083
# Build the base name used for snapshots: "<project>-<version>".
#
# Parameters: ($project, $hash).
# Returns the name in scalar context, and the pair ($name, $name) in
# list context.
sub snapshot_name {
	my ($project, $hash) = @_;

	# project part:
	#   path/to/project.git  -> project
	#   path/to/project/.git -> project
	my $name = to_utf8($project);
	$name =~ s,([^/])/*\.git$,$1,;
	$name = basename($name);
	# sanitize name
	$name =~ s/[[:cntrl:]]/?/g;

	# version part
	my $ver = $hash;
	if ($hash =~ /^[0-9a-fA-F]+$/) {
		# shorten SHA-1 hash
		my $full_hash = git_get_full_hash($project, $hash);
		if ($full_hash =~ /^$hash/ && length($hash) > 7) {
			$ver = git_get_short_hash($project, $hash);
		}
	} elsif ($hash =~ m!^refs/tags/(.*)$!) {
		# tags don't need shortened SHA-1 hash
		$ver = $1;
	} else {
		# branches and other need shortened SHA-1 hash
		$ver = $1
			if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!);
		$ver .= '-' . git_get_short_hash($project, $hash);
	}
	# in case of hierarchical branch names
	$ver =~ tr!/!.!;

	# name = project-version_string
	$name .= "-$ver";

	return $name unless wantarray;
	return ($name, $name);
}
6120
# Action handler for the 'snapshot' view: send an archive of the
# tree-ish in the global $hash, produced by git-archive and, for
# formats that define one, piped through a compressor.
#
# The format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  Errors:
#   403 - snapshots are off, or the format is disabled / not offered
#   400 - malformed or unknown format, or the object is a blob
#   404 - the object does not exist
#   500 - the archive command could not be started
sub git_snapshot {
	my $format = $input_params{'snapshot_format'};
	if (!@snapshot_fmts) {
		die_error(403, "Snapshots not allowed");
	}
	# default to first supported snapshot format
	$format ||= $snapshot_fmts[0];
	if ($format !~ m/^[a-z0-9]+$/) {
		die_error(400, "Invalid snapshot format parameter");
	} elsif (!exists($known_snapshot_formats{$format})) {
		die_error(400, "Unknown snapshot format");
	} elsif ($known_snapshot_formats{$format}{'disabled'}) {
		die_error(403, "Snapshot format not allowed");
	} elsif (!grep($_ eq $format, @snapshot_fmts)) {
		die_error(403, "Unsupported snapshot format");
	}

	# "^{}" peels tags, so a tag is judged by the object it points to
	my $type = git_get_type("$hash^{}");
	if (!$type) {
		die_error(404, 'Object does not exist');
	}  elsif ($type eq 'blob') {
		die_error(400, 'Object is not a tree-ish');
	}

	my ($name, $prefix) = snapshot_name($project, $hash);
	my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
	my $cmd = quote_command(
		git_cmd(), 'archive',
		"--format=$known_snapshot_formats{$format}{'format'}",
		"--prefix=$prefix/", $hash);
	if (exists $known_snapshot_formats{$format}{'compressor'}) {
		$cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
	}

	# Start the command before any header is sent: if it cannot be
	# started, die_error() can then still produce a proper 500 response
	# instead of appending an error page to a "200 OK" header.
	open my $fd, "-|", $cmd
		or die_error(500, "Execute git-archive failed");

	# escape for use inside the quoted string of the header
	$filename =~ s/(["\\])/\\$1/g;
	print $cgi->header(
		-type => $known_snapshot_formats{$format}{'type'},
		-content_disposition => 'inline; filename="' . $filename . '"',
		-status => '200 OK');

	binmode STDOUT, ':raw';
	# Copy the archive in fixed-size chunks; reading it with <$fd> in
	# list context would first load the whole archive into memory.
	my $chunk;
	while (read($fd, $chunk, 65536)) {
		print $chunk;
	}
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
6168
# Common implementation of log-like views.
#
# Parameters:
#   $fmt_name  - name of the view, passed to the paging and page
#                navigation helpers
#   $body_subr - code reference that prints the list of commits
#   $base      - revision to start from (defaults to the HEAD hash)
#   $parent    - if defined, the range "$parent..$base" is listed
#   $file_name - if defined, limit to this path (with --full-history)
#   $file_hash - object id of the path; looked up in the listed commits
#                when not given
#
# One page is 100 commits; 101 are requested so that the presence of a
# further page can be detected.
sub git_log_generic {
	my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

	my $head = git_get_head_hash($project);
	$base = $head unless defined $base;
	$page = 0     unless defined $page;
	my $refs = git_get_references();

	my $commit_hash = defined $parent ? "$parent..$base" : $base;
	my @commitlist =
		parse_commits($commit_hash, 101, (100 * $page),
		              defined $file_name ? ($file_name, "--full-history") : ());

	if (!defined $file_hash && defined $file_name) {
		# some commits could have deleted file in question,
		# and not have it in tree, but one of them has to have it
		foreach my $commit (@commitlist) {
			$file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
			last if defined $file_hash;
		}
	}
	my $ftype;
	$ftype = git_get_type($file_hash)
		if defined $file_hash;
	die_error(500, "Unknown type of object")
		if (defined $file_name && !defined $ftype);

	my %co;
	if (defined $file_name) {
		%co = parse_commit($base)
			or die_error(404, "Unknown commit object");
	}

	# a 101st commit means that there is at least one more page
	my $has_next_page = $#commitlist >= 100;
	my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
	my $next_link = '';
	if ($has_next_page) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
	}
	my $patch_max = gitweb_get_feature('patches');
	if ($patch_max && !defined $file_name &&
	    ($patch_max < 0 || @commitlist <= $patch_max)) {
		$paging_nav .= " &sdot; " .
			$cgi->a({-href => href(action=>"patches", -replay=>1)},
			        "patches");
	}

	git_header_html();
	git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
	if (defined $file_name) {
		git_print_header_div('commit', esc_html($co{'title'}), $base);
		git_print_page_path($file_name, $ftype, $hash_base);
	} else {
		git_print_header_div('summary', $project);
	}

	$body_subr->(\@commitlist, 0, 99, $refs, $next_link,
	             $file_name, $file_hash, $ftype);

	git_footer_html();
}
6242
# Action handler for the 'log' view: git_log_generic() with
# git_log_body as the body printer, $hash as the base revision and
# $hash_parent as the optional lower end of the range.
sub git_log {
	return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
6247
# Action handler for the 'commit' view: authorship, commit/tree/parent
# ids with links, the commit message, and the list of changed files.
#
# The commit is $hash, falling back to $hash_base and then to "HEAD";
# an unparsable commit is a 404 error.
sub git_commit {
	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
	    or die_error(404, "Unknown commit object");

	my $parent  = $co{'parent'};
	my $parents = $co{'parents'}; # listref

	# link to a commit, labelled with the first 7 characters of its id
	my $short_commit_link = sub {
		my ($id) = @_;
		return $cgi->a({-href => href(action=>"commit",
		                              hash=>$id)},
		               esc_html(substr($id, 0, 7)));
	};

	# we need to prepare $formats_nav before any parameter munging
	my $formats_nav;
	if (!defined $parent) {
		# --root commitdiff
		$formats_nav = '(initial)';
	} elsif (@$parents == 1) {
		# single parent commit
		$formats_nav = '(parent: ' . $short_commit_link->($parent) . ')';
	} else {
		# merge commit
		$formats_nav =
			'(merge: ' .
			join(' ', map { $short_commit_link->($_) } @$parents) .
			')';
	}
	if (gitweb_check_feature('patches') && @$parents <= 1) {
		$formats_nav .= " | " .
			$cgi->a({-href => href(action=>"patch", -replay=>1)},
			        "patch");
	}

	$parent = "--root" unless defined $parent;

	# raw diff against the single parent (or the root); '-c' for merges
	open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
		@diff_opts,
		(@$parents <= 1 ? $parent : '-c'),
		$hash, "--"
		or die_error(500, "Open git-diff-tree failed");
	my @difftree = <$fd>;
	chomp @difftree;
	close $fd or die_error(404, "Reading git-diff-tree failed");

	# non-textual hash id's can be cached
	my $expires;
	$expires = "+1d"
		if ($hash =~ m/^[0-9a-fA-F]{40}$/);
	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $co{'id'});

	git_header_html(undef, $expires);
	git_print_page_nav('commit', '',
	                   $hash, $co{'tree'}, $hash,
	                   $formats_nav);

	# the title links to the commitdiff, or to the tree for a root commit
	if (defined $co{'parent'}) {
		git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
	} else {
		git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
	}
	print "<div class=\"title_text\">\n" .
	      "<table class=\"object_header\">\n";
	git_print_authorship_rows(\%co);
	print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

	# "tree" row; the cell with links is closed after the snapshot links
	my $tree_href = href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
	print "<tr>" .
	      "<td>tree</td>" .
	      "<td class=\"sha1\">" .
	      $cgi->a({-href => $tree_href, class => "list"}, $co{'tree'}) .
	      "</td>" .
	      "<td class=\"link\">" .
	      $cgi->a({-href => $tree_href}, "tree");
	my $snapshot_links = format_snapshot_links($hash);
	print " | " . $snapshot_links
		if defined $snapshot_links;
	print "</td>" .
	      "</tr>\n";

	# one "parent" row per parent
	foreach my $par (@$parents) {
		my $parent_href = href(action=>"commit", hash=>$par);
		print "<tr>" .
		      "<td>parent</td>" .
		      "<td class=\"sha1\">" .
		      $cgi->a({-href => $parent_href, class => "list"}, $par) .
		      "</td>" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => $parent_href}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff") .
		      "</td>" .
		      "</tr>\n";
	}
	print "</table>".
	      "</div>\n";

	print "<div class=\"page_body\">\n";
	git_print_log($co{'comment'});
	print "</div>\n";

	git_difftree_body(\@difftree, $hash, @$parents);

	git_footer_html();
}
6361
# Action handler for the 'object' view: find out the type of an object
# and redirect (302) to the view named after that type.
#
# The object is defined by:
# - hash or hash_base alone
# - hash_base and file_name
# Anything else is a 400 error; an object that cannot be found is a
# 404 error.
sub git_object {
	my $type;

	# - hash or hash_base alone
	if ($hash || ($hash_base && !defined $file_name)) {
		my $object_id = $hash || $hash_base;

		open my $fd, "-|", quote_command(
			git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
			or die_error(404, "Object does not exist");
		$type = <$fd>;
		close $fd
			or die_error(404, "Object does not exist");
		# Nothing was printed: there is no type to redirect to.  Check
		# this before chomp, which would warn about an undefined value.
		defined $type
			or die_error(404, "Object does not exist");
		chomp $type;

	# - hash_base and file_name
	} elsif ($hash_base && defined $file_name) {
		$file_name =~ s,/+$,,;

		system(git_cmd(), "cat-file", '-e', $hash_base) == 0
			or die_error(404, "Base object does not exist");

		# here errors should not happen
		open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
			or die_error(500, "Open git-ls-tree failed");
		my $line = <$fd>;
		close $fd;

		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
		unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
			die_error(404, "File or directory for given base does not exist");
		}
		$type = $2;
		$hash = $3;
	} else {
		die_error(400, "Not enough information to find object");
	}

	# the object type is used as the name of the action to redirect to
	print $cgi->redirect(-uri => href(action=>$type, -full=>1,
	                                  hash=>$hash, hash_base=>$hash_base,
	                                  file_name=>$file_name),
	                     -status => '302 Found');
}
6408
# Show the difference between two versions of a single file (blob).
#
# Parameters:
#   $format - optional output format: 'html' (default) or 'plain'.
#             Any other value is rejected with a 400 error.
#
# The objects to compare come from the request globals $hash_base,
# $hash_parent_base, $file_name, $file_parent, $hash and $hash_parent.
# Only the "new style" URI (both $hash_base and $hash_parent_base given)
# is handled; every other combination ends in an error.
sub git_blobdiff {
        my $format = shift || 'html';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ m/^[0-9a-fA-F]{40}$/) {
                        # try to find filename from $hash
                        #
                        # $hash is interpolated into the filter pattern below,
                        # so it must be a full object id and nothing else;
                        # hence the anchored check above.

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        # The status is passed as a bare number, like every other
        # die_error() call in this file.
        if (!%diffinfo) {
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # Rewrite object ids that appear as a/<id> or b/<id> in the
                # patch header into file names; stop rewriting once the
                # '+++' line has been printed.
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through untouched
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
6540
# Plain-text variant of the blob diff view: hands over to git_blobdiff()
# asking for the 'plain' output format.
sub git_blobdiff_plain {
        return git_blobdiff('plain');
}
6544
# Show the changes introduced by a commit (or between two commits).
#
# Named parameters:
#   -format => 'html' (default), 'plain' or 'patch'; anything else is
#              rejected with a 400 error.
#   -single => only consulted for the 'patch' format without a parent:
#              when true, output is limited to one patch.
#
# The commit is taken from the request globals $hash (falling back to
# $hash_base, then "HEAD") and, optionally, $hash_parent.  The 'patch'
# format additionally requires the 'patches' feature to be enabled.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        #
        # This default applies to the diff-tree based formats only.  For
        # 'patch' the parent is used to build a "<parent>..<hash>" revision
        # range for git-format-patch, where '--cc' would be meaningless.
        if (! defined $hash_parent && $format ne 'patch' &&
            @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # mention which parent (1-based) this is, if it is one
                        my @parents = @{$co{'parents'}};
                        for my $i (0 .. $#parents) {
                                if ($parents[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$hash_parent)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$co{'parent'})},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$_)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                if ($hash_parent) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # NOTE(review): $refs is never read in this branch; the call
                # is kept in case git_get_references() is wanted for a side
                # effect -- confirm and drop if not.
                my $refs = git_get_references("tags");
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $filename . '"');
                # mail-like header in front of the diff
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $filename . '"');
        }

        # write patch
        if ($format eq 'html') {
                # with no explicit parent (or a combined-diff marker) the
                # diff is shown against all parents of the commit
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # headers are already out, so a failure can only be noted inline
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
6769
# Plain-text variant of the commit diff view: hands over to
# git_commitdiff() with -format set to 'plain'.
sub git_commitdiff_plain {
        return git_commitdiff(
                -format => 'plain',
        );
}
6773
# format-patch-style patches
#
# Single-patch view: asks git_commitdiff() for the 'patch' format and
# sets -single.
sub git_patch {
        return git_commitdiff(
                -format => 'patch',
                -single => 1,
        );
}
6778
# Patch view without the -single flag: asks git_commitdiff() for the
# 'patch' format only.
sub git_patches {
        return git_commitdiff(
                -format => 'patch',
        );
}
6782
# 'history' view: delegates to git_log_generic(), with git_history_body
# as the body callback and the request globals $hash_base,
# $hash_parent_base, $file_name and $hash as arguments.
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
}
6788
# Search the project and print the result page.
#
# Takes no arguments; works on the request globals $searchtext,
# $searchtype, $search_use_regexp, $search_regexp, $hash, $page and
# $project.
#
# Search types handled here:
#   commit, author, committer - matched through parse_commits(), shown
#                               100 results per page
#   pickaxe                   - "git log -S<text>"; needs the 'pickaxe'
#                               feature
#   grep                      - "git grep" on the tree of the selected
#                               commit; needs the 'grep' feature
#
# Errors are reported through die_error(): 403 when a required feature is
# disabled, 400 when no search text was given, 404 for an unknown commit,
# 500 when an external git command cannot be started.
sub git_search {
        gitweb_check_feature('search') or die_error(403, "Search is disabled");
        if (!defined $searchtext) {
                die_error(400, "Text field is empty");
        }
        if (!defined $hash) {
                $hash = git_get_head_hash($project);
        }
        my %co = parse_commit($hash);
        if (!%co) {
                die_error(404, "Unknown commit object");
        }
        if (!defined $page) {
                $page = 0;
        }

        $searchtype ||= 'commit';
        if ($searchtype eq 'pickaxe') {
                # pickaxe may take all resources of your box and run for several minutes
                # with every query - so decide by yourself how public you make this feature
                gitweb_check_feature('pickaxe')
                    or die_error(403, "Pickaxe is disabled");
        }
        if ($searchtype eq 'grep') {
                gitweb_check_feature('grep')
                    or die_error(403, "Grep is disabled");
        }

        # Start the external command before any page output is produced, so
        # that a failure to start it is reported as an error page of its own
        # instead of ending up in the middle of a half-written result page.
        my $fd;
        if ($searchtype eq 'pickaxe') {
                open $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                        '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                        ($search_use_regexp ? '--pickaxe-regex' : ())
                        or die_error(500, "Open git-log failed");
        } elsif ($searchtype eq 'grep') {
                open $fd, "-|", git_cmd(), 'grep', '-n',
                        $search_use_regexp ? ('-E', '-i') : '-F',
                        $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");
        }

        git_header_html();

        if ($searchtype eq 'commit' or $searchtype eq 'author' or $searchtype eq 'committer') {
                my $greptype;
                if ($searchtype eq 'commit') {
                        $greptype = "--grep=";
                } elsif ($searchtype eq 'author') {
                        $greptype = "--author=";
                } elsif ($searchtype eq 'committer') {
                        $greptype = "--committer=";
                }
                $greptype .= $searchtext;
                # ask for one commit more than a page holds, to learn
                # whether a next page exists
                my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                               $greptype, '--regexp-ignore-case',
                                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

                my $paging_nav = '';
                if ($page > 0) {
                        $paging_nav .=
                                $cgi->a({-href => href(action=>"search", hash=>$hash,
                                                       searchtext=>$searchtext,
                                                       searchtype=>$searchtype)},
                                        "first");
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                } else {
                        $paging_nav .= "first";
                        $paging_nav .= " &sdot; prev";
                }
                my $next_link = '';
                if ($#commitlist >= 100) {
                        $next_link =
                                $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                         -accesskey => "n", -title => "Alt-n"}, "next");
                        $paging_nav .= " &sdot; $next_link";
                } else {
                        $paging_nav .= " &sdot; next";
                }

                git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);
                if ($page == 0 && !@commitlist) {
                        print "<p>No match.</p>\n";
                } else {
                        git_search_grep_body(\@commitlist, 0, 99, $next_link);
                }
        }

        if ($searchtype eq 'pickaxe') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"pickaxe search\">\n";
                my $alternate = 1;
                local $/ = "\n";

                # closes the table row of the commit currently held in %co
                my $finish_commit_row = sub {
                        print "</td>\n" .
                              "<td class=\"link\">" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                              " | " .
                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                        print "</td>\n" .
                              "</tr>\n";
                };

                # from here on %co holds the commit whose row is being built
                undef %co;
                while (my $line = <$fd>) {
                        chomp $line;
                        next unless $line;

                        my %set = parse_difftree_raw_line($line);
                        if (defined $set{'commit'}) {
                                # finish previous commit
                                $finish_commit_row->() if %co;

                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                %co = parse_commit($set{'commit'});
                                my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                                      "<td><i>$author</i></td>\n" .
                                      "<td>" .
                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                              -class => "list subject"},
                                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        } elsif (defined $set{'to_id'}) {
                                # an all-zero to_id has no blob to link to
                                next if ($set{'to_id'} =~ m/^0{40}$/);

                                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                              -class => "list"},
                                              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                                      "<br/>\n";
                        }
                }
                close $fd;

                # finish last commit
                $finish_commit_row->() if %co;

                print "</table>\n";
        }

        if ($searchtype eq 'grep') {
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"grep_search\">\n";
                my $alternate = 1;
                my $matches = 0;
                local $/ = "\n";
                my $lastfile = '';
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($file, $lno, $ltext, $binary);
                        last if ($matches++ > 1000);
                        if ($line =~ /^Binary file (.+) matches$/) {
                                $file = $1;
                                $binary = 1;
                        } else {
                                # the first field is discarded
                                # (presumably the tree id passed to git-grep)
                                (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
                        }
                        if ($file ne $lastfile) {
                                print "</td></tr>\n" if $lastfile;
                                # toggle the row class for every new file,
                                # the same way the pickaxe table does
                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                # Link to the file as of the searched commit.
                                # %co is only ever read through keys such as
                                # 'id' and 'tree' in this file section; there
                                # is no visible 'hash' key to link by.
                                print "<td class=\"list\">".
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file"),
                                                -class => "list"}, esc_path($file));
                                print "</td><td>\n";
                                $lastfile = $file;
                        }
                        if ($binary) {
                                print "<div class=\"binary\">Binary file</div>\n";
                        } else {
                                $ltext = untabify($ltext);
                                if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                        # highlight the matching part of the line
                                        $ltext = esc_html($1, -nbsp=>1);
                                        $ltext .= '<span class="match">';
                                        $ltext .= esc_html($2, -nbsp=>1);
                                        $ltext .= '</span>';
                                        $ltext .= esc_html($3, -nbsp=>1);
                                } else {
                                        $ltext = esc_html($ltext, -nbsp=>1);
                                }
                                print "<div class=\"pre\">" .
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file").'#l'.$lno,
                                                -class => "linenr"}, sprintf('%4i', $lno))
                                        . ' ' .  $ltext . "</div>\n";
                        }
                }
                if ($lastfile) {
                        print "</td></tr>\n";
                        if ($matches > 1000) {
                                print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                        }
                } else {
                        print "<div class=\"diff nodifferences\">No matches found</div>\n";
                }
                close $fd;

                print "</table>\n";
        }
        git_footer_html();
}
7005
# Print the help page describing the available search types.
#
# The 'commit', 'author' and 'committer' entries are always printed;
# the 'grep' and 'pickaxe' entries only when gitweb_check_feature()
# reports the corresponding feature as enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # introduction and the 'commit' entry
        print <<"END_OF_INTRO";
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
END_OF_INTRO

        # optional 'grep' entry
        if (gitweb_check_feature('grep')) {
                print <<"END_OF_GREP";
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
END_OF_GREP
        }

        # 'author' and 'committer' entries
        print <<"END_OF_PEOPLE";
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
END_OF_PEOPLE

        # optional 'pickaxe' entry
        if (gitweb_check_feature('pickaxe')) {
                print <<"END_OF_PICKAXE";
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
END_OF_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7049
# Handler for the 'shortlog' action.
#
# Hands over to git_log_generic(), asking it to render entries with
# git_shortlog_body() and passing along the file-level $hash and
# $hash_parent request parameters unchanged.
sub git_shortlog {
        return git_log_generic('shortlog', \&git_shortlog_body, $hash, $hash_parent);
}
7054
7055 ## ......................................................................
7056 ## feeds (RSS, Atom; OPML)
7057
# Print a web feed (HTTP header plus XML body) for the current project.
#
# Parameters:
#   $format - 'atom' or 'rss'; defaults to 'atom' when omitted or false.
#             Any other value is rejected with die_error(400, ...).
#
# What is fed is chosen by the file-level request variables:
#   $hash      - starting revision (falls back to 'HEAD')
#   $file_name - when defined, passed to parse_commits() and to
#                "git diff-tree" as a path limiter (file/directory history)
#
# HTTP behaviour:
#   * Content type is application/<format>+xml, or text/xml when the
#     client's Accept header ranks text/xml higher.
#   * When there is at least one commit, Last-Modified is derived from the
#     newest commit's committer date.  If the request carries
#     If-Modified-Since, one of HTTP::Date / Time::ParseDate can be loaded,
#     and the newest commit is not more recent than that date, only a
#     "304 Not Modified" header is sent.
#   * For HEAD requests only the header is sent.
#
# Returns nothing meaningful; all output goes through print.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
            $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                %latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # Neither date parser is a hard dependency: use whichever
                        # can be loaded, and skip the 304 shortcut if none can.
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                # no commits: nothing to base Last-Modified on
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # The title embeds request-supplied text ($hash, $file_name) and is
        # printed as element content below, so it has to be escaped like
        # every other text node of the feed.
        $title = esc_html($title);

        my $descr = git_get_project_description($project);
        if (!defined $descr) {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        # escape both the real description and the generated fallback
        $descr = esc_html($descr);
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        # header: the HTML page this feed is an alternate representation of
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        foreach my $i (0 .. $#commitlist) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show the first 20, and after that only
                # commits authored within the last 48 hours; stop at the first
                # one that is older
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files; a commit whose diff-tree cannot be
                # started or exits with an error is silently left out of the feed
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }

                # entry body: commit message, then one list item per changed file
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        $line = esc_html($line);
                        print "$line\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        # per-file links: [D]iff, optional [B]lame, optional [H]istory
                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
7313
# Handler for the 'rss' action: emit the feed in RSS format.
sub git_rss {
        return git_feed('rss');
}
7317
# Handler for the 'atom' action: emit the feed in Atom format.
sub git_atom {
        return git_feed('atom');
}
7321
# Print an OPML 1.0 document, HTTP header included, with one <outline>
# per project returned by git_get_projects_list().  Each outline carries
# the project's RSS feed URL and its summary page URL.
#
# Projects for which git_get_head_hash() yields undef, or whose head
# commit parse_commit() cannot parse, are left out of the listing.
sub git_opml {
        my @projects = git_get_projects_list();

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        print <<OPML_HEAD;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$site_name OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
OPML_HEAD

        foreach my $entry (@projects) {
                my $proj_path = $entry->{'path'};

                my $head = git_get_head_hash($proj_path);
                next unless defined $head;

                # NOTE(review): presumably parse_commit() operates on the
                # repository named by the global $git_dir -- confirm.
                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next unless %co;

                # shortened, escaped project path used as the outline label
                my $label    = esc_html(chop_str($proj_path, 25, 5));
                my $feed_url = href('project' => $proj_path, 'action' => 'rss', -full => 1);
                my $html_url = href('project' => $proj_path, 'action' => 'summary', -full => 1);
                print qq{<outline type="rss" text="$label" title="$label" xmlUrl="$feed_url" htmlUrl="$html_url"/>\n};
        }

        # close the elements opened in the document head above
        print "</outline>\n" .
              "</body>\n" .
              "</opml>\n";
}