gitweb: provide a routine to display (sub)sections
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 binmode STDOUT, ':utf8';
21
# Request bookkeeping: $t0 holds the start timestamp (left undefined when
# Time::HiRes cannot be loaded) and $number_of_git_cmds counts how many
# git commands have been run so far.
our $t0 = eval { require Time::HiRes; 1 }
	? [ Time::HiRes::gettimeofday() ]
	: undef;
our $number_of_git_cmds = 0;

# When running under mod_perl, ask CGI to compile its methods up front.
BEGIN {
	if ($ENV{'MOD_PERL'}) {
		CGI->compile();
	}
}

# gitweb version string (the ++GIT_VERSION++ token is presumably replaced
# when gitweb is built -- confirm against the build scripts)
our $version = "++GIT_VERSION++";
33
our ($my_url, $my_uri, $base_url, $path_info, $home_link);

# Compute the URL-related globals for the current request from the CGI
# object ($cgi) and the environment:
#   $my_url    - URL of the script, with PATH_INFO stripped
#   $my_uri    - absolute path part of that URL, with PATH_INFO stripped
#   $base_url  - base URL for relative URLs in gitweb ($logo, $favicon, ...),
#                needed and used only for URLs with nonempty PATH_INFO
#   $path_info - raw PATH_INFO; global because it is also used later on
#   $home_link - target of the home link on top of all pages
sub evaluate_uri {
	our $cgi;

	our $my_url = $cgi->url();
	our $my_uri = $cgi->url(-absolute => 1);
	our $base_url = $my_url;

	# When the script is used as DirectoryIndex, the URL does not contain
	# the name of the script file itself, and $cgi->url() fails to strip
	# PATH_INFO, so it is stripped here by hand.
	#
	# In that setup $my_url is also not the full script URL.  That is
	# intended (generated links keep implying the script name when the
	# request did not spell it out), but it means $my_url cannot serve as
	# the base URL.  So whenever PATH_INFO had to be stripped from both
	# $my_url and $my_uri, the base URL is rebuilt from SCRIPT_NAME.
	our $path_info = $ENV{"PATH_INFO"};
	if ($path_info && $my_url =~ s,\Q$path_info\E$,,) {
		if ($my_uri =~ s,\Q$path_info\E$,, and defined $ENV{'SCRIPT_NAME'}) {
			$base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
		}
	}

	our $home_link = $my_uri || "/";
}
69
70 # core git executable to use
71 # this can just be "git" if your webserver has a sensible PATH
72 our $GIT = "++GIT_BINDIR++/git";
73
74 # absolute fs-path which will be prepended to the project path
75 #our $projectroot = "/pub/scm";
76 our $projectroot = "++GITWEB_PROJECTROOT++";
77
78 # fs traversing limit for getting project list
79 # the number is relative to the projectroot
80 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
81
82 # string of the home link on top of all pages
83 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
84
85 # name of your site or organization to appear in page titles
86 # replace this with something more descriptive for clearer bookmarks
87 our $site_name = "++GITWEB_SITENAME++"
88                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
89
90 # filename of html text to include at top of each page
91 our $site_header = "++GITWEB_SITE_HEADER++";
92 # html text to include at home page
93 our $home_text = "++GITWEB_HOMETEXT++";
94 # filename of html text to include at bottom of each page
95 our $site_footer = "++GITWEB_SITE_FOOTER++";
96
97 # URI of stylesheets
98 our @stylesheets = ("++GITWEB_CSS++");
99 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
100 our $stylesheet = undef;
101 # URI of GIT logo (72x27 size)
102 our $logo = "++GITWEB_LOGO++";
103 # URI of GIT favicon, assumed to be image/png type
104 our $favicon = "++GITWEB_FAVICON++";
105 # URI of gitweb.js (JavaScript code for gitweb)
106 our $javascript = "++GITWEB_JS++";
107
108 # URI and label (title) of GIT logo link
109 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
110 #our $logo_label = "git documentation";
111 our $logo_url = "http://git-scm.com/";
112 our $logo_label = "git homepage";
113
114 # source of projects list
115 our $projects_list = "++GITWEB_LIST++";
116
117 # the width (in characters) of the projects list "Description" column
118 our $projects_list_description_width = 25;
119
120 # default order of projects list
121 # valid values are none, project, descr, owner, and age
122 our $default_projects_order = "project";
123
124 # show repository only if this file exists
125 # (only effective if this variable evaluates to true)
126 our $export_ok = "++GITWEB_EXPORT_OK++";
127
128 # show repository only if this subroutine returns true
129 # when given the path to the project, for example:
130 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
131 our $export_auth_hook = undef;
132
133 # only allow viewing of repositories also shown on the overview page
134 our $strict_export = "++GITWEB_STRICT_EXPORT++";
135
136 # list of git base URLs used for URL to where fetch project from,
137 # i.e. full URL is "$git_base_url/$project"
138 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
139
140 # default blob_plain mimetype and default charset for text/plain blob
141 our $default_blob_plain_mimetype = 'text/plain';
142 our $default_text_plain_charset  = undef;
143
144 # file to use for guessing MIME types before trying /etc/mime.types
145 # (relative to the current git repository)
146 our $mimetypes_file = undef;
147
148 # assume this charset if a line contains non-UTF-8 characters;
149 # it should be a valid encoding (see Encode::Supported(3pm) for the list)
150 # in which every byte sequence is valid, for example
151 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
152 # could even be 'utf-8' for the old behavior)
153 our $fallback_encoding = 'latin1';
154
155 # rename detection options for git-diff and git-diff-tree
156 # - default is '-M', with the cost proportional to
157 #   (number of removed files) * (number of new files).
158 # - more costly is '-C' (which implies '-M'), with the cost proportional to
159 #   (number of changed files + number of removed files) * (number of new files)
160 # - even more costly is '-C', '--find-copies-harder' with cost
161 #   (number of files in the original tree) * (number of new files)
162 # - one might want to include '-B' option, e.g. '-B', '-M'
163 our @diff_opts = ('-M'); # taken from git_commit
164
165 # Disables features that would allow repository owners to inject script into
166 # the gitweb domain.
167 our $prevent_xss = 0;
168
169 # Path to the highlight executable to use (must be the one from
170 # http://www.andre-simon.de due to assumptions about parameters and output).
171 # Useful if highlight is not installed on your webserver's PATH.
172 # [Default: highlight]
173 our $highlight_bin = "++HIGHLIGHT_BIN++";
174
175 # information about snapshot formats that gitweb is capable of serving
176 our %known_snapshot_formats = (
177         # name => {
178         #       'display' => display name,
179         #       'type' => mime type,
180         #       'suffix' => filename suffix,
181         #       'format' => --format for git-archive,
182         #       'compressor' => [compressor command and arguments]
183         #                       (array reference, optional)
184         #       'disabled' => boolean (optional)}
185         #
186         'tgz' => {
187                 'display' => 'tar.gz',
188                 'type' => 'application/x-gzip',
189                 'suffix' => '.tar.gz',
190                 'format' => 'tar',
191                 'compressor' => ['gzip']},
192
193         'tbz2' => {
194                 'display' => 'tar.bz2',
195                 'type' => 'application/x-bzip2',
196                 'suffix' => '.tar.bz2',
197                 'format' => 'tar',
198                 'compressor' => ['bzip2']},
199
200         'txz' => {
201                 'display' => 'tar.xz',
202                 'type' => 'application/x-xz',
203                 'suffix' => '.tar.xz',
204                 'format' => 'tar',
205                 'compressor' => ['xz'],
206                 'disabled' => 1},
207
208         'zip' => {
209                 'display' => 'zip',
210                 'type' => 'application/x-zip',
211                 'suffix' => '.zip',
212                 'format' => 'zip'},
213 );
214
215 # Aliases so we understand old gitweb.snapshot values in repository
216 # configuration.
217 our %known_snapshot_format_aliases = (
218         'gzip'  => 'tgz',
219         'bzip2' => 'tbz2',
220         'xz'    => 'txz',
221
222         # backward compatibility: legacy gitweb config support
223         'x-gzip' => undef, 'gz' => undef,
224         'x-bzip2' => undef, 'bz2' => undef,
225         'x-zip' => undef, '' => undef,
226 );
227
228 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
229 # are changed, it may be appropriate to change these values too via
230 # $GITWEB_CONFIG.
231 our %avatar_size = (
232         'default' => 16,
233         'double'  => 32
234 );
235
236 # Maximum server load at which we will still respond to gitweb queries.
237 # If the server load exceeds this value, a "503 server busy" error is returned.
238 # If gitweb cannot determine the server load, it is taken to be 0.
239 # Leave it undefined (or set to 'undef') to turn off load checking.
240 our $maxload = 300;
241
242 # configuration for 'highlight' (http://www.andre-simon.de/)
243 # match by basename
244 our %highlight_basename = (
245         #'Program' => 'py',
246         #'Library' => 'py',
247         'SConstruct' => 'py', # SCons equivalent of Makefile
248         'Makefile' => 'make',
249 );
250 # match by extension
251 our %highlight_ext = (
252         # main extensions, defining name of syntax;
253         # see files in /usr/share/highlight/langDefs/ directory
254         map { $_ => $_ }
255                 qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl),
256         # alternate extensions, see /etc/highlight/filetypes.conf
257         'h' => 'c',
258         map { $_ => 'cpp' } qw(cxx c++ cc),
259         map { $_ => 'php' } qw(php3 php4),
260         map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
261         'mak' => 'make',
262         map { $_ => 'xml' } qw(xhtml html htm),
263 );
264
265 # You define site-wide feature defaults here; override them with
266 # $GITWEB_CONFIG as necessary.
267 our %feature = (
268         # feature => {
269         #       'sub' => feature-sub (subroutine),
270         #       'override' => allow-override (boolean),
271         #       'default' => [ default options...] (array reference)}
272         #
273         # if feature is overridable (it means that allow-override has true value),
274         # then feature-sub will be called with default options as parameters;
275         # return value of feature-sub indicates if to enable specified feature
276         #
277         # if there is no 'sub' key (no feature-sub), then feature cannot be
278         # overridden
279         #
280         # use gitweb_get_feature(<feature>) to retrieve the <feature> value
281         # (an array) or gitweb_check_feature(<feature>) to check if <feature>
282         # is enabled
283
284         # Enable the 'blame' blob view, showing the last commit that modified
285         # each line in the file. This can be very CPU-intensive.
286
287         # To enable system wide have in $GITWEB_CONFIG
288         # $feature{'blame'}{'default'} = [1];
289         # To have project specific config enable override in $GITWEB_CONFIG
290         # $feature{'blame'}{'override'} = 1;
291         # and in project config gitweb.blame = 0|1;
292         'blame' => {
293                 'sub' => sub { feature_bool('blame', @_) },
294                 'override' => 0,
295                 'default' => [0]},
296
297         # Enable the 'snapshot' link, providing a compressed archive of any
298         # tree. This can potentially generate high traffic if you have a
299         # large project.
300
301         # Value is a list of formats defined in %known_snapshot_formats that
302         # you wish to offer.
303         # To disable system wide have in $GITWEB_CONFIG
304         # $feature{'snapshot'}{'default'} = [];
305         # To have project specific config enable override in $GITWEB_CONFIG
306         # $feature{'snapshot'}{'override'} = 1;
307         # and in project config, a comma-separated list of formats or "none"
308         # to disable.  Example: gitweb.snapshot = tbz2,zip;
309         'snapshot' => {
310                 'sub' => \&feature_snapshot,
311                 'override' => 0,
312                 'default' => ['tgz']},
313
314         # Enable text search, which will list the commits which match author,
315         # committer or commit text to a given string.  Enabled by default.
316         # Project specific override is not supported.
317         'search' => {
318                 'override' => 0,
319                 'default' => [1]},
320
321         # Enable grep search, which will list the files in currently selected
322         # tree containing the given string. Enabled by default. This can be
323         # potentially CPU-intensive, of course.
324
325         # To enable system wide have in $GITWEB_CONFIG
326         # $feature{'grep'}{'default'} = [1];
327         # To have project specific config enable override in $GITWEB_CONFIG
328         # $feature{'grep'}{'override'} = 1;
329         # and in project config gitweb.grep = 0|1;
330         'grep' => {
331                 'sub' => sub { feature_bool('grep', @_) },
332                 'override' => 0,
333                 'default' => [1]},
334
335         # Enable the pickaxe search, which will list the commits that modified
336         # a given string in a file. This can be a practical and much faster
337         # alternative to 'blame', but it is still potentially CPU-intensive.
338
339         # To enable system wide have in $GITWEB_CONFIG
340         # $feature{'pickaxe'}{'default'} = [1];
341         # To have project specific config enable override in $GITWEB_CONFIG
342         # $feature{'pickaxe'}{'override'} = 1;
343         # and in project config gitweb.pickaxe = 0|1;
344         'pickaxe' => {
345                 'sub' => sub { feature_bool('pickaxe', @_) },
346                 'override' => 0,
347                 'default' => [1]},
348
349         # Enable showing size of blobs in a 'tree' view, in a separate
350         # column, similar to what 'ls -l' does.  This costs a bit of I/O.
351
352         # To disable system wide have in $GITWEB_CONFIG
353         # $feature{'show-sizes'}{'default'} = [0];
354         # To have project specific config enable override in $GITWEB_CONFIG
355         # $feature{'show-sizes'}{'override'} = 1;
356         # and in project config gitweb.showsizes = 0|1;
357         'show-sizes' => {
358                 'sub' => sub { feature_bool('showsizes', @_) },
359                 'override' => 0,
360                 'default' => [1]},
361
362         # Make gitweb use an alternative format of the URLs which can be
363         # more readable and natural-looking: project name is embedded
364         # directly in the path and the query string contains other
365         # auxiliary information. All gitweb installations recognize
366         # URL in either format; this configures in which formats gitweb
367         # generates links.
368
369         # To enable system wide have in $GITWEB_CONFIG
370         # $feature{'pathinfo'}{'default'} = [1];
371         # Project specific override is not supported.
372
373         # Note that you will need to change the default location of CSS,
374         # favicon, logo and possibly other files to an absolute URL. Also,
375         # if gitweb.cgi serves as your indexfile, you will need to force
376         # $my_uri to contain the script name in your $GITWEB_CONFIG.
377         'pathinfo' => {
378                 'override' => 0,
379                 'default' => [0]},
380
381         # Make gitweb consider projects in project root subdirectories
382         # to be forks of existing projects. Given project $projname.git,
383         # projects matching $projname/*.git will not be shown in the main
384         # projects list, instead a '+' mark will be added to $projname
385         # there and a 'forks' view will be enabled for the project, listing
386         # all the forks. If project list is taken from a file, forks have
387         # to be listed after the main project.
388
389         # To enable system wide have in $GITWEB_CONFIG
390         # $feature{'forks'}{'default'} = [1];
391         # Project specific override is not supported.
392         'forks' => {
393                 'override' => 0,
394                 'default' => [0]},
395
396         # Insert custom links to the action bar of all project pages.
397         # This enables you mainly to link to third-party scripts integrating
398         # into gitweb; e.g. git-browser for graphical history representation
399         # or custom web-based repository administration interface.
400
401         # The 'default' value consists of a list of triplets in the form
402         # (label, link, position) where position is the label after which
403         # to insert the link and link is a format string where %n expands
404         # to the project name, %f to the project path within the filesystem,
405         # %h to the current hash (h gitweb parameter) and %b to the current
406         # hash base (hb gitweb parameter); %% expands to %.
407
408         # To enable system wide have in $GITWEB_CONFIG e.g.
409         # $feature{'actions'}{'default'} = [('graphiclog',
410         #       '/git-browser/by-commit.html?r=%n', 'summary')];
411         # Project specific override is not supported.
412         'actions' => {
413                 'override' => 0,
414                 'default' => []},
415
416         # Allow gitweb to scan project content tags described in the ctags/
417         # directory of the project repository, and display the popular
418         # Web 2.0-ish "tag cloud" near the project list. Note that this is
419         # something COMPLETELY different from the normal Git tags.
420
421         # gitweb by itself can show existing tags, but it does not handle
422         # tagging itself; you need an external application for that.
423         # For an example script, check Girocco's cgi/tagproj.cgi.
424         # You may want to install the HTML::TagCloud Perl module to get
425         # a pretty tag cloud instead of just a list of tags.
426
427         # To enable system wide have in $GITWEB_CONFIG
428         # $feature{'ctags'}{'default'} = ['path_to_tag_script'];
429         # Project specific override is not supported.
430         'ctags' => {
431                 'override' => 0,
432                 'default' => [0]},
433
434         # The maximum number of patches in a patchset generated in patch
435         # view. Set this to 0 or undef to disable patch view, or to a
436         # negative number to remove any limit.
437
438         # To disable system wide have in $GITWEB_CONFIG
439         # $feature{'patches'}{'default'} = [0];
440         # To have project specific config enable override in $GITWEB_CONFIG
441         # $feature{'patches'}{'override'} = 1;
442         # and in project config gitweb.patches = 0|n;
443         # where n is the maximum number of patches allowed in a patchset.
444         'patches' => {
445                 'sub' => \&feature_patches,
446                 'override' => 0,
447                 'default' => [16]},
448
449         # Avatar support. When this feature is enabled, views such as
450         # shortlog or commit will display an avatar associated with
451         # the email of the committer(s) and/or author(s).
452
453         # Currently available providers are gravatar and picon.
454         # If an unknown provider is specified, the feature is disabled.
455
456         # Gravatar depends on Digest::MD5.
457         # Picon currently relies on the indiana.edu database.
458
459         # To enable system wide have in $GITWEB_CONFIG
460         # $feature{'avatar'}{'default'} = ['<provider>'];
461         # where <provider> is either gravatar or picon.
462         # To have project specific config enable override in $GITWEB_CONFIG
463         # $feature{'avatar'}{'override'} = 1;
464         # and in project config gitweb.avatar = <provider>;
465         'avatar' => {
466                 'sub' => \&feature_avatar,
467                 'override' => 0,
468                 'default' => ['']},
469
470         # Enable displaying how much time and how many git commands
471         # it took to generate and display page.  Disabled by default.
472         # Project specific override is not supported.
473         'timed' => {
474                 'override' => 0,
475                 'default' => [0]},
476
477         # Enable turning some links into links to actions which require
478         # JavaScript to run (like 'blame_incremental').  Not enabled by
479         # default.  Project specific override is currently not supported.
480         'javascript-actions' => {
481                 'override' => 0,
482                 'default' => [0]},
483
484         # Syntax highlighting support. This is based on Daniel Svensson's
485         # and Sham Chukoury's work in gitweb-xmms2.git.
486         # It requires the 'highlight' program present in $PATH,
487         # and therefore is disabled by default.
488
489         # To enable system wide have in $GITWEB_CONFIG
490         # $feature{'highlight'}{'default'} = [1];
491
492         'highlight' => {
493                 'sub' => sub { feature_bool('highlight', @_) },
494                 'override' => 0,
495                 'default' => [0]},
496
497         # Enable displaying of remote heads in the heads list
498
499         # To enable system wide have in $GITWEB_CONFIG
500         # $feature{'remote_heads'}{'default'} = [1];
501         # To have project specific config enable override in $GITWEB_CONFIG
502         # $feature{'remote_heads'}{'override'} = 1;
503         # and in project config gitweb.remote_heads = 0|1;
504         'remote_heads' => {
505                 'sub' => sub { feature_bool('remote_heads', @_) },
506                 'override' => 0,
507                 'default' => [0]},
508 );
509
# Return the list of values in effect for feature $name.
#
# - unknown feature: returns nothing
# - override disabled for the feature, or no project selected
#   ($git_dir undefined): returns the site-wide defaults
# - override enabled but the feature has no 'sub': warns and returns
#   the site-wide defaults
# - otherwise: returns whatever the feature's 'sub' yields when called
#   with the defaults
sub gitweb_get_feature {
	my ($name) = @_;
	return unless exists $feature{$name};

	my $spec     = $feature{$name};
	my $handler  = $spec->{'sub'};
	my @defaults = @{ $spec->{'default'} };

	# project specific override is possible only if we have project
	our $git_dir; # global variable, declared later
	return @defaults
		unless $spec->{'override'} && defined $git_dir;

	unless (defined $handler) {
		warn "feature $name is not overridable";
		return @defaults;
	}
	return $handler->(@defaults);
}
528
# Convenience wrapper returning only the first value of a feature, which
# is handy for features that are a single on/off flag.  It lets you write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# rather than
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
	my @values = gitweb_get_feature(@_);
	# a list slice (not $values[0]) so that an empty feature list still
	# yields an empty list in list context
	return (@values)[0];
}
543
544
# Project-level override for an on/off feature.
#
# Parameters:
#   $key - name of the project configuration variable, passed to
#          git_get_project_config() together with '--bool'
#   @_   - after $key, the site-wide default values; only the first
#          one is used
# Returns a one-element list:
#   ($default) if the project does not set the variable,
#   (1)        if it is 'true',
#   (0)        if it is 'false' or any other value.
sub feature_bool {
	my $key = shift;
	my ($val) = git_get_project_config($key, '--bool');

	# no project-level setting: keep the site-wide default
	return ($_[0]) if !defined $val;

	return (1) if $val eq 'true';

	# 'false' disables the feature.  Any unexpected value is treated the
	# same way, explicitly, instead of falling off the end of the sub and
	# returning whatever the last comparison happened to evaluate to.
	return (0);
}
557
# Project-level override for the list of offered snapshot formats.
# Takes the site-wide default formats; if the project sets 'snapshot',
# returns the formats listed there (separated by commas and/or
# whitespace), or no formats at all when the value is "none".
sub feature_snapshot {
	my @defaults = @_;

	my ($configured) = git_get_project_config('snapshot');

	# unset (or otherwise false) value: keep the defaults
	return @defaults unless $configured;

	my @chosen = $configured eq 'none'
		? ()
		: split /\s*[,\s]\s*/, $configured;
	return @chosen;
}
569
# Project-level override for the 'patches' limit: returns what
# git_get_project_config('patches', '--int') yields if that is a
# non-empty list, otherwise the first site-wide default.
sub feature_patches {
	my @configured = (git_get_project_config('patches', '--int'));

	return @configured ? @configured : ($_[0]);
}
579
# Project-level override for the avatar provider: returns what
# git_get_project_config('avatar') yields if that is a non-empty list,
# otherwise the site-wide defaults passed in.
sub feature_avatar {
	my @provider = (git_get_project_config('avatar'));

	return @provider if @provider;
	return @_;
}
585
# Does $dir look like a git repository, judging by its HEAD?
#
# A plain -e test on HEAD is not enough: in a repository initialized long
# ago HEAD may be a symlink, and after pack-refs and pruning its target
# file may no longer exist.  Such a dangling symlink is still accepted as
# long as it points below refs/heads/.
sub check_head_link {
	my ($dir) = @_;
	my $headfile = "$dir/HEAD";

	return 1 if -e $headfile;
	return (-l $headfile && readlink($headfile) =~ /^refs\/heads\//);
}
595
# May the repository in $dir be shown?  All of the following must hold:
#   - it has a usable HEAD (check_head_link),
#   - if $export_ok is set, the file of that name exists in $dir,
#   - if $export_auth_hook is set, the hook returns true for $dir.
sub check_export_ok {
	my ($dir) = @_;

	my $has_head = check_head_link($dir);
	return $has_head unless $has_head;

	my $marker_ok = !$export_ok || -e "$dir/$export_ok";
	return $marker_ok unless $marker_ok;

	return (!$export_auth_hook || $export_auth_hook->($dir));
}
602
# Normalize a list of snapshot format names.
#
# - alternate names kept for backward compatibility are translated through
#   %known_snapshot_format_aliases;
# - names that are not in %known_snapshot_formats, or whose entry there is
#   marked 'disabled', are dropped.
#
# Returns the remaining format names in their original order.
sub filter_snapshot_fmts {
	my @fmts = @_;

	@fmts = map {
		(defined $_ && exists $known_snapshot_format_aliases{$_}) ?
		       $known_snapshot_format_aliases{$_} : $_} @fmts;

	# Some legacy aliases map to undef (no current equivalent).  Test for
	# definedness first so that undef is never used as a hash key, which
	# would raise "uninitialized value" warnings.
	@fmts = grep {
		defined $_ &&
		exists $known_snapshot_formats{$_} &&
		!$known_snapshot_formats{$_}{'disabled'}} @fmts;

	return @fmts;
}
615
our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);

# Locate and run the gitweb configuration file.
#
# The candidate paths come from the GITWEB_CONFIG and GITWEB_CONFIG_SYSTEM
# environment variables, falling back to the built-in placeholders.  The
# first candidate that exists is executed with do(); the system-wide file
# is consulted only when the per-instance file does not exist.
# Dies if the chosen file fails to compile or run.
sub evaluate_gitweb_config {
	our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
	our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";

	my $config_file =
		(-e $GITWEB_CONFIG)        ? $GITWEB_CONFIG :
		(-e $GITWEB_CONFIG_SYSTEM) ? $GITWEB_CONFIG_SYSTEM :
		                             undef;
	return unless defined $config_file;

	# die if there are errors parsing config file
	do $config_file;
	die $@ if $@;
}
629
# Return the system load average, to be compared against $maxload.
# The only source currently supported is '/proc/loadavg'; when that file
# is missing or cannot be opened, 0 is returned, which means no load
# checking.
sub get_loadavg {
	my $loadavg_file = '/proc/loadavg';

	# checks for platforms that do not export /proc/loadavg would go here
	return 0 unless -e $loadavg_file;

	open my $fd, '<', $loadavg_file
		or return 0;
	my $line = <$fd>;
	close $fd;

	# The first three fields are the load over the last one, five and ten
	# minutes; the fourth is running/total processes in m/n form; the
	# last is the most recently used process ID.  Only the one-minute
	# figure is of interest here.
	my ($one_minute) = split(/\s+/, $line);
	return $one_minute || 0;
}
651
# version of the core git binary
our $git_version;

# Run "$GIT --version" and store the reported version in $git_version,
# or "unknown" when the output does not have the expected form.
# The invocation is counted in $number_of_git_cmds.
sub evaluate_git_version {
	my $output = qx("$GIT" --version);

	our $git_version = "unknown";
	if ($output =~ m/git version (.*)$/) {
		$git_version = $1;
	}
	$number_of_git_cmds++;
}
658
# Refuse the request with a 503 error when load checking is enabled
# ($maxload defined) and the current load average is above $maxload.
sub check_loadavg {
	return unless defined $maxload;
	return unless get_loadavg() > $maxload;

	die_error(503, "The load average on the server is too high");
}
664
665 # ======================================================================
666 # input validation and dispatch
667
668 # input parameters can be collected from a variety of sources (presently, CGI
669 # and PATH_INFO), so we define an %input_params hash that collects them all
670 # together during validation: this allows subsequent uses (e.g. href()) to be
671 # agnostic of the parameter origin
672
673 our %input_params = ();
674
675 # input parameters are stored with the long parameter name as key. This will
676 # also be used in the href subroutine to convert parameters to their CGI
677 # equivalent, and since the href() usage is the most frequent one, we store
678 # the name -> CGI key mapping here, instead of the reverse.
679 #
680 # XXX: Warning: If you touch this, check the search form for updating,
681 # too.
682
683 our @cgi_param_mapping = (
684         project => "p",
685         action => "a",
686         file_name => "f",
687         file_parent => "fp",
688         hash => "h",
689         hash_parent => "hp",
690         hash_base => "hb",
691         hash_parent_base => "hpb",
692         page => "pg",
693         order => "o",
694         searchtext => "s",
695         searchtype => "st",
696         snapshot_format => "sf",
697         extra_options => "opt",
698         search_use_regexp => "sr",
699         # this must be last entry (for manipulation from JavaScript)
700         javascript => "js"
701 );
702 our %cgi_param_mapping = @cgi_param_mapping;
703
704 # we will also need to know the possible actions, for validation
705 our %actions = (
706         "blame" => \&git_blame,
707         "blame_incremental" => \&git_blame_incremental,
708         "blame_data" => \&git_blame_data,
709         "blobdiff" => \&git_blobdiff,
710         "blobdiff_plain" => \&git_blobdiff_plain,
711         "blob" => \&git_blob,
712         "blob_plain" => \&git_blob_plain,
713         "commitdiff" => \&git_commitdiff,
714         "commitdiff_plain" => \&git_commitdiff_plain,
715         "commit" => \&git_commit,
716         "forks" => \&git_forks,
717         "heads" => \&git_heads,
718         "history" => \&git_history,
719         "log" => \&git_log,
720         "patch" => \&git_patch,
721         "patches" => \&git_patches,
722         "remotes" => \&git_remotes,
723         "rss" => \&git_rss,
724         "atom" => \&git_atom,
725         "search" => \&git_search,
726         "search_help" => \&git_search_help,
727         "shortlog" => \&git_shortlog,
728         "summary" => \&git_summary,
729         "tag" => \&git_tag,
730         "tags" => \&git_tags,
731         "tree" => \&git_tree,
732         "snapshot" => \&git_snapshot,
733         "object" => \&git_object,
734         # those below don't need $project
735         "opml" => \&git_opml,
736         "project_list" => \&git_project_list,
737         "project_index" => \&git_project_index,
738 );
739
740 # finally, we have the hash of allowed extra_options for the commands that
741 # allow them
742 our %allowed_options = (
743         "--no-merges" => [ qw(rss atom log shortlog history) ],
744 );
745
# Copy the CGI query parameters into %input_params, keyed by their long
# names from %cgi_param_mapping.  Every parameter is stored as a single
# value except 'opt', which may occur several times and is stored as an
# array reference.  (A list of multi-valued parameters would be the more
# general solution, but 'opt' is the only one for the time being.)
sub evaluate_query_params {
	our $cgi;

	for my $name (keys %cgi_param_mapping) {
		my $symbol = $cgi_param_mapping{$name};
		$input_params{$name} = $symbol eq 'opt'
			? [ $cgi->param($symbol) ]
			: scalar $cgi->param($symbol);
	}
}
761
# Read PATH_INFO and fill in the entries of %input_params that were not
# already provided through the query string.
#
# The layout being parsed is
#   $project[/$action][/[$parent_ref[:$parent_path]..]$ref[:$path]]
# Nothing is done when 'project' is already set; when an 'action' was given
# in the query string only 'project' is taken from PATH_INFO.
# All other values are stored with ||=, so query-string values win.
sub evaluate_path_info {
	return if defined $input_params{'project'};
	return if !$path_info;
	$path_info =~ s,^/+,,;
	return if !$path_info;

	# find which part of PATH_INFO is project: strip trailing path
	# components until check_head_link() accepts the directory
	my $project = $path_info;
	$project =~ s,/+$,,;
	while ($project && !check_head_link("$projectroot/$project")) {
		$project =~ s,/*[^/]*$,,;
	}
	return unless $project;
	$input_params{'project'} = $project;

	# do not change any parameters if an action is given using the query string
	return if $input_params{'action'};
	$path_info =~ s,^\Q$project\E/*,,;

	# next, check if we have an action
	my $action = $path_info;
	$action =~ s,/.*$,,;
	if (exists $actions{$action}) {
		# quote the action name so it is always matched literally
		$path_info =~ s,^\Q$action\E/*,,;
		$input_params{'action'} = $action;
	}

	# list of actions that want hash_base instead of hash, but can have no
	# pathname (f) parameter
	my @wants_base = (
		'tree',
		'history',
	);

	# we want to catch, among others
	# [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
	my ($parentrefname, $parentpathname, $refname, $pathname) =
		($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

	# first, analyze the 'current' part
	if (defined $pathname) {
		# we got "branch:filename" or "branch:dir/"
		# we could use git_get_type(branch:pathname), but:
		# - it needs $git_dir
		# - it does a git() call
		# - the convention of terminating directories with a slash
		#   makes it superfluous
		# - embedding the action in the PATH_INFO would make it even
		#   more superfluous
		$pathname =~ s,^/+,,;
		if (!$pathname || substr($pathname, -1) eq "/") {
			$input_params{'action'} ||= "tree";
			$pathname =~ s,/$,,;
		} else {
			# the default action depends on whether we had parent info
			# or not
			if ($parentrefname) {
				$input_params{'action'} ||= "blobdiff_plain";
			} else {
				$input_params{'action'} ||= "blob_plain";
			}
		}
		$input_params{'hash_base'} ||= $refname;
		$input_params{'file_name'} ||= $pathname;
	} elsif (defined $refname) {
		# we got "branch". In this case we have to choose if we have to
		# set hash or hash_base.
		#
		# Most of the actions without a pathname only want hash to be
		# set, except for the ones specified in @wants_base that want
		# hash_base instead. It should also be noted that hand-crafted
		# links having 'history' as an action and no pathname or hash
		# set will fail, but that happens regardless of PATH_INFO.
		if (defined $parentrefname) {
			# if there is parent let the default be 'shortlog' action
			# (for http://git.example.com/repo.git/A..B links); if there
			# is no parent, dispatch will detect type of object and set
			# action appropriately if required (if action is not set)
			$input_params{'action'} ||= "shortlog";
		}
		if ($input_params{'action'} &&
		    grep { $_ eq $input_params{'action'} } @wants_base) {
			$input_params{'hash_base'} ||= $refname;
		} else {
			$input_params{'hash'} ||= $refname;
		}
	}

	# next, handle the 'parent' part, if present
	if (defined $parentrefname) {
		# a missing pathspec defaults to the 'current' filename, allowing e.g.
		# someproject/blobdiff/oldrev..newrev:/filename
		if ($parentpathname) {
			$parentpathname =~ s,^/+,,;
			$parentpathname =~ s,/$,,;
			$input_params{'file_parent'} ||= $parentpathname;
		} else {
			$input_params{'file_parent'} ||= $input_params{'file_name'};
		}
		# we assume that hash_parent_base is wanted if a path was specified,
		# or if the action wants hash_base instead of hash.
		# The action can still be undefined here (PATH_INFO of the form
		# "project/A.." has a parent but neither ref nor path), so check it
		# before comparing to avoid an "uninitialized value" warning.
		if (defined $input_params{'file_parent'} ||
			(defined $input_params{'action'} &&
			 grep { $_ eq $input_params{'action'} } @wants_base)) {
			$input_params{'hash_parent_base'} ||= $parentrefname;
		} else {
			$input_params{'hash_parent'} ||= $parentrefname;
		}
	}

	# for the snapshot action, we allow URLs in the form
	# $project/snapshot/$hash.ext
	# where .ext determines the snapshot and gets removed from the
	# passed $refname to provide the $hash.
	#
	# To be able to tell that $refname includes the format extension, we
	# require the following two conditions to be satisfied:
	# - the hash input parameter MUST have been set from the $refname part
	#   of the URL (i.e. they must be equal)
	# - the snapshot format MUST NOT have been defined already (e.g. from
	#   CGI parameter sf)
	# It's also useless to try any matching unless $refname has a dot,
	# so we check for that too
	if (defined $input_params{'action'} &&
		$input_params{'action'} eq 'snapshot' &&
		defined $refname && index($refname, '.') != -1 &&
		$refname eq $input_params{'hash'} &&
		!defined $input_params{'snapshot_format'}) {
		# We loop over the known snapshot formats, checking for
		# extensions. Allowed extensions are both the defined suffix
		# (which includes the initial dot already) and the snapshot
		# format key itself, with a prepended dot.
		#
		# The loop uses keys() rather than each(): it is left early with
		# 'last', and that does not reset a hash's each() iterator, so in
		# a persistent interpreter a later request would resume in the
		# middle of the hash and could miss the matching format.
		foreach my $fmt (keys %known_snapshot_formats) {
			my $opt = $known_snapshot_formats{$fmt};
			my $hash = $refname;
			unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
				next;
			}
			my $sfx = $1;
			# a valid suffix was found, so set the snapshot format
			# and reset the hash parameter
			$input_params{'snapshot_format'} = $fmt;
			$input_params{'hash'} = $hash;
			# we also set the format suffix to the one requested
			# in the URL: this way a request for e.g. .tgz returns
			# a .tgz instead of a .tar.gz
			$known_snapshot_formats{$fmt}{'suffix'} = $sfx;
			last;
		}
	}
}
912
913 our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
914      $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
915      $searchtext, $search_regexp);
# Copy the request parameters from %input_params into the corresponding
# package globals, calling die_error() as soon as one of them fails its
# check.  Also derives $search_regexp from $searchtext.
sub evaluate_and_validate_params {
	our $action = $input_params{'action'};
	if (defined $action) {
		if (!validate_action($action)) {
			die_error(400, "Invalid action parameter");
		}
	}

	# parameters which are pathnames
	our $project = $input_params{'project'};
	if (defined $project) {
		if (!validate_project($project)) {
			# clear it before reporting the error
			undef $project;
			die_error(404, "No such project");
		}
	}

	our $file_name = $input_params{'file_name'};
	if (defined $file_name) {
		if (!validate_pathname($file_name)) {
			die_error(400, "Invalid file parameter");
		}
	}

	our $file_parent = $input_params{'file_parent'};
	if (defined $file_parent) {
		if (!validate_pathname($file_parent)) {
			die_error(400, "Invalid file parent parameter");
		}
	}

	# parameters which are refnames
	our $hash = $input_params{'hash'};
	if (defined $hash) {
		if (!validate_refname($hash)) {
			die_error(400, "Invalid hash parameter");
		}
	}

	our $hash_parent = $input_params{'hash_parent'};
	if (defined $hash_parent) {
		if (!validate_refname($hash_parent)) {
			die_error(400, "Invalid hash parent parameter");
		}
	}

	our $hash_base = $input_params{'hash_base'};
	if (defined $hash_base) {
		if (!validate_refname($hash_base)) {
			die_error(400, "Invalid hash base parameter");
		}
	}

	our @extra_options = @{$input_params{'extra_options'}};
	# @extra_options is always defined, since it can only be (currently) set from
	# CGI, and $cgi->param() returns the empty array in array context if the param
	# is not set
	foreach my $opt (@extra_options) {
		if (not exists $allowed_options{$opt}) {
			die_error(400, "Invalid option parameter");
		}
		# compare as plain strings: $action may be undefined at this point,
		# and it should not be interpolated into a pattern
		if (!defined $action ||
		    !(grep { $_ eq $action } @{$allowed_options{$opt}})) {
			die_error(400, "Invalid option parameter for this action");
		}
	}

	our $hash_parent_base = $input_params{'hash_parent_base'};
	if (defined $hash_parent_base) {
		if (!validate_refname($hash_parent_base)) {
			die_error(400, "Invalid hash parent base parameter");
		}
	}

	# other parameters
	our $page = $input_params{'page'};
	if (defined $page) {
		if ($page =~ m/[^0-9]/) {
			die_error(400, "Invalid page parameter");
		}
	}

	our $searchtype = $input_params{'searchtype'};
	if (defined $searchtype) {
		if ($searchtype =~ m/[^a-z]/) {
			die_error(400, "Invalid searchtype parameter");
		}
	}

	our $search_use_regexp = $input_params{'search_use_regexp'};

	our $searchtext = $input_params{'searchtext'};
	# start from a clean value so nothing is carried over from an earlier
	# request served by the same process
	our $search_regexp = undef;
	if (defined $searchtext) {
		if (length($searchtext) < 2) {
			die_error(403, "At least two characters are required for search parameter");
		}
		if ($search_use_regexp) {
			$search_regexp = $searchtext;
			# the pattern comes straight from the user: compile it once here
			# so that a malformed regexp is reported as a client error
			# instead of dying later, wherever the pattern is first used
			if (!eval { qr/$search_regexp/; 1; }) {
				# strip the "at FILE line N" suffix from the diagnostic
				(my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
				die_error(400, "Invalid search regexp '" . esc_html($search_regexp) . "'",
				          esc_html($error));
			}
		} else {
			$search_regexp = quotemeta $searchtext;
		}
	}
}
1015
1016 # path to the current git repository
1017 our $git_dir;
sub evaluate_git_dir {
	our $git_dir;

	# only (re)set the repository path when a project was requested
	if ($project) {
		$git_dir = "$projectroot/$project";
	}
}
1021
1022 our (@snapshot_fmts, $git_avatar);
sub configure_gitweb_features {
	our (@snapshot_fmts, $git_avatar);

	# list of supported snapshot formats
	@snapshot_fmts = gitweb_get_feature('snapshot');
	@snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

	# the avatar feature must name a known provider whose dependencies
	# can be loaded; anything else resets $git_avatar to the empty string
	($git_avatar) = gitweb_get_feature('avatar');
	if ($git_avatar eq 'gravatar') {
		# gravatar needs Digest::MD5
		if (!eval { require Digest::MD5; 1; }) {
			$git_avatar = '';
		}
	} elsif ($git_avatar ne 'picon') {
		# 'picon' has no dependencies; every other name is unknown
		$git_avatar = '';
	}
}
1041
# custom error handler: 'die <message>' is Internal Server Error
# (the message it receives is already HTML escaped)
sub handle_errors_html {
	my ($escaped_msg) = @_;

	# switch back to a plain-text message first: if die_error itself
	# fails, this handler must not be entered again (infinite loop)
	set_message("Error occured when inside die_error:\n$escaped_msg");

	# the subroutine set via CGI::Carp::set_message is called _after_
	# HTTP headers are already written, so die_error is told not to write
	# them, and not to jump out, since it runs as the error handler
	die_error(undef, undef, $escaped_msg,
	          -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1056
# dispatch: choose a default action when none was requested, check that
# the action is known and has the project it needs, then run its handler
# from %actions.
sub dispatch {
	if (!defined $action) {
		if (defined $hash) {
			$action = git_get_type($hash);
			# git_get_type() is defined outside this chunk; presumably it
			# returns a false value when the object cannot be resolved.
			# Report that as "not found" instead of looking up an
			# undefined key in %actions below.
			$action or die_error(404, "Object does not exist");
		} elsif (defined $hash_base && defined $file_name) {
			$action = git_get_type("$hash_base:$file_name");
			$action or die_error(404, "File or directory does not exist");
		} elsif (defined $project) {
			$action = 'summary';
		} else {
			$action = 'project_list';
		}
	}
	if (!defined($actions{$action})) {
		die_error(400, "Unknown action");
	}
	# only these three actions can run without a project
	if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
	    !$project) {
		die_error(400, "Project needed");
	}
	$actions{$action}->();
}
1079
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	# restart the clock only if timing was enabled in the first place
	if (defined $t0) {
		$t0 = [Time::HiRes::gettimeofday()];
	}
	$number_of_git_cmds = 0;
}
1085
sub run_request {
	reset_timer();

	# URL pieces, configuration, load check
	evaluate_uri();
	evaluate_gitweb_config();
	check_loadavg();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list = $projectroot unless $projects_list;

	# request parameters: query string first, then PATH_INFO for what is
	# still missing, then validation
	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1105
1106 our $is_last_request = sub { 1 };
1107 our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
1108 our $CGI = 'CGI';
1109 our $cgi;
sub configure_as_fcgi {
	require CGI::Fast;
	our ($CGI, $is_last_request);

	# requests are created through CGI::Fast from now on
	$CGI = 'CGI::Fast';

	# let each child service 100 requests
	my $served = 0;
	$is_last_request = sub { ++$served > 100 };
}
sub evaluate_argv {
	# a script name ending in .fcgi selects FastCGI mode
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return unless (@ARGV);

	# handler for --nproc: install the FCGI::ProcManager hooks, or do
	# nothing when that module cannot be loaded
	my $setup_proc_manager = sub {
		my (undef, $n_processes) = @_;
		eval { require FCGI::ProcManager; 1; } or return;
		my $manager = FCGI::ProcManager->new({
			n_processes => $n_processes,
		});
		our ($pre_listen_hook, $pre_dispatch_hook, $post_dispatch_hook);
		$pre_listen_hook    = sub { $manager->pm_manage()        };
		$pre_dispatch_hook  = sub { $manager->pm_pre_dispatch()  };
		$post_dispatch_hook = sub { $manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i' => $setup_proc_manager,
	);
}
1140
sub run {
	evaluate_argv();
	evaluate_git_version();

	if ($pre_listen_hook) {
		$pre_listen_hook->();
	}

 REQUEST:
	while ($cgi = $CGI->new()) {
		if ($pre_dispatch_hook) {
			$pre_dispatch_hook->();
		}

		run_request();

		if ($post_dispatch_hook) {
			$post_dispatch_hook->();
		}

		# stop once the per-process request limit says so
		if ($is_last_request->()) {
			last REQUEST;
		}
	}

 DONE_GITWEB:
	1;
}
1164
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI) hand control back
# to the wrapper; as a pure CGI script serving a single request, exit.
return if defined caller;
exit;
1175
1176 ## ======================================================================
1177 ## action links
1178
# Build a gitweb URL from named parameters; the names are those of
# @cgi_param_mapping (project, action, hash, file_name, ...).
# 'project' defaults to the current $project.  Returns the URL string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		# take every parameter not given explicitly from the current request
		while (my ($name, $symbol) = each %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_url($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot.
		# The action is optional, so check that it is defined before
		# comparing it (avoids an "uninitialized value" warning).
		my $is_snapshot =
			defined $params{'action'} && $params{'action'} eq 'snapshot';

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_url($params{'action'}) unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
			|| $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_url($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# a name containing ".." stays a query parameter:
						# ".." is the parent/current separator in PATH_INFO
						$href .= ":/".esc_url($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_url($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_url($params{'hash_base'});
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_url($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_url($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly; walking the array form of the
	# mapping keeps the query parameters in a fixed order
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	return $href;
}
1296
1297
1298 ## ======================================================================
1299 ## validation, quoting/unquoting and escaping
1300
# returns the action name if it is a key of %actions, undef otherwise
sub validate_action {
	my ($candidate) = @_;
	return undef unless $candidate;
	return exists $actions{$candidate} ? $candidate : undef;
}
1306
# returns the project name if it passes every check below, undef otherwise
sub validate_project {
	my ($name) = @_;
	return undef unless $name;

	my $dir = "$projectroot/$name";
	# the checks run in this order and stop at the first failure
	return undef unless validate_pathname($name);
	return undef unless -d $dir;
	return undef unless check_export_ok($dir);
	return undef if $strict_export && !project_in_list($name);

	return $name;
}
1318
# returns the pathname if it is acceptable, undef otherwise
sub validate_pathname {
	my ($path) = @_;
	return undef unless $path;

	# no '.' or '..' as elements of path, i.e. no '.' nor '..'
	# at the beginning, at the end, and between slashes.
	# also this catches doubled slashes
	return undef if $path =~ m!(^|/)(|\.|\.\.)(/|$)!;

	# no null characters
	return undef if $path =~ m!\0!;

	return $path;
}
1334
# returns the ref name if it is acceptable, undef otherwise
sub validate_refname {
	my ($ref) = @_;
	return undef unless $ref;

	# textual hashes are O.K.
	return $ref if $ref =~ m/^[0-9a-fA-F]{40}$/;

	# it must be correct pathname
	my $checked = validate_pathname($ref);
	return undef unless $checked;

	# restrictions on ref name according to git-check-ref-format
	return undef if $checked =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

	return $checked;
}
1351
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Returns undef for undef.  A string that already carries the utf8 flag is
# returned unchanged, so calling this twice on the same data is harmless.
# Octets that are not valid UTF-8 are decoded with $fallback_encoding.
sub to_utf8 {
	my $str = shift;
	return undef unless defined $str;

	# utf8::valid() only tests the internal consistency of the scalar and
	# says nothing about whether the octets form valid UTF-8, so it cannot
	# be used to select the fallback.  utf8::decode() converts in place and
	# returns false when the octets are not valid UTF-8.
	if (utf8::is_utf8($str) || utf8::decode($str)) {
		return $str;
	} else {
		return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
	}
}
1365
# quote unsafe chars, but keep the slash, even when it's not
# correct, but quoted slashes look too horrible in bookmarks;
# spaces are written as '+'
sub esc_param {
	my ($value) = @_;
	return undef unless defined $value;

	$value =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$value =~ tr/ /+/;
	return $value;
}
1375
# quote unsafe chars in whole URL, so some characters cannot be quoted;
# spaces are written as '+'
sub esc_url {
	my ($url) = @_;
	return undef unless defined $url;

	$url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$url =~ tr/ /+/;
	return $url;
}
1384
# escape a string for HTML output: decode it with to_utf8(), HTML-escape
# it, and make control characters other than tab visible via quot_cec().
# With -nbsp => 1 spaces become &nbsp;
sub esc_html {
	my ($text, %opts) = @_;
	return undef unless defined $text;

	my $decoded = to_utf8($text);
	my $html = $cgi->escapeHTML($decoded);
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
	return $html;
}
1400
# quote control characters and escape filename to HTML;
# with -nbsp => 1 spaces become &nbsp;
sub esc_path {
	my ($path, %opts) = @_;
	return undef unless defined $path;

	my $decoded = to_utf8($path);
	my $html = $cgi->escapeHTML($decoded);
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	# every control character is quoted here, tab included
	$html =~ s|([[:cntrl:]])|quot_cec($1)|eg;
	return $html;
}
1416
# Make control characters "printable", using character escape codes (CEC)
#
# Takes one control character plus options; returns its escape sequence,
# wrapped in <span class="cntrl">...</span> unless -nohtml => 1 is given.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# characters without a named escape are shown as backslash plus two
	# hex digits; zero-pad, so that chr(1) gives '\01' and not '\ 1'
	my $chr = ( (exists $es{$cntrl})
	            ? $es{$cntrl}
	            : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1441
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR):
# the character is shown as the numeric entity for 0x2400 + its code,
# wrapped in <span class="cntrl">...</span> unless -nohtml => 1 is given
sub quot_upr {
	my ($cntrl, %opts) = @_;

	my $picture = sprintf('&#%04d;', 0x2400+ord($cntrl));
	return $opts{-nohtml}
		? $picture
		: "<span class=\"cntrl\">$picture</span>";
}
1455
# git may return quoted and escaped filenames: a name wrapped in double
# quotes has the quotes removed and its backslash escapes expanded; any
# other name is returned as is
sub unquote {
	my ($name) = @_;

	# translate the text that followed a backslash into the character
	# it stands for
	sub unq {
		my ($escape) = @_;

		# octal char sequence
		return chr(oct($escape)) if $escape =~ m/^[0-7]{1,3}$/;

		my %char_for = ( # character escape codes, aka escape sequences
			't' => "\t",   # tab            (HT, TAB)
			'n' => "\n",   # newline        (NL)
			'r' => "\r",   # return         (CR)
			'f' => "\f",   # form feed      (FF)
			'b' => "\b",   # backspace      (BS)
			'a' => "\a",   # alarm (bell)   (BEL)
			'e' => "\e",   # escape         (ESC)
			'v' => "\013", # vertical tab   (VT)
		);

		# C escape sequence, aka character escape code;
		# anything else is a quoted ordinary character
		return exists $char_for{$escape} ? $char_for{$escape} : $escape;
	}

	# nothing to do unless the whole name is quoted
	return $name unless $name =~ m/^"(.*)"$/;

	my $inner = $1;
	$inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $inner;
}
1491
# escape tabs (convert tabs to spaces), with tab stops every 8 columns
sub untabify {
	my ($line) = @_;
	my $tab_width = 8;

	my $pos;
	while (($pos = index($line, "\t")) != -1) {
		# pad up to the next tab stop: between 1 and 8 spaces
		my $pad = $tab_width - ($pos % $tab_width);
		substr($line, $pos, 1, ' ' x $pad);
	}

	return $line;
}
1505
# number of entries from git_get_projects_list() whose 'path' equals the
# given project (0 when there is no match or the list is empty)
sub project_in_list {
	my ($wanted) = @_;

	my @projects = git_get_projects_list();
	return scalar(@projects) unless @projects;

	my $matches = grep { $_->{'path'} eq $wanted } @projects;
	return $matches;
}
1511
1512 ## ----------------------------------------------------------------------
1513 ## HTML aware string manipulation
1514
# Shorten a string, preferably on a word boundary.
#
# Parameters: $str, $len, optional $add_len (default 10) and optional
# $where ('left' | 'center' | 'right', default 'right').
#
# The cut is attempted on a word boundary between position $len and
# $len+$add_len; if there is none, the string is cut at $len+$add_len.
# The removed part is replaced by an ellipsis filler, and nothing is cut
# when the result (with filler) would not be shorter than the input.
# $where selects which part of the string is dropped.
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right';

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# return early if chopping wouldn't make the string shorter;
	# the filler is 5 characters long in the middle, 4 at either end
	my $centered   = ($where eq 'center');
	my $filler_len = $centered ? 5 : 4;
	return $str if ($len + $filler_len >= length($str));

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if $centered;

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	if ($where eq 'left') {
		$str =~ m/^(.*?)($begre)$/;
		my ($lead, $body) = ($1, $2);
		$lead = " ..." if (length($lead) > 4);
		return "$lead$body";
	}

	if ($centered) {
		$str =~ m/^($endre)(.*)$/;
		my ($left, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($mid, $right) = ($1, $2);
		$mid = " ... " if (length($mid) > 5);
		return "$left$mid$right";
	}

	# 'right': keep the beginning, drop the end
	$str =~ m/^($endre)(.*)$/;
	my ($body, $tail) = ($1, $2);
	$tail = "... " if (length($tail) > 4);
	return "$body$tail";
}
1574
# Takes the same arguments as chop_str, and returns the HTML-escaped
# (possibly chopped) string. If the string did get chopped, the result is
# additionally wrapped in a <span> whose title attribute holds the full
# string, with control characters replaced by '?'.
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);
	# chop_str() passes its input through to_utf8() before chopping, so
	# the original has to go through the same conversion; otherwise the
	# comparison below could report an unchopped string as chopped, and
	# the title would be built from the unconverted string.
	$str = to_utf8($str);
	if ($chopped eq $str) {
		return esc_html($chopped);
	} else {
		$str =~ s/[[:cntrl:]]/?/g;
		return $cgi->span({-title=>$str}, esc_html($chopped));
	}
}
1589
1590 ## ----------------------------------------------------------------------
1591 ## functions returning short strings
1592
# CSS class for given age value (in seconds):
# "noage" when the age is undefined, "age0" below two hours,
# "age1" below two days, and "age2" for anything older.
sub age_class {
	my $age = shift;

	return "noage" unless defined $age;
	return "age0"  if $age < 60*60*2;
	return "age1"  if $age < 60*60*24*2;
	return "age2";
}
1607
# convert age in seconds to "nn units ago" string
#
# The largest unit of which the age exceeds two whole units is used, and
# the count is truncated to an integer. Ages of two seconds or less give
# " right now" (with the leading space).
sub age_string {
	my $age = shift;

	return int($age/60/60/24/365)      . " years ago"  if $age > 60*60*24*365*2;
	return int($age/60/60/24/(365/12)) . " months ago" if $age > 60*60*24*(365/12)*2;
	return int($age/60/60/24/7)        . " weeks ago"  if $age > 60*60*24*7*2;
	return int($age/60/60/24)          . " days ago"   if $age > 60*60*24*2;
	return int($age/60/60)             . " hours ago"  if $age > 60*60*2;
	return int($age/60)                . " min ago"    if $age > 60*2;
	return int($age)                   . " sec ago"    if $age > 2;
	return " right now";
}
1639
# Extra file type bit patterns, written in octal like file modes;
# S_IFGITLINK is the one S_ISGITLINK() tests for.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1644
# True if the file type bits of the (numeric) $mode are those of a
# gitlink: a submodule/subproject, i.e. a commit object reference.
sub S_ISGITLINK {
	my ($mode) = @_;

	my $type_bits = $mode & S_IFMT();
	return $type_bits == S_IFGITLINK;
}
1651
# convert file mode in octal to symbolic file mode string
# (in the style of the first column of "ls -l"; 'm' marks a submodule)
sub mode_str {
	my $mode = oct shift;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	return '----------' unless S_ISREG($mode);

	# regular file: git cares only about the executable bit
	return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1673
# convert file mode in octal to file type string
# ("submodule", "directory", "symlink", "file" or "unknown");
# an argument that is not a string of octal digits is returned unchanged
sub file_type {
	my $mode = shift;

	return $mode if ($mode !~ m/^[0-7]+$/);
	$mode = oct $mode;

	return S_ISGITLINK($mode)        ? "submodule"
	     : S_ISDIR($mode & S_IFMT()) ? "directory"
	     : S_ISLNK($mode)            ? "symlink"
	     : S_ISREG($mode)            ? "file"
	     :                             "unknown";
}
1696
# convert file mode in octal to file type description string;
# like file_type, but a regular file with the owner-executable bit set
# is described as "executable". An argument that is not a string of
# octal digits is returned unchanged.
sub file_type_long {
	my $mode = shift;

	return $mode if ($mode !~ m/^[0-7]+$/);
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT());
	return "symlink"   if S_ISLNK($mode);
	return "unknown"   unless S_ISREG($mode);

	return ($mode & S_IXUSR) ? "executable" : "file";
}
1723
1724
1725 ## ----------------------------------------------------------------------
1726 ## functions returning short HTML fragments, or transforming HTML fragments
1727 ## which don't belong to other sections
1728
# format line of commit message: the line is HTML-escaped (with -nbsp),
# and every run of 8 to 40 hexadecimal digits standing on its own is
# turned into a link to the "object" action for that id.
sub format_log_line_html {
	my $html = esc_html(shift, -nbsp=>1);

	my $object_link = sub {
		my $id = shift;
		return $cgi->a({-href => href(action=>"object", hash=>$id),
		                -class => "text"}, $id);
	};
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{$object_link->($1)}eg;

	return $html;
}
1741
# format marker of refs pointing to given object
#
# Parameters:
#   $refs - hash reference mapping an object id to an array reference of
#           ref names (e.g. "tags/v2.6.11" or "heads/next"); a name ending
#           in "^{}" marks an indirect (dereferenced) ref
#   $id   - id of the object to produce markers for
# Returns an HTML fragment (' <span class="refs">...</span>'), or the
# empty string if no ref points to $id.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;
	my $markers = '';

	if (defined $refs->{$id}) {
		foreach my $entry (@{$refs->{$id}}) {
			# Work on a copy: the loop variable aliases the element of the
			# caller's array, and stripping "^{}" in place would make a
			# later call for the same id see the ref as a direct one.
			my $ref = $entry;

			# this code exploits the fact that non-lightweight tags are the
			# only indirect objects, and that they are the only objects for which
			# we want to use tag instead of shortlog as action
			my ($type, $name) = qw();
			my $indirect = ($ref =~ s/\^\{\}$//);
			# e.g. tags/v2.6.11 or heads/next
			if ($ref =~ m!^(.*?)s?/(.*)$!) {
				$type = $1;
				$name = $2;
			} else {
				$type = "ref";
				$name = $ref;
			}

			my $class = $type;
			$class .= " indirect" if $indirect;

			my $dest_action = "shortlog";

			if ($indirect) {
				$dest_action = "tag" unless $action eq "tag";
			} elsif ($action =~ /^(history|(short)?log)$/) {
				$dest_action = $action;
			}

			my $dest = "";
			$dest .= "refs/" unless $ref =~ m!^refs/!;
			$dest .= $ref;

			# Ref names come from the repository and may contain HTML
			# metacharacters such as '<', '>', '&' or '"', so the link text
			# is escaped explicitly ...
			my $link = $cgi->a({
				-href => href(
					action=>$dest_action,
					hash=>$dest
				)}, esc_html($name));

			# ... and the attributes are left to CGI, which escapes the
			# attribute values it is given.
			$markers .= " " .
				$cgi->span({-class => $class, -title => to_utf8($ref)}, $link);
		}
	}

	if ($markers) {
		return ' <span class="refs">'. $markers . '</span>';
	} else {
		return "";
	}
}
1801
# format, perhaps shortened and with markers, title line
#
# Returns a link to $href with class "list subject", followed by $extra
# (if given). When $short is shorter than $long, the link shows $short and
# carries $long (control characters replaced by '?') as its title;
# otherwise it shows $long and has no title.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr = (-href => $href, -class => "list subject");
	my $text = $long;

	if (length($short) < length($long)) {
		$long =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($long);
		$text = $short;
	}

	return $cgi->a(\%attr, esc_html($text)) . $extra;
}
1817
1818 # Rather than recomputing the url for an email multiple times, we cache it
1819 # after the first hit. This gives a visible benefit in views where the avatar
1820 # for the same email is used repeatedly (e.g. shortlog).
1821 # The cache is shared by all avatar engines (currently gravatar and picon), which
1822 # are free to use it as preferred. Since only one avatar engine is used for any
1823 # given page, there's no risk for cache conflicts.
1824 our %avatar_cache = ();
1825
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first, and the complete url is cached per email.
sub picon_url {
	my $email = lc shift;

	$avatar_cache{$email} ||= do {
		my ($user, $domain) = split('@', $email);
		"http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
		"$domain/$user/" .
		"users+domains+unknown/up/single";
	};

	return $avatar_cache{$email};
}
1839
# Compute the gravatar url for a given (lowercased) email and size.
# Only the part of the url before the size is cached, since that is the
# computationally more expensive one (it needs the MD5 of the email);
# this also lets the same cache entry serve every size.
sub gravatar_url {
	my ($email, $size) = @_;
	$email = lc $email;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
			Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
1852
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
#
# Parameters:
#   $email - address whose avatar should be shown
#   %opts  - -size:       key into %avatar_size ('default' if missing or unknown)
#            -pad_before: if true, put "&nbsp;" before the image
#            -pad_after:  if true, put "&nbsp;" after the image
# Returns an <img> element (with the requested padding), or the empty
# string if $git_avatar selects no known avatar provider.
sub git_get_avatar {
	my ($email, %opts) = @_;
	my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
	my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
	$opts{-size} ||= 'default';
	my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};
	my $url = "";
	if ($git_avatar eq 'gravatar') {
		$url = gravatar_url($email, $size);
	} elsif ($git_avatar eq 'picon') {
		$url = picon_url($email);
	}
	# Other providers can be added by extending the if chain, defining $url
	# as needed. If no variant puts something in $url, we assume avatars
	# are completely disabled/unavailable.
	if ($url) {
		# The url may embed parts of $email (picon_url puts user and
		# domain into the path), so it must be escaped before it goes
		# into the src attribute.
		return $pre_white .
		       "<img width=\"$size\" " .
		            "class=\"avatar\" " .
		            "src=\"" . $cgi->escapeHTML($url) . "\" " .
		            "alt=\"\" " .
		       "/>" . $post_white;
	} else {
		return "";
	}
}
1881
# Wrap $displaytext (already formatted HTML) in a link that searches for
# commits by $author; $searchtype is 'author' or 'committer'.
# When the 'search' feature is not enabled, $displaytext is returned as is.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	return $displaytext unless gitweb_check_feature('search');

	# verb used in the link's tooltip
	my $performed = $searchtype eq 'author'    ? "authored"
	              : $searchtype eq 'committer' ? "committed"
	              :                              "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype), class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
1904
# format the author name of the given commit with the given tag
#
# Parameters: $tag (name of the enclosing HTML element), $co (commit hash
# reference providing 'author_name' and 'author_email'), followed by the
# optional chopping parameters of chop_str. The name is chopped and
# escaped, preceded by the author's avatar, and passed through
# format_search_author as an author search.
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar    = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $content   = format_search_author($co->{'author_name'}, "author",
	                                     $avatar . $name_html);

	return "<$tag class=\"author\">" . $content . "</$tag>";
}
1918
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
#
# The file names at the end of $line are replaced by escaped names taken
# from $from and $to (hash references with 'file' and optional 'href'),
# each linked when its 'href' is set. A combined diff
# ($diffinfo->{'nparents'} is true) shows only the $to name; an ordinary
# diff shows "a/<from> b/<to>".
sub format_git_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# escaped, optionally prefixed, file name of one side; linked if possible
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = $prefix . esc_path($side->{'file'});
		return $text unless $side->{'href'}; # file was added/deleted (no href)
		return $cgi->a({-href => $side->{'href'}, -class => "path"}, $text);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
1954
# format extended diff header line, before patch itself
#
# Parameters:
#   $line     - one extended header line ("copy from ...", "index ...",
#               a line ending in a six-digit mode, ...)
#   $diffinfo - hash reference with 'from_id', 'to_id' and, for a combined
#               diff, 'nparents' (then 'from_id' holds one id per parent)
#   $from/$to - hash references with 'file' and 'href' of each side
# Returns the line as HTML, terminated by "<br/>\n". Path names and object
# ids are turned into links where an href is available, and a trailing
# mode is followed by its file type description.
sub format_extended_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
		                       esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                 esc_path($to->{'file'}));
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		$line = 'index ';
		for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
			if ($from->{'href'}[$i]) {
				$line .= $cgi->a({-href=>$from->{'href'}[$i],
				                  -class=>"hash"},
				                 substr($diffinfo->{'from_id'}[$i],0,7));
			} else {
				$line .= '0' x 7;
			}
			# separator
			$line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
		}
		$line .= '..';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                 substr($diffinfo->{'to_id'},0,7));
		} else {
			$line .= '0' x 7;
		}

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff
		# (the dots are escaped so that only a literal ".." separates the ids)
		my ($from_link, $to_link);
		if ($from->{'href'}) {
			$from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			                     substr($diffinfo->{'from_id'},0,7));
		} else {
			$from_link = '0' x 7;
		}
		if ($to->{'href'}) {
			$to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                   substr($diffinfo->{'to_id'},0,7));
		} else {
			$to_link = '0' x 7;
		}
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2020
# format from-file/to-file diff header
#
# Parameters: the "--- ..." line, the "+++ ..." line, $diffinfo, the
# $from and $to hash references ('file' and 'href'; for a combined diff
# the $from entries hold one element per parent), and the list of parents.
# Returns one <div class="diff from_file"> per from-file followed by one
# <div class="diff to_file">.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my @divs;

	#assert($from_line =~ m/^---/) if DEBUG;
	if (! $diffinfo->{'nparents'}) {
		# ordinary (single parent) diff
		# no extra formatting for "^--- /dev/null"
		my $line = $from_line;
		if ($line =~ m!^--- "?a/!) {
			my $path = esc_path($from->{'file'});
			if ($from->{'href'}) {
				$path = $cgi->a({-href=>$from->{'href'}, -class=>"path"},
				                $path);
			}
			$line = '--- a/' . $path;
		}
		push @divs, qq!<div class="diff from_file">$line</div>\n!;

	} else {
		# combined diff (merge commit): one from-file line per parent
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $line = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				# "<n>" links to the diff against the n-th parent ...
				my $diff_link =
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$i],
					                     hash_parent_base=>$parents[$i],
					                     file_parent=>$from->{'file'}[$i],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . ($i+1)},
					        $i+1);
				# ... and the path links to the file in that parent
				my $path_link =
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
					        esc_path($from->{'file'}[$i]));
				$line = '--- ' . $diff_link . '/' . $path_link;
			}
			push @divs, qq!<div class="diff from_file">$line</div>\n!;
		}
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	# no extra formatting for "^+++ /dev/null"
	my $line = $to_line;
	if ($line =~ m!^\+\+\+ "?b/!) {
		my $path = esc_path($to->{'file'});
		if ($to->{'href'}) {
			$path = $cgi->a({-href=>$to->{'href'}, -class=>"path"},
			                $path);
		}
		$line = '+++ b/' . $path;
	}
	push @divs, qq!<div class="diff to_file">$line</div>\n!;

	return join('', @divs);
}
2086
# create note for patch simplified by combined diff:
# a "diff --cc <file>" header (the file name is linked to its blob unless
# the file was deleted), followed by a "Simple merge" note
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $path = esc_path($diffinfo->{'to_file'});
	unless (is_deleted($diffinfo)) {
		$path = $cgi->a({-href => href(action=>"blob",
		                               hash_base=>$hash,
		                               hash=>$diffinfo->{'to_id'},
		                               file_name=>$diffinfo->{'to_file'}),
		                 -class => "path"},
		                $path);
	}

	return "<div class=\"diff header\">" . "diff --cc " . $path . "</div>\n" .
	       "<div class=\"diff nodifferences\">" . "Simple merge" . "</div>\n";
}
2111
# format patch (diff) line (not to be used for diff headers)
#
# Parameters: the raw line, and optionally $from and $to (hash references
# with 'href'; for a combined diff $from->{'href'} is an array reference
# with one entry per parent).
# Returns the line wrapped in <div class="diff ...">, the class reflecting
# the kind of line (add, rem, chunk_header, incomplete). When $from and $to
# are given, the line ranges of a chunk header link to the starting line
# in the corresponding file.
sub format_diff_line {
	my $line = shift;
	my ($from, $to) = @_;
	my $diff_class = "";

	chomp $line;

	if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
		# combined diff: one status column per parent
		my $status = substr($line, 0, scalar @{$from->{'href'}});
		$diff_class =
			  $line =~ m/^\@{3}/        ? " chunk_header"
			: $line =~ m/^\\/           ? " incomplete"
			: index($status, '+') != -1 ? " add"
			: index($status, '-') != -1 ? " rem"
			:                             "";
	} else {
		# assume ordinary diff: the first character tells the kind of line
		my %class_of = (
			'+'  => " add",
			'-'  => " rem",
			'@'  => " chunk_header",
			"\\" => " incomplete",
		);
		my $marker = substr($line, 0, 1);
		$diff_class = $class_of{$marker} if exists $class_of{$marker};
	}

	$line = untabify($line);

	if ($from && $to && $line =~ m/^\@{2} /) {
		# chunk header of ordinary diff: "@@ -<start>[,<lines>] +<start>[,<lines>] @@<section>"
		my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
			$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

		if ($from->{'href'}) {
			$from_text = $cgi->a({-href=>$from->{'href'} . "#l" . $from_start,
			                      -class=>"list"}, $from_text);
		}
		if ($to->{'href'}) {
			$to_text   = $cgi->a({-href=>$to->{'href'} . "#l" . $to_start,
			                      -class=>"list"}, $to_text);
		}
		$line = '<span class="chunk_info">@@ ' . $from_text . ' ' . $to_text . ' @@</span>' .
		        '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
		return "<div class=\"diff$diff_class\">$line</div>\n";

	} elsif ($from && $to && $line =~ m/^\@{3}/) {
		# chunk header of combined diff: one range per parent, then the result range
		my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

		my @range_text = split(' ', $ranges);
		my @range_start;
		foreach my $range (@range_text) {
			# drop the leading '-' or '+', keep the start line
			my ($start) = (split(',', substr($range, 1)), 0);
			push @range_start, $start;
		}

		# the last range belongs to the result
		my $to_text  = pop @range_text;
		my $to_start = pop @range_start;

		my @parts;
		foreach my $i (0 .. $#range_text) {
			push @parts, $from->{'href'}[$i]
				? $cgi->a({-href=>$from->{'href'}[$i] . "#l" . $range_start[$i],
				           -class=>"list"}, $range_text[$i])
				: $range_text[$i];
		}
		push @parts, $to->{'href'}
			? $cgi->a({-href=>$to->{'href'} . "#l" . $to_start,
			           -class=>"list"}, $to_text)
			: $to_text;

		$line = "<span class=\"chunk_info\">$prefix " . join(" ", @parts) . " $prefix</span>" .
		        "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
		return "<div class=\"diff$diff_class\">$line</div>\n";
	}

	return "<div class=\"diff$diff_class\">" . esc_html($line, -nbsp=>1) . "</div>\n";
}
2200
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# Which of the three forms is produced depends on the number of entries
# in @snapshot_fmts (none, exactly one, more than one).
sub format_snapshot_links {
	my ($hash) = @_;
	my $num_fmts = @snapshot_fmts;

	# no snapshot formats at all
	return undef unless $num_fmts;

	if ($num_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		# i.e. "_snapshot_"
		my $fmt = $snapshot_fmts[0];
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
			}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	# e.g. "snapshot (_tar.gz_ _zip_)"
	my @links;
	foreach my $fmt (@snapshot_fmts) {
		push @links,
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				)
			}, $known_snapshot_formats{$fmt}{'display'});
	}
	return "snapshot (" . join(' ', @links) . ")";
}
2235
2236 ## ......................................................................
2237 ## functions returning values to be passed, perhaps after some
2238 ## transformation, to other functions; e.g. returning arguments to href()
2239
# Returns a hash of parameters to be passed to href() to generate the
# gitweb URL of a feed; the -title key holds a description of the link.
# The optional argument is the feed format name (default 'Atom'); its
# lowercased form becomes the 'action'.
# Returns nothing when no feed applies to the current view.
sub get_feed_info {
        my $format = shift || 'Atom';

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branch refs use the 'refs/heads/' prefix (fullname) to tell them
        # apart from tag links; $hash_base takes precedence over $hash
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                if (defined $ref && $ref =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type  = "history of $file_name";
                $type .= "/" if ($action eq 'tree');
                $type .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $type = "log of $branch";
        } else {
                $type = 'log';
        }

        my %res = (
                action      => lc($format),
                -title      => $type,
                'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
                'file_name' => $file_name,
        );

        return %res;
}
2275
2276 ## ----------------------------------------------------------------------
2277 ## git utility subroutines, invoking git commands
2278
# Returns, as a list, the path to the core git executable followed by the
# --git-dir parameter for the current $git_dir.  Every call is counted in
# $number_of_git_cmds.
sub git_cmd {
        $number_of_git_cmds += 1;
        return ($GIT, "--git-dir=$git_dir");
}
2284
# Quote the given arguments so they can be passed to the shell:
# each argument is wrapped in single quotes, and every ' or ! inside it
# is replaced by '\'' or '\!' respectively.
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $arg (@_) {
                # work on a copy, the caller's argument stays untouched
                (my $word = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$word'";
        }
        return join(' ', @quoted);
}
2293
# Returns the full hash that HEAD of the given project resolves to
# (see git_get_hash for the meaning of the return value)
sub git_get_head_hash {
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2298
# Resolves a revision of a project to its full hash; all arguments
# are handed to git_get_hash unchanged
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2302
# Resolves a revision of a project to an abbreviated hash by appending
# the '--short=7' option to the arguments handed to git_get_hash
sub git_get_short_hash {
        my @args = @_;
        return git_get_hash(@args, '--short=7');
}
2306
# Runs "git rev-parse --verify -q [options] <hash>" in the repository of
# the given project and returns the first line of output (chomped),
# or undef if the command could not be started or printed nothing.
# $git_dir is pointed at the project for the duration of the call and put
# back afterwards, but only if it had a defined value before.
sub git_get_hash {
        my ($project, $hash, @options) = @_;
        my $saved_git_dir = $git_dir;
        my $result;

        $git_dir = "$projectroot/$project";
        # built after $git_dir was switched, so git_cmd() sees the project
        my @rev_parse = (git_cmd(), 'rev-parse',
                         '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @rev_parse) {
                $result = <$fd>;
                chomp $result if defined $result;
                close $fd;
        }

        $git_dir = $saved_git_dir if (defined $saved_git_dir);
        return $result;
}
2323
# Returns the type of the object with the given hash, i.e. the first line
# printed by "git cat-file -t <hash>" (chomped).  Returns nothing when the
# command cannot be started or closing the pipe reports a failure.
sub git_get_type {
        my ($hash) = @_;

        my @cat_file = (git_cmd(), "cat-file", '-t', $hash);
        open my $fd, "-|", @cat_file
                or return;
        my $type = <$fd>;
        close $fd
                or return;

        chomp $type;
        return $type;
}
2334
# repository configuration cache:
# %config holds the parsed 'gitweb' section of a repository config, and
# $config_file names the config file it was read for; both are refreshed
# by git_get_project_config when "$git_dir/config" no longer matches
our %config;
our $config_file = '';
2338
# Adds $value under $key in the hash referenced by $hash.
# A key seen for the first time stores the value directly; from the second
# value on, the values are collected in an anonymous array reference
# (so single values are never stored as [ <value> ]).
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                if (ref $hash->{$key}) {
                        # third and later values: extend the existing list
                        push @{$hash->{$key}}, $value;
                } else {
                        # second value: promote the scalar to a list
                        $hash->{$key} = [ $hash->{$key}, $value ];
                }
        } else {
                $hash->{$key} = $value;
        }
}
2352
# Returns a hash of the git configuration of the current repository, as
# printed by "git config -z -l"; keys are full variable names
# ("section.key"), multi-valued variables are stored as array references
# (see hash_set_multi).
# The optional argument is a regexp (as a string) limiting the result to
# matching sections, e.g. 'gitweb'.
# Returns nothing if the git command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  (A pattern with the /o
        # modifier would keep using the regexp of the very first call, even
        # when a later call asks for a different section.)
        my $section_filter = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        # records of "git config -z" are NUL-terminated
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline;
                # a key without a value has no newline at all
                my ($key, $value) = split(/\n/, $keyval, 2);
                # an empty record yields no key at all
                next unless defined $key;
                next if (defined $section_filter && $key !~ $section_filter);

                hash_set_multi(\%config, $key, $value);
        }
        close $fh;

        return %config;
}
2375
# Convert a config value to a boolean (a true or false Perl value).
# True are: no value at all, a number other than 0, and the words 'true'
# and 'yes' in any letter case; surrounding whitespace is ignored.
# Everything else is false (never an error).
sub config_to_bool {
        my ($val) = @_;

        # "section.key" without a value
        return 1 unless defined $val;

        # strip leading and trailing whitespace
        for ($val) {
                s/^\s+//;
                s/\s+$//;
        }

        # "section.key = 1": a nonzero number is returned as is
        if ($val =~ /^\d+$/ && $val) {
                return $val;
        }
        # "section.key = true"
        return ($val =~ /^(?:true|yes)$/i);
}
2391
# Convert a config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (in any letter case) causes
# the number to be multiplied by 1024, 1048576, or 1073741824.
# A value without such a suffix is returned as is, with surrounding
# whitespace removed.
sub config_to_int {
        my ($val) = @_;
        my %multiplier = (
                'k' =>       1024,
                'm' =>    1048576,
                'g' => 1073741824,
        );

        # strip leading and trailing whitespace
        for ($val) {
                s/^\s+//;
                s/\s+$//;
        }

        return $val
                unless ($val =~ /^([0-9]*)([kmg])$/i);

        my ($num, $unit) = ($1, lc($2));
        # unknown unit is treated as 1
        return $num * ($multiplier{$unit} || 1);
}
2411
# Convert a config value to an array reference, if needed:
# a reference is returned unchanged, a defined scalar is wrapped in a
# one-element list, and an undefined value gives an empty list
sub config_to_multi {
        my ($val) = @_;

        return $val if ref($val);
        return [] unless defined($val);
        return [ $val ];
}
2418
# Returns the value of the gitweb.<key> variable from the configuration of
# the current repository ($git_dir).
# $key may be given with or without the 'gitweb.' prefix; $type is an
# optional 'bool' or 'int' (a leading '--' is accepted), anything else is
# ignored.  For 'bool' the result is the string 'true' or 'false', for
# 'int' the value converted by config_to_int, otherwise the raw value.
# Returns nothing when $git_dir is not set, the key is empty or contains
# non-word characters, or the variable does not exist.
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check: only 'bool' and 'int' are recognized
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # (re)read the config if the cache belongs to another repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        return unless exists $config{$full_key};
        my $value = $config{$full_key};

        # ensure given type
        return $value unless defined $type;
        if ($type eq 'bool') {
                # backward compatibility: 'git config --bool' returns true/false
                return config_to_bool($value) ? 'true' : 'false';
        }
        if ($type eq 'int') {
                return config_to_int($value);
        }
        return $value;
}
2457
# Get the hash of the entry at the given path in the given tree-ish.
# Parameters:
#   $base - tree-ish (ref) to look in
#   $path - path of the entry; trailing slashes are ignored
#   $type - optional object type ('blob', 'tree', ...) the entry must have
# Returns the hash, or undef if the path is missing or empty, there is
# no such entry, git-ls-tree output cannot be parsed, or the type does not
# match.  Dies via die_error if git-ls-tree cannot be started.
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift;
        my $type = shift;

        # test for emptiness rather than truth: '0' is a valid file name
        return undef unless (defined $path && $path ne '');

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # use the captures only if the line really matched, otherwise they
        # would still hold the result of some earlier match
        my ($entry_type, $entry_hash) =
                ($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/);
        return undef unless defined $entry_hash;

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2484
# Get the path of the entry with the given hash in the given tree-ish (ref);
# used to get 'from' filename for combined diff (merge commit) for renames.
# The tree is listed recursively (including subtrees) and the path of the
# first entry with that hash is returned; undef if there is none or
# git-ls-tree cannot be started.  Returns nothing if either argument is
# missing.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # "git ls-tree -z" terminates entries with NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        my $path;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # The hash is matched literally (\Q..\E) in its own column of
                # an anchored pattern; /s lets the path contain newlines,
                # which -z output does not quote.
                if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)$/s) {
                        $path = $1;
                        last;
                }
        }
        close $fd;
        return $path;
}
2508
2509 ## ......................................................................
2510 ## git utility functions, directly accessing git repository
2511
# Returns the description of the project at $path (relative to
# $projectroot): the first line of its 'description' file, chomped, or,
# if that file cannot be opened, the gitweb.description config variable.
# Sets the global $git_dir to the project's directory.
sub git_get_project_description {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/description") {
                return git_get_project_config('description');
        }
        my $descr = <$fd>;
        close $fd;

        chomp $descr if (defined $descr);
        return $descr;
}
2525
# Returns a reference to a hash of the content tags of the project at
# $path (relative to $projectroot): for every plain file in the project's
# 'ctags' directory, the file name is the tag and the first line of the
# file is its weight.  A file that is empty or does not hold a
# non-negative integer counts as weight 1, because the weights are summed
# up and compared numerically when the tag cloud is built.
# Returns an empty hash reference if there is no readable ctags directory.
# Sets the global $git_dir to the project's directory.
sub git_get_project_ctags {
        my $path = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$path";
        opendir my $dh, "$git_dir/ctags"
                or return $ctags;
        my @tag_files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
        closedir $dh;

        foreach my $tag_file (@tag_files) {
                open my $ct, '<', $tag_file or next;
                my $val = <$ct>;
                close $ct;
                # an empty file gives no line at all
                chomp $val if defined $val;

                # tag name is the file name without the directory part
                (my $ctag = $tag_file) =~ s#.*/##;
                $ctags->{$ctag} = (defined $val && $val =~ /^\d+$/) ? $val : 1;
        }
        return $ctags;
}
2544
# Prepares the data for a tag cloud from $ctags, a reference to a hash
# mapping tag names to weights.
# Tags differing only in letter case are merged under their lowercased
# name: 'count' is the sum of their weights, 'topname' the spelling with
# the highest single weight and 'topcount' that weight.
# Returns an HTML::TagCloud object filled with the merged tags if that
# module can be loaded, otherwise a reference to the merged hash.
sub git_populate_project_tagcloud {
        my ($ctags) = @_;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $merged = ($ctags_lc{lc $tag} ||= {});

                $merged->{count} += $weight;
                if (!$merged->{topcount} || $merged->{topcount} < $weight) {
                        $merged->{topcount} = $weight;
                        $merged->{topname} = $tag;
                }
        }

        # without HTML::TagCloud the merged hash itself is the "cloud"
        unless (eval { require HTML::TagCloud; 1; }) {
                return \%ctags_lc;
        }

        my $cloud = HTML::TagCloud->new;
        foreach my $lc_tag (sort keys %ctags_lc) {
                # Pad the title with spaces so that the cloud looks
                # less crammed.
                my $title = $ctags_lc{$lc_tag}->{topname};
                $title =~ s/ /&nbsp;/g;
                $title =~ s/^/&nbsp;/g;
                $title =~ s/$/&nbsp;/g;
                $cloud->add($title, $home_link."?by_tag=".$lc_tag, $ctags_lc{$lc_tag}->{count});
        }
        return $cloud;
}
2576
# Returns the HTML of the tag cloud prepared by
# git_populate_project_tagcloud, limited to $count tags.
# An HTML::TagCloud object renders itself (html_and_css); for the plain
# hash fallback a centered paragraph of comma-separated links is built
# from the first $count tags in ascending order of their 'count'.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;

        # (the debugging output that used to be printed to STDERR on each
        # call is gone, it only cluttered the web server's error log)
        if (ref $cloud eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                my @tags = sort { $cloud->{$a}->{count} <=> $cloud->{$b}->{count} } keys %$cloud;
                return '<p align="center">' . join (', ', map {
                        "<a href=\"$home_link?by_tag=$_\">$cloud->{$_}->{topname}</a>"
                } splice(@tags, 0, $count)) . '</p>';
        }
}
2589
# Returns the URLs of the project at $path (relative to $projectroot):
# the lines of its 'cloneurl' file, or, if that file cannot be opened,
# the value(s) of the gitweb.url config variable.
# In list context the URLs are returned as a list, otherwise as an array
# reference.  Sets the global $git_dir to the project's directory.
sub git_get_project_url_list {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        if (open my $fd, '<', "$git_dir/cloneurl") {
                my @git_project_url_list = map { chomp; $_ } <$fd>;
                close $fd;

                return wantarray ? @git_project_url_list : \@git_project_url_list;
        }

        # no cloneurl file: fall back to the repository configuration
        my $config_urls = config_to_multi(git_get_project_config('url'));
        return wantarray ? @{ $config_urls } : $config_urls;
}
2603
# Returns the list of projects as hash references with a 'path' key
# (and an 'owner' key when read from a file); only projects accepted by
# check_export_ok are included.
# $projects_list is either a directory that is searched for repositories,
# or a file with one url-encoded "<path> <owner>" entry per line.
# The optional $filter (a trailing '.git' is ignored) restricts the result
# to projects below that path, i.e. to forks of it.  When reading from a
# file without a filter and with the 'forks' feature enabled, forks of
# already listed projects are left out.
sub git_get_projects_list {
        my ($filter) = @_;
        my @list;

        $filter ||= '';
        $filter =~ s/\.git$//;

        my $check_forks = gitweb_check_feature('forks');

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                $dir .= "/$filter" if ($filter);
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $prefix_length = length($dir);
                my $prefix_depth = ($dir =~ tr!/!!);
                # found paths are reported relative to $projects_list
                my $path_prefix = ($filter ? "$filter/" : '');

                my $wanted = sub {
                        # global variables
                        our $project_maxdepth;
                        our $projectroot;
                        # skip project-list toplevel, if we get it.
                        return if (m!^[/.]$!);
                        # only directories can be git repositories
                        return unless (-d $_);
                        # don't traverse too deep (Find is super slow on os x)
                        my $depth = ($File::Find::name =~ tr!/!!) - $prefix_depth;
                        if ($depth > $project_maxdepth) {
                                $File::Find::prune = 1;
                                return;
                        }

                        # we check related file in $projectroot
                        my $path = $path_prefix .
                                substr($File::Find::name, $prefix_length + 1);
                        return unless (check_export_ok("$projectroot/$path"));

                        # a repository: record it and don't descend into it
                        push @list, { path => $path };
                        $File::Find::prune = 1;
                };

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => $wanted,
                }, $dir);

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                my %paths;
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        next PROJECT unless (defined $path);

                        if ($filter ne '') {
                                # looking for forks: keep only "$filter/....git"
                                next PROJECT
                                        if (substr($path, 0, length($filter)) ne $filter);
                                next PROJECT
                                        if (substr($path, length($filter)) !~ /^\/.*\.git$/);
                        } elsif ($check_forks) {
                                foreach my $parent (keys %paths) {
                                        # looking for forks: "$parent/....git"
                                        next if (substr($path, 0, length($parent)) ne $parent);
                                        next if (substr($path, length($parent)) !~ /^\/.*\.git$/);
                                        # is a fork, don't include it in
                                        # the list
                                        next PROJECT;
                                }
                        }

                        next PROJECT unless (check_export_ok("$projectroot/$path"));

                        push @list, {
                                path => $path,
                                owner => to_utf8($owner),
                        };
                        # remember the project as a possible parent of forks
                        (my $forks_path = $path) =~ s/\.git$//;
                        $paths{$forks_path}++;
                }
                close $fd;
        }
        return @list;
}
2706
# cache of project owners read from the $projects_list file:
# hash reference mapping project path to owner, undef until first read
our $gitweb_project_owner = undef;

# Fills $gitweb_project_owner from the $projects_list file, if that is a
# plain file; does nothing when the cache has been filled already.
# The cache is set to an empty hash before reading, so a missing or
# unreadable file is not tried again.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        return unless (-f $projects_list);

        # the file may exist and still be unreadable
        open(my $fd, '<', $projects_list)
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($pr, $ow) = split ' ', $line;
                # blank line, there is no project to record
                next unless (defined $pr);
                $pr = unescape($pr);
                $ow = unescape($ow);
                $gitweb_project_owner->{$pr} = to_utf8($ow);
        }
        close $fd;
        return;
}
2729
# Returns the owner of the given project, taken from the first of these
# sources that provides a defined value: the $projects_list file (via
# the $gitweb_project_owner cache), the gitweb.owner config variable,
# and get_file_owner for the project's directory.
# Returns undef for an empty project name; otherwise sets the global
# $git_dir to the project's directory.
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        git_get_project_list_from_file()
                unless (defined $gitweb_project_owner);

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if (exists $gitweb_project_owner->{$project});
        $owner = git_get_project_config('owner')
                unless (defined $owner);
        $owner = get_file_owner("$git_dir")
                unless (defined $owner);

        return $owner;
}
2753
# Returns the age of the most recent commit on any branch (refs/heads) of
# the project at $path, as the list (age in seconds, age_string of it).
# Returns (undef, undef) when git-for-each-ref printed no usable committer
# line, and an empty list when the command could not be started or closing
# the pipe reports a failure.
# Sets the global $git_dir to the project's directory.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @for_each_ref = (git_cmd(), 'for-each-ref',
                '--format=%(committer)',
                '--sort=-committerdate',
                '--count=1',
                'refs/heads');
        open(my $fd, "-|", @for_each_ref) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the committer line ends in "<epoch> <timezone>"
        my ($timestamp) = defined $most_recent
                ? ($most_recent =~ / (\d+) [-+][01]\d\d\d$/)
                : ();
        return (undef, undef) unless (defined $timestamp);

        my $age = time - $timestamp;
        return ($age, age_string($age));
}
2774
# Returns a reference to a hash mapping object hashes to array references
# of the ref names (without the 'refs/' prefix) pointing at them, as
# listed by "git show-ref --dereference".
# The optional $type (e.g. 'heads', 'tags') limits the refs considered.
# Returns nothing when the command cannot be started or closing the pipe
# reports a failure.
sub git_get_references {
        my $type = shift || "";
        my %refs;

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        my @show_ref = (git_cmd(), "show-ref", "--dereference");
        # use -- <pattern> if $type
        push @show_ref, "--", "refs/$type" if ($type);
        open my $fd, "-|", @show_ref
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless ($line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!);
                # the list for a new hash springs into existence here
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
2797
# Returns the name of the given revision relative to a tag, as found by
# "git name-rev --tags" (the part after 'tags/').
# Returns undef when no hash is given, name-rev printed nothing, or the
# revision cannot be described by a tag; returns nothing when the command
# cannot be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # no output at all
        return undef unless (defined $name_rev);

        # name-rev echoes its argument first; match it literally, as it
        # may contain characters that are special in a regexp
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
2813
2814 ## ----------------------------------------------------------------------
2815 ## parse to hash functions
2816
# Breaks the timestamp $epoch (seconds since the epoch) down into a hash.
# $tz is the timezone as "+hhmm" or "-hhmm" (default "-0000").
# Keys based on UTC: 'hour', 'minute', 'mday', 'day' (weekday name),
# 'month' (month name), 'rfc2822', 'mday-time', 'iso-8601'.
# Keys based on the local time in $tz: 'hour_local', 'minute_local',
# 'iso-tz'; 'tz_local' is $tz itself.
# A timezone that cannot be parsed is treated as a zero offset.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # Offset of the timezone in seconds.  The sign applies to hours and
        # minutes alike, and the minutes must not be truncated away
        # (think of +0530 or -0330).
        my $tz_offset = 0;
        if (my ($tz_sign, $tz_hour, $tz_min) =
            ($tz =~ m/^([+\-])([0-9][0-9])([0-9][0-9])$/)) {
                $tz_offset = ($tz_hour * 60 + $tz_min) * 60;
                $tz_offset = -$tz_offset if ($tz_sign eq '-');
        }
        my $local = $epoch + $tz_offset;
        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
2848
# Parses the tag object $tag_id (output of "git cat-file tag") into a hash
# with the keys 'id', 'object', 'type', 'name', 'author', 'author_epoch',
# 'author_tz', 'author_name', 'author_email' (the author keys come from
# the 'tagger' line) and 'comment', a reference to the list of the
# remaining lines.
# Returns nothing when the command cannot be started, closing the pipe
# reports a failure, or the object has no 'tag' line.
sub parse_tag {
        my ($tag_id) = @_;
        my %tag;
        my @comment;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
        $tag{'id'} = $tag_id;

        # header lines, up to the empty line or the start of a signature
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next;
                }
                if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                        next;
                }
                if ($line =~ m/--BEGIN/) {
                        # this line already belongs to the comment
                        push @comment, $line;
                        last;
                }
                last if ($line eq "");
        }

        # everything that is left is the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless (defined $tag{'name'});
        return %tag;
}
2889
# Parses one record of "git rev-list --header" output into a hash.
# Parameters:
#   $commit_text - the record: a line with the commit id (followed by the
#                  parent ids if --parents was used), the commit headers,
#                  an empty line, and the message indented by four spaces
#   $withparents - if defined, parents are taken from the first line
#                  only; otherwise 'parent' header lines are used as well
# Keys of the result: 'id', 'tree', 'parents' (array reference), 'parent'
# (first parent), 'author*' and 'committer*' (full, epoch, tz, name,
# email), 'title', 'title_short', 'comment' (reference to the list of
# message lines without the indentation), 'age', 'age_string',
# 'age_string_date' and 'age_string_age'.
# Returns nothing if the text is empty, does not start with a commit id,
# or has no 'tree' header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # headers end at the first empty line
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # remove added spaces (the indentation of the message)
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }

        # the title is the first non-empty line of the message
        foreach my $line (@commit_lines) {
                next if ($line eq "");

                # shorten a copy: the loop variable aliases the message
                # line, which must stay intact for $co{'comment'}
                my $title = $line;
                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        if (length($title) > 50) {
                                $title =~ s/(http|rsync):\/\///;
                        }
                        if (length($title) > 50) {
                                $title =~ s/(master|www|rsync)\.//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/kernel.org:?//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/\/pub\/scm//;
                        }
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        my $commit_date = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        # commits older than two weeks show the date first, the age second
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = $commit_date;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = $commit_date;
        }
        return %co;
}
2987
# Returns the hash describing the commit $commit_id, as produced by
# parse_commit_text from "git rev-list --parents --header --max-count=1";
# the hash is empty if the command printed nothing or the output could
# not be parsed.  Dies via die_error if git-rev-list cannot be started.
sub parse_commit {
        my ($commit_id) = @_;
        my %co;

        # records of "git rev-list --header" are NUL-terminated
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--"
                or die_error(500, "Open git-rev-list failed");
        # Read exactly one record, in scalar context: readline placed
        # directly in the argument list would be evaluated in list context
        # and contribute as many arguments as there are records.
        my $commit_text = <$fd>;
        close $fd;

        # parents are listed on the first line thanks to --parents
        %co = parse_commit_text($commit_text, 1)
                if (defined $commit_text);

        return %co;
}
3006
# Returns the commits listed by "git rev-list --header" starting at
# $commit_id, each parsed by parse_commit_text into a hash reference.
# Parameters:
#   $commit_id - revision to start from
#   $maxcount  - maximum number of commits (default 1)
#   $skip      - number of commits to skip first (default 0)
#   $filename  - optional path to limit the history to
#   @args      - further options for git-rev-list
# The global @extra_options are passed to git-rev-list as well.
# In list context the commits are returned as a list, otherwise as an
# array reference.  Dies via die_error if git-rev-list cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount ||= 1;
        $skip ||= 0;

        # records of "git rev-list --header" are NUL-terminated
        local $/ = "\0";

        my @rev_list = (git_cmd(), "rev-list",
                "--header",
                @args,
                "--max-count=$maxcount",
                "--skip=$skip",
                @extra_options,
                $commit_id,
                "--");
        push @rev_list, $filename if ($filename);

        open my $fd, "-|", @rev_list
                or die_error(500, "Open git-rev-list failed");
        my @cos;
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3034
# Parse one line of git-diff-tree "raw" output.
#
# Three line shapes are recognized:
#  * an ordinary diff line, e.g.
#    ':100644 100644 03b21826... 3b93d5e7... M   ls-files.c'
#    which fills from_mode, to_mode, from_id, to_id, status, similarity
#    and from_file/to_file (plus 'file' unless it is a rename or copy);
#  * a combined diff line (merge commit), e.g.
#    '::100755 100755 100755 60e79ca1... 94067cc5... 94067cc5... MR git-gui/git-gui.sh'
#    which fills nparents, to_mode, to_id, to_file, and array references
#    for from_mode, from_id and status (one entry per parent);
#  * a bare 40-hex-digit commit id, stored under 'commit'.
#
# Any other line yields an empty result.  Returns a hash in list context
# and a hash reference otherwise.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        if (my @field = $line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{qw(from_mode to_mode from_id to_id status similarity)} = @field[0..5];
                my $paths = $field[6];
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') {
                        # renamed or copied: "<from>\t<to>"
                        ($res{'from_file'}, $res{'to_file'}) =
                                map { unquote($_) } split("\t", $paths);
                } else {
                        my $file = unquote($paths);
                        $res{$_} = $file foreach qw(file to_file from_file);
                }
        }
        elsif (my ($colons, $modes, $ids, $status, $path) =
               $line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
                # combined diff: the last mode/id belongs to the result,
                # all preceding ones to the parents
                my @mode_list = split(' ', $modes);
                my @id_list   = split(' ', $ids);

                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @mode_list;
                $res{'from_mode'} = \@mode_list;
                $res{'to_id'}     = pop @id_list;
                $res{'from_id'}   = \@id_list;
                $res{'status'}    = [ split('', $status) ];
                $res{'to_file'}   = unquote($path);
        }
        elsif (my ($commit) = $line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $commit;
        }

        return wantarray ? %res : \%res;
}
3073
# Convenience wrapper around parse_difftree_raw_line().
# The argument is either a raw git-diff-tree line, which gets parsed,
# or a hash reference holding already parsed (or hand-made) info,
# which is handed back untouched.
sub parsed_difftree_line {
        my ($line_or_ref) = @_;

        # anything that is not a plain hash reference is raw text
        return parse_difftree_raw_line($line_or_ref)
                unless ref($line_or_ref) eq "HASH";

        return $line_or_ref;
}
3086
# Parse one line of git-ls-tree output.
#
# Arguments:
#   $line - the line to parse
#   %opts - '-l' => true if the line comes from "ls-tree -l" and so
#                   carries an object size column,
#           '-z' => true if the name is to be taken verbatim; otherwise
#                   it is passed through unquote()
#
# Expected formats:
#   with -l:    '100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
#   without -l: '100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
#
# Returns a hash (list context) or hash reference (otherwise) with keys
# mode, type, hash, name and, with -l, size.  A line that does not match
# the expected format yields an empty hash.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        my @keys = qw(mode type hash);
        my @fields;
        if ($opts{'-l'}) {
                push @keys, 'size';
                @fields = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;
        } else {
                @fields = $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;
        }

        # Capture into a list and test it: reading $1..$5 after a failed
        # match would pick up stale values from an earlier successful match
        # (possibly one done by the caller).
        if (@fields) {
                my $name = pop @fields; # the name is always the last capture
                @res{@keys} = @fields;
                $res{'name'} = $opts{'-z'} ? $name : unquote($name);
        }

        return wantarray ? %res : \%res;
}
3122
# Fill in _two_ hashes, passed by reference as the 2nd and 3rd argument,
# describing the "from" and "to" side of a parsed difftree line.
#
# Arguments:
#   $diffinfo - parsed difftree line (hash reference)
#   $from     - hash reference receiving 'file' and 'href' of the source
#   $to       - hash reference receiving 'file' and 'href' of the result
#   @parents  - parent commit ids, used for combined diffs
#
# For a combined diff (when $diffinfo->{'nparents'} is set) the 'file'
# and 'href' entries of $from are array references with one element per
# parent.  The 'href' entry is left out (or undef for a combined diff)
# where the file was added on that side; $to->{'href'} is removed when
# is_deleted() reports the file as deleted.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") {
                        # new (added) file has nothing to link to
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the result name when the name in
                        # this parent is not known
                        my $file = $diffinfo->{'from_file'}[$i];
                        $file = $diffinfo->{'to_file'} unless defined $file;
                        $from->{'file'}[$i] = $file;

                        if ($diffinfo->{'status'}[$i] eq "A") {
                                # new (added) file
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) {
                # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3168
3169 ## ......................................................................
3170 ## parse to array of hashes functions
3171
# List refs of the given classes, most recently committed first.
#
# Arguments:
#   $limit   - if true, ask git-for-each-ref for at most $limit+1 refs
#   @classes - ref namespaces below "refs/" to list; defaults to 'heads'
#
# Each entry of the result is a hash reference with the keys fullname,
# name (with a leading refs/heads/ or refs/remotes/ removed), id, title,
# epoch and age.  Returns the list in list context and a reference to
# it otherwise; returns nothing when the command cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;

        my @cmd = (git_cmd(), 'for-each-ref');
        push @cmd, '--count='.($limit+1) if $limit;
        push @cmd, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                map { "refs/$_" } @classes;

        open my $fd, '-|', @cmd
                or return;

        my @headslist;
        while (my $line = <$fd>) {
                chomp $line;

                # "<id> <refname> <subject>" NUL "<name> <epoch> <tz>"
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $fullname, $title) = split(' ', $refinfo, 3);
                my (undef, $epoch) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my $name = $fullname;
                $name =~ s!^refs/(?:head|remote)s/!!;

                my $age = "unknown";
                if ($epoch) {
                        $age = age_string(time - $epoch);
                }

                push @headslist, {
                        'fullname' => $fullname,
                        'name'     => $name,
                        'id'       => $hash,
                        'title'    => $title || '(no commit message)',
                        'epoch'    => $epoch,
                        'age'      => $age,
                };
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3210
# List refs below refs/tags, most recently created first.
#
# $limit, if true, restricts git-for-each-ref to at most $limit+1 refs.
#
# Each entry of the result is a hash reference with the keys fullname,
# name (without the refs/tags/ prefix), type, id, reftype and refid;
# tag objects also get 'subject', and tags and commits get 'epoch' and
# 'age'.  Returns the list in list context and a reference to it
# otherwise; returns nothing when the command cannot be started.
sub git_get_tags_list {
        my $limit = shift;

        my @cmd = (git_cmd(), 'for-each-ref');
        push @cmd, '--count='.($limit+1) if $limit;
        push @cmd, '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags';

        open my $fd, '-|', @cmd
                or return;

        my @tagslist;
        while (my $line = <$fd>) {
                chomp $line;

                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $fullname, $refid, $reftype, $title) =
                        split(' ', $refinfo, 6);
                my (undef, $epoch) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my $name = $fullname;
                $name =~ s!^refs/tags/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'type'     => $type,
                        'id'       => $id,
                        'name'     => $name,
                );

                if ($type eq "tag") {
                        # tag object: describe what it points at
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # ref points directly at the object
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = "unknown";
                        if ($epoch) {
                                $ref_item{'age'} = age_string(time - $epoch);
                        }
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3259
3260 ## ----------------------------------------------------------------------
3261 ## filesystem-related functions
3262
# Return the name of the owner of $path, taken from the GECOS field of
# the passwd entry of the file's owning uid, cut at the first ',' or ';'
# and converted with to_utf8().
#
# Returns undef when $path cannot be stat()ed or when no GECOS field is
# found for the owning uid.
sub get_file_owner {
        my $path = shift;

        # Without this check a failed stat() would leave the uid undefined,
        # and getpwuid(undef) looks up uid 0, reporting root as the owner.
        my @st = stat($path)
                or return undef;
        my $st_uid = $st[4];

        # element 6 of the passwd entry is the GECOS field
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }

        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3275
# Print the contents of $filename to the currently selected output
# handle, passing each line through to_utf8().
#
# Callers are expected to check that the file exists; if it nevertheless
# cannot be opened, nothing is printed.
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        # stream line by line instead of slurping the whole file into a list
        while (my $line = <$fd>) {
                print to_utf8($line);
        }
        close $fd;
}
3284
3285 ## ......................................................................
3286 ## mimetype related functions
3287
# Look up the MIME type for $filename in a mime.types-style map file.
#
# Arguments:
#   $filename - name of the file whose type is wanted; only the part
#               after the last '.' is used
#   $mimemap  - path of the map file; each non-comment line holds a MIME
#               type followed by the extensions it applies to, separated
#               by any whitespace (tabs or spaces)
#
# Returns the MIME type, or undef if the map file is not readable, the
# file name has no extension, or the extension is not listed.  When an
# extension is listed more than once the last entry wins.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # capture in list context so that a failed match cannot leave us
        # with a stale $1 from some earlier match
        my ($wanted_ext) = $filename =~ /\.([^.]*)$/;
        return undef unless defined $wanted_ext;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                # split(' ') ignores leading whitespace and the trailing
                # newline, and accepts both tabs and spaces as separators
                my ($mimetype, @exts) = split(' ', $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$wanted_ext};
}
3310
# Guess the MIME type of $filename from its extension.
#
# The map named by the global $mimetypes_file is consulted first (a
# relative path is taken relative to the current project's directory
# below $projectroot), then /etc/mime.types.  Returns undef when the
# name contains no '.' or no map knows the extension.
sub mimetype_guess {
        my $filename = shift;
        return undef unless $filename =~ /\./;

        my $mime;
        if ($mimetypes_file) {
                # an absolute path is used as is, anything else is
                # looked up inside the project
                my $file = ($mimetypes_file !~ m!^/!)
                        ? "$projectroot/$project/$mimetypes_file"
                        : $mimetypes_file;
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');

        return $mime;
}
3327
# Determine the MIME type of a blob.
#
# Arguments:
#   $fd       - filehandle the blob can be read from (may be false)
#   $filename - name of the blob (may be false)
#
# The type is guessed from the file name via mimetype_guess() if
# possible.  Failing that, $default_blob_plain_mimetype is returned when
# there is no filehandle; otherwise content that passes the -T test is
# 'text/plain', a few image extensions are recognized by name, and
# everything else is 'application/octet-stream'.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' if !$filename;

        # binary content: recognize some common image types by name
        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;

        return 'application/octet-stream';
}
3354
# Build the Content-Type value for a blob.
#
# $type is used when given (true); otherwise the type is determined by
# blob_mimetype($fd, $file_name).  For 'text/plain' the charset from
# $default_text_plain_charset is appended, if that is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);

        return $type . "; charset=$default_text_plain_charset";
}
3365
# Guess file syntax for syntax highlighting; return undef if no highlighting.
# The name of syntax can (in the future) depend on syntax highlighter used.
#
# Arguments:
#   $highlight - true if highlighting is wanted at all
#   $mimetype  - not used by this routine
#   $file_name - name of the file to be highlighted
#
# The basename (with a trailing '.in' removed) is looked up in
# %highlight_basename first; failing that, its extension is looked up in
# %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # Capture in list context: reading $1 after a failed match could
        # return a stale capture from an earlier match (even the caller's)
        # and so pick a syntax for a name that has no extension at all.
        my ($ext) = $basename =~ /\.([^.]*)$/;
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3382
# Run the syntax highlighter on the current blob and return a filehandle
# reading its output; if highlighting is off or no syntax is known, the
# original filehandle is returned unchanged.
#
# When highlighting, the passed filehandle is closed and replaced by a
# pipe reading "git cat-file blob $hash" (global $hash) filtered through
# $highlight_bin.
# NOTE(review): $syntax goes into the shell command unquoted; it
# presumably always comes from the highlight configuration tables --
# confirm before feeding it anything user-controlled.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;

        if (!$highlight || !defined $syntax) {
                return $fd;
        }

        close $fd
                or die_error(404, "Reading blob failed");

        my $pipeline =
                quote_command(git_cmd(), "cat-file", "blob", $hash) .
                " | " .
                quote_command($highlight_bin) .
                " --xhtml --fragment --syntax $syntax |";
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");

        return $fd;
}
3397
3398 ## ======================================================================
3399 ## functions printing HTML: header, footer, error page
3400
# Compose the page title from the global request state:
# "<site name>[ - <project>[/<action>[ - <file name>[/]]]]".
# Each part is only added when the one before it is defined; a trailing
# slash is added to the file name for the "tree" action unless the name
# already ends with one.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        # $action is US-ASCII (7bit ASCII)
                        $title .= "/$action";

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        }

        return $title;
}
3418
# Print the HTTP header and the top of the HTML page: <head> with
# stylesheets, feed links and favicon, the optional site header file,
# the "page_header" breadcrumb line and, for a project with the 'search'
# feature enabled, the search form.
#
# Arguments:
#   $status  - HTTP status line (defaults to "200 OK")
#   $expires - value for the Expires header (may be undef)
#   %opts    - '-no_http_header' => true to skip printing the HTTP header,
#              '-action_extra'   => extra text appended to the breadcrumb;
#                                   when given, the action name is printed
#                                   as a link
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type;
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        if (defined $cgi->http('HTTP_ACCEPT') &&
            $cgi->http('HTTP_ACCEPT') =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
            $cgi->Accept('application/xhtml+xml') != 0) {
                $content_type = 'application/xhtml+xml';
        } else {
                $content_type = 'text/html';
        }
        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                           -status=> $status, -expires => $expires)
                unless ($opts{'-no_http_header'});
        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        if ($ENV{'PATH_INFO'}) {
                print "<base href=\"".esc_url($base_url)."\" />\n";
        }
        # print out each stylesheet that exists, providing backwards
        # compatibility for those people who defined $stylesheet in
        # a config file
        if (defined $stylesheet) {
                print '<link rel="stylesheet" type="text/css" href="'.$stylesheet.'"/>'."\n";
        } else {
                foreach my $stylesheet (@stylesheets) {
                        next unless $stylesheet;
                        print '<link rel="stylesheet" type="text/css" href="'.$stylesheet.'"/>'."\n";
                }
        }
        if (defined $project) {
                # feed links for the current project view
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                # the list has to be parenthesized: using a bare qw(...) as
                # the loop parentheses is a syntax error in newer perls
                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => "$project - $href_params{'-title'} - $format feed",
                                '-type' => "application/$type+xml"
                        );

                        $href_params{'action'} = $type;
                        $link_attr{'-href'} = href(%href_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        # second variant of the same feed, without merges
                        $href_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%href_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                # no project selected: link the site-wide project lists
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       $site_name, href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       $site_name, href(project=>undef, action=>"opml"));
        }
        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href="$favicon" type="image/png" />\n);
        }

        print "</head>\n" .
              "<body>\n";

        if (defined $site_header && -f $site_header) {
                insert_file($site_header);
        }

        # breadcrumb line: logo, home link, project, action, extra
        print "<div class=\"page_header\">\n" .
              $cgi->a({-href => esc_url($logo_url),
                       -title => $logo_label},
                      qq(<img src="$logo" width="72" height="27" alt="git" class="logo"/>));
        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        my $action_print = $action ;
                        if (defined $opts{-action_extra}) {
                                $action_print = $cgi->a({-href => href(action=>$action)},
                                        $action);
                        }
                        print " / $action_print";
                }
                if (defined $opts{-action_extra}) {
                        print " / $opts{-action_extra}";
                }
                print "\n";
        }
        print "</div>\n";

        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                if (!defined $searchtext) {
                        $searchtext = "";
                }
                # search starts from the most specific revision we know about
                my $search_hash;
                if (defined $hash_base) {
                        $search_hash = $hash_base;
                } elsif (defined $hash) {
                        $search_hash = $hash;
                } else {
                        $search_hash = "HEAD";
                }
                # form target; note that this lexical shadows the global $action
                my $action = $my_uri;
                my $use_pathinfo = gitweb_check_feature('pathinfo');
                if ($use_pathinfo) {
                        $action .= "/".esc_url($project);
                }
                # with path_info the project is part of the form action,
                # otherwise it is passed as hidden "p" parameter
                print $cgi->startform(-method => "get", -action => $action) .
                      "<div class=\"search\">\n" .
                      (!$use_pathinfo &&
                      $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
                      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
                      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
                      $cgi->popup_menu(-name => 'st', -default => 'commit',
                                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
                      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
                      " search:\n",
                      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
                      "<span title=\"Extended regular expression\">" .
                      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                     -checked => $search_use_regexp) .
                      "</span>" .
                      "</div>" .
                      $cgi->end_form() . "\n";
        }
}
3580
# Print the bottom of the HTML page: the "page_footer" div (project
# description and feed links, or the OPML/TXT project list links when no
# project is selected), optional timing information, the optional site
# footer file, the JavaScript includes and the closing </body></html>.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                if (defined $descr) {
                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
                }

                my %href_params = get_feed_info();
                if (!%href_params) {
                        # no feed info for this view: mark the links as generic
                        $feed_class .= ' generic';
                }
                $href_params{'-title'} ||= 'log';

                # the list has to be parenthesized: using a bare qw(...) as
                # the loop parentheses is a syntax error in newer perls
                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        } else {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        }
        print "</div>\n"; # class="page_footer"

        # timing info needs the start time recorded in $t0
        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      Time::HiRes::tv_interval($t0, [Time::HiRes::gettimeofday()]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="$javascript"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } elsif (gitweb_check_feature('javascript-actions')) {
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = fixLinks;\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
3646
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
#
# Prints a complete error page (header, message, optional details,
# footer) and then jumps to the DONE_GITWEB label, unless the
# '-error_handler' option is set.  Options following the three
# positional arguments are also passed on to git_header_html().
# The error message is escaped with esc_html(); the detailed
# description is printed as given.
#
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
sub die_error {
        my ($status, $error, $extra, %opts) = @_;

        $status = 500 unless $status;
        $error = esc_html($error) || "Internal Server Error";

        # full status lines for the codes listed above
        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );

        git_header_html($http_responses{$status}, undef, %opts);

        print "<div class=\"page_body\">\n" .
              "<br /><br />\n" .
              "$status - $error\n" .
              "<br />\n";
        print "<hr />\n" .
              "$extra\n"
                if defined $extra;
        print "</div>\n";

        git_footer_html();

        if (!$opts{'-error_handler'}) {
                goto DONE_GITWEB;
        }
}
3690
3691 ## ----------------------------------------------------------------------
3692 ## functions printing or outputting HTML: navigation
3693
# Print the "page_nav" div: the row of links to the standard views
# (summary, shortlog, log, commit, commitdiff, tree) plus any links
# configured through the 'actions' feature, followed by $extra.
#
# Arguments:
#   $current  - name of the current view; printed as plain text
#   $suppress - name of a view to leave out (if true)
#   $head     - hash for the commit/commitdiff links (and shortlog/log,
#               for some current views)
#   $treehead - hash for the tree link
#   $treebase - hash_base for the tree link
#   $extra    - extra HTML for the second line (pager or formats)
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                   qw(summary shortlog log commit commitdiff tree);

        # href() parameters for each view
        my %arg;
        $arg{$_} = {action=>$_} foreach @navs;

        if (defined $head) {
                my @views_with_head = qw(commit commitdiff);
                push @views_with_head, qw(shortlog log)
                        if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x);
                $arg{$_}{'hash'} = $head foreach @views_with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        # placeholders that may be used in configured action links
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        # the 'actions' feature is a flat list of (label, link, position)
        my @actions = gitweb_get_feature('actions');
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # put the new label right after the view named by $pos
                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
                # expand the placeholders
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @links;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @links, $nav;
                        next;
                }
                push @links,
                        $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" .
              join(" | ", @links);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
3743
# Returns a submenu for the navigation of the refs views (tags, heads,
# remotes): the views are joined with " | ", the current view is plain
# text and the others are links.  The remotes view is only offered if
# the 'remote_heads' feature is enabled.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = qw{tags heads};
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @items;
        foreach my $view (@ref_views) {
                if ($view eq $current) {
                        push @items, $view;
                } else {
                        push @items, $cgi->a({-href => href(action=>$view)}, $view);
                }
        }

        return join(" | ", @items);
}
3756
# Returns the "first . prev . next" paging navigation as an HTML string.
# $page is the number of the page being shown (the "first" and "prev" entries
# are links only when it is greater than 0); $has_next_link tells whether the
# "next" entry should be a link.  $action is accepted but not used here.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;
        my @entries;

        if ($page > 0) {
                push @entries,
                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first"),
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        } else {
                push @entries, "first", "prev";
        }

        if ($has_next_link) {
                push @entries,
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        } else {
                push @entries, "next";
        }

        return join(" &sdot; ", @entries);
}
3782
3783 ## ......................................................................
3784 ## functions printing or outputting HTML: div
3785
# Prints a <div class="header"> holding a single link.  The link target is
# built by href() from $action plus, when they are true, $hash and
# $hash_base; the link text is $title, or $action when $title is false.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $label = $title || $action;
        my $link = $cgi->a({-href => href(%args), -class => "title"}, $label);

        print "<div class=\"header\">\n" . $link . "\n</div>\n";
}
3799
# Returns one "metadata_url" table row with $name in the first cell and $url
# in the second.  Both values are inserted into the markup as given.
sub format_repo_url {
        my ($name, $url) = @_;

        return '<tr class="metadata_url">'
             . '<td>' . $name . '</td>'
             . '<td>' . $url . '</td>'
             . "</tr>\n";
}
3804
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be:
#  - a plain scalar, which is output as-is;
#  - a scalar reference, which is output after html escaping;
#  - a filehandle, passed as *handle, \*handle, *handle{IO} or as a lexical
#    handle/handle object, whose remaining lines are read and output;
#  - a function reference, in which case all following parameters are
#    passed as arguments to that function.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        # Filehandles need care:
        #  - a bare glob (*handle) is not a reference at all, so ref() is ''
        #    and only a reference *to* the scalar reveals the GLOB;
        #  - *handle{IO} is blessed into IO::File on perl >= 5.12 and into
        #    IO::Handle before that, and handle objects are blessed glob
        #    references, so the underlying type is checked instead of the
        #    class name.
        require Scalar::Util;
        my $reftype = Scalar::Util::reftype($content) || '';
        my $is_handle = $reftype eq 'GLOB'
                     || $reftype eq 'IO'
                     || ref(\$content) eq 'GLOB';

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
3842
# Prints the fragment produced by format_local_time() for the given
# arguments, which are passed through unchanged.
sub print_local_time {
        my $formatted = format_local_time(@_);
        print $formatted;
}
3846
# Returns the " (HH:MM TZ)" fragment for a date given as a key/value list
# with the 'hour_local', 'minute_local' and 'tz_local' keys.  When the local
# hour is before 6, the time is wrapped in a <span class="atnight">.
sub format_local_time {
        my %date = @_;
        my ($hour, $minute, $tz) = @date{qw(hour_local minute_local tz_local)};

        my $template = ($hour < 6)
                ? " (<span class=\"atnight\">%02d:%02d</span> %s)"
                : " (%02d:%02d %s)";

        return sprintf($template, $hour, $minute, $tz);
}
3860
# Prints the author name and author date of commit $co in long form.
# Options (key/value pairs following $co):
#   -tag       => name of the enclosing HTML element (default 'div')
#   -localtime => when true, the local time is printed after the date
sub git_print_authorship {
        my ($co, %opts) = @_;

        my $tag = $opts{-tag} ? $opts{-tag} : 'div';
        my $author = $co->{'author_name'};
        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $author_link = format_search_author($author, "author", esc_html($author));
        print "<$tag class=\"author_date\">" . $author_link . " [$ad{'rfc2822'}";

        # print_local_time() writes directly to the output, so it has to be
        # called between the two halves of the element
        if ($opts{-localtime}) {
                print_local_time(%ad);
        }

        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);
        print "]" . $avatar . "</$tag>\n";
}
3876
# Prints table rows with the full author and/or committer information, in
# the format expected for the 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# ('author', 'committer') to print rows for; an empty list means both.
# Each person gets two rows: name, e-mail and avatar, then the date with the
# local time.
sub git_print_authorship_rows {
        my $co = shift;
        my @people = @_ ? @_ : ('author', 'committer');

        foreach my $who (@people) {
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link  = format_search_author($name, $who, esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');

                print "<tr><td>$who</td><td>" . $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" . $avatar . "</td></tr>\n" .
                      "<tr><td></td><td> $wd{'rfc2822'}";
                # print_local_time() writes directly to the output
                print_local_time(%wd);
                print "</td></tr>\n";
        }
}
3904
# Prints the "page_path" breadcrumb: a link to the tree root labelled with
# the project name, then one link per leading directory of $name, then the
# last path component.
# Parameters:
#   $name - path of the object within the tree (may be undefined, in which
#           case only the root link is printed)
#   $type - 'blob' links the last component to the 'blob_plain' view, 'tree'
#           links it to the 'tree' view; anything else prints it unlinked
#   $hb   - hash base used in all generated links
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth value: a leading
                        # directory named "0" is false but still needs the
                        # separator before the next component
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # the last component links to the path this function was
                # given, so that the target always agrees with the title and
                # the label
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
3942
# Prints the lines of a commit message as HTML, one line per <br/>.
# Parameters:
#   $log  - array reference with the lines of the message; note that the
#           title (if requested) and leading empty lines are removed from
#           this array itself
#   %opts - options:
#     -remove_title     => drop the first line of the log
#     -remove_signoff   => do not print signoff-like lines (Signed-off-by,
#                          Acked-by, Cc)
#     -final_empty_line => end the output with a single empty line
# Runs of empty lines are collapsed into one, and empty lines directly
# following a signoff-like line are not printed.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # previous line was a signoff-like line
        my $empty = 0;   # previous printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n"
                                unless $opts{'-remove_signoff'};
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                }
                # Reset only after the check above: clearing the flag before
                # the check would make it impossible to ever skip an empty
                # line that follows a signoff.
                $signoff = 0;

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
3991
# Returns the link target (what the link points to) of the symlink blob
# $hash, i.e. the whole output of "git cat-file blob $hash".  Returns
# nothing when the command cannot be started or when closing it fails.
sub git_get_link_target {
        my $hash = shift;

        open(my $fd, "-|", git_cmd(), "cat-file", "blob", $hash)
                or return;

        # slurp the whole blob in one read
        my $link_target = do { local $/ = undef; <$fd> };

        close($fd)
                or return;

        return $link_target;
}
4009
# Given a link target and the directory (basedir) the link is in, return the
# target of the link relative to the top directory (top tree).
# Returns nothing (undef in scalar context) when that is not possible:
# for absolute links, and for links leading outside the top directory.
# An empty or undefined $basedir means the link is in the top directory.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # compare against the empty string rather than testing for truth,
        # so that a directory named "0" is not mistaken for the top tree
        my $path;
        if (defined $basedir && $basedir ne '') {
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and '' (but keep a component named "0")
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        # link leads outside repository (outside top dir)
                        return unless @path_parts;
                        pop @path_parts;
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
4049
# Prints the cells of one row of the tree listing for entry $t; the
# enclosing <tr> element is left to the caller.
# Parameters:
#   $t          - hash reference describing the entry ('mode', 'type',
#                 'hash', 'name' and optionally 'size')
#   $basedir    - prefix put directly in front of the entry name to form
#                 the file name used in links
#   $hash_base  - hash base for the links; history links are printed only
#                 when it is defined
#   $have_blame - when true, blobs also get a 'blame' link
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = defined($hash_base) ? ('hash_base' => $hash_base) : ();

        # The format of a table row is: mode list link.  Where mode is
        # the mode of the entry, list is the name of the entry, an href,
        # and link is the action links of the entry.

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        if ($t->{'type'} eq "blob") {
                my $path = "$basedir$t->{'name'}";
                my @blob_args = (action=>"blob", hash=>$t->{'hash'},
                                 file_name=>$path, %base_key);

                # name cell; symbolic links additionally show their target
                my $name_cell = $cgi->a({-href => href(@blob_args), -class => "list"},
                                        esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                $name_cell .= " -> ";
                                if (defined $norm_target) {
                                        # target can be resolved within the tree: link to it
                                        $name_cell .=
                                                $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                       file_name=>$norm_target),
                                                         -title => $norm_target}, esc_path($link_target));
                                } else {
                                        $name_cell .= esc_path($link_target);
                                }
                        }
                }
                print "<td class=\"list\">" . $name_cell . "</td>\n";

                # action links: blob [| blame] [| history] | raw
                my @links = ($cgi->a({-href => href(@blob_args)}, "blob"));
                if ($have_blame) {
                        push @links,
                                $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                       file_name=>$path, %base_key)},
                                        "blame");
                }
                if (defined $hash_base) {
                        push @links,
                                $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                       hash=>$t->{'hash'}, file_name=>$path)},
                                        "history");
                }
                push @links,
                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                               file_name=>$path)},
                                "raw");
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } elsif ($t->{'type'} eq "tree") {
                my $path = "$basedir$t->{'name'}";
                my @tree_args = (action=>"tree", hash=>$t->{'hash'},
                                 file_name=>$path, %base_key);

                print "<td class=\"list\">" .
                      $cgi->a({-href => href(@tree_args)}, esc_path($t->{'name'})) .
                      "</td>\n";

                # action links: tree [| history]
                my @links = ($cgi->a({-href => href(@tree_args)}, "tree"));
                if (defined $hash_base) {
                        push @links,
                                $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                       file_name=>$path)},
                                        "history");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" . esc_path($t->{'name'}) . "</td>\n";

                my $history = '';
                if (defined $hash_base) {
                        $history = $cgi->a({-href => href(action=>"history",
                                                          hash_base=>$hash_base,
                                                          file_name=>"$basedir$t->{'name'}")},
                                           "history");
                }
                print "<td class=\"link\">" . $history . "</td>\n";
        }
}
4142
4143 ## ......................................................................
4144 ## functions printing large fragments of HTML
4145
# Fills in the pre-image filenames for a merge (combined) diff.
# $diff->{'from_file'} is replaced by an array with one slot per parent
# ($diff->{'nparents'} of them).  A slot is set, via git_get_path_by_hash(),
# only for parents whose status is 'R' or 'C'; all other slots stay
# undefined.
# Returns $diff itself.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my @from_file;
        $diff->{'from_file'} = \@from_file;

        # give the array one (undefined) slot per parent
        my $last = $diff->{'nparents'} - 1;
        $from_file[$last] = undef;

        foreach my $i (0 .. $last) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $from_file[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4162
# Tells whether the parsed raw difftree line $diffinfo describes a file
# deletion, i.e. whether its 'to_id' is the null object id.
# The null id is all zeros: 40 hex digits for SHA-1 object names and
# 64 hex digits for SHA-256 object names; both forms are recognized.
sub is_deleted {
        my $diffinfo = shift;
        my $to_id = $diffinfo->{'to_id'};

        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4169
# Tells whether a patch corresponds to the [previous] difftree raw line.
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# The result is true when both are defined and name the same 'to_file'.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        my $both_known = defined($diffinfo) && defined($patchinfo);
        return $both_known unless $both_known;

        return $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4180
4181
4182 sub git_difftree_body {
4183         my ($difftree, $hash, @parents) = @_;
4184         my ($parent) = $parents[0];
4185         my $have_blame = gitweb_check_feature('blame');
4186         print "<div class=\"list_head\">\n";
4187         if ($#{$difftree} > 10) {
4188                 print(($#{$difftree} + 1) . " files changed:\n");
4189         }
4190         print "</div>\n";
4191
4192         print "<table class=\"" .
4193               (@parents > 1 ? "combined " : "") .
4194               "diff_tree\">\n";
4195
4196         # header only for combined diff in 'commitdiff' view
4197         my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
4198         if ($has_header) {
4199                 # table header
4200                 print "<thead><tr>\n" .
4201                        "<th></th><th></th>\n"; # filename, patchN link
4202                 for (my $i = 0; $i < @parents; $i++) {
4203                         my $par = $parents[$i];
4204                         print "<th>" .
4205                               $cgi->a({-href => href(action=>"commitdiff",
4206                                                      hash=>$hash, hash_parent=>$par),
4207                                        -title => 'commitdiff to parent number ' .
4208                                                   ($i+1) . ': ' . substr($par,0,7)},
4209                                       $i+1) .
4210                               "&nbsp;</th>\n";
4211                 }
4212                 print "</tr></thead>\n<tbody>\n";
4213         }
4214
4215         my $alternate = 1;
4216         my $patchno = 0;
4217         foreach my $line (@{$difftree}) {
4218                 my $diff = parsed_difftree_line($line);
4219
4220                 if ($alternate) {
4221                         print "<tr class=\"dark\">\n";
4222                 } else {
4223                         print "<tr class=\"light\">\n";
4224                 }
4225                 $alternate ^= 1;
4226
4227                 if (exists $diff->{'nparents'}) { # combined diff
4228
4229                         fill_from_file_info($diff, @parents)
4230                                 unless exists $diff->{'from_file'};
4231
4232                         if (!is_deleted($diff)) {
4233                                 # file exists in the result (child) commit
4234                                 print "<td>" .
4235                                       $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4236                                                              file_name=>$diff->{'to_file'},
4237                                                              hash_base=>$hash),
4238                                               -class => "list"}, esc_path($diff->{'to_file'})) .
4239                                       "</td>\n";
4240                         } else {
4241                                 print "<td>" .
4242                                       esc_path($diff->{'to_file'}) .
4243                                       "</td>\n";
4244                         }
4245
4246                         if ($action eq 'commitdiff') {
4247                                 # link to patch
4248                                 $patchno++;
4249                                 print "<td class=\"link\">" .
4250                                       $cgi->a({-href => "#patch$patchno"}, "patch") .
4251                                       " | " .
4252                                       "</td>\n";
4253                         }
4254
4255                         my $has_history = 0;
4256                         my $not_deleted = 0;
4257                         for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
4258                                 my $hash_parent = $parents[$i];
4259                                 my $from_hash = $diff->{'from_id'}[$i];
4260                                 my $from_path = $diff->{'from_file'}[$i];
4261                                 my $status = $diff->{'status'}[$i];
4262
4263                                 $has_history ||= ($status ne 'A');
4264                                 $not_deleted ||= ($status ne 'D');
4265
4266                                 if ($status eq 'A') {
4267                                         print "<td  class=\"link\" align=\"right\"> | </td>\n";
4268                                 } elsif ($status eq 'D') {
4269                                         print "<td class=\"link\">" .
4270                                               $cgi->a({-href => href(action=>"blob",
4271                                                                      hash_base=>$hash,
4272                                                                      hash=>$from_hash,
4273                                                                      file_name=>$from_path)},
4274                                                       "blob" . ($i+1)) .
4275                                               " | </td>\n";
4276                                 } else {
4277                                         if ($diff->{'to_id'} eq $from_hash) {
4278                                                 print "<td class=\"link nochange\">";
4279                                         } else {
4280                                                 print "<td class=\"link\">";
4281                                         }
4282                                         print $cgi->a({-href => href(action=>"blobdiff",
4283                                                                      hash=>$diff->{'to_id'},
4284                                                                      hash_parent=>$from_hash,
4285                                                                      hash_base=>$hash,
4286                                                                      hash_parent_base=>$hash_parent,
4287                                                                      file_name=>$diff->{'to_file'},
4288                                                                      file_parent=>$from_path)},
4289                                                       "diff" . ($i+1)) .
4290                                               " | </td>\n";
4291                                 }
4292                         }
4293
4294                         print "<td class=\"link\">";
4295                         if ($not_deleted) {
4296                                 print $cgi->a({-href => href(action=>"blob",
4297                                                              hash=>$diff->{'to_id'},
4298                                                              file_name=>$diff->{'to_file'},
4299                                                              hash_base=>$hash)},
4300                                               "blob");
4301                                 print " | " if ($has_history);
4302                         }
4303                         if ($has_history) {
4304                                 print $cgi->a({-href => href(action=>"history",
4305                                                              file_name=>$diff->{'to_file'},
4306                                                              hash_base=>$hash)},
4307                                               "history");
4308                         }
4309                         print "</td>\n";
4310
4311                         print "</tr>\n";
4312                         next; # instead of 'else' clause, to avoid extra indent
4313                 }
4314                 # else ordinary diff
4315
4316                 my ($to_mode_oct, $to_mode_str, $to_file_type);
4317                 my ($from_mode_oct, $from_mode_str, $from_file_type);
4318                 if ($diff->{'to_mode'} ne ('0' x 6)) {
4319                         $to_mode_oct = oct $diff->{'to_mode'};
4320                         if (S_ISREG($to_mode_oct)) { # only for regular file
4321                                 $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
4322                         }
4323                         $to_file_type = file_type($diff->{'to_mode'});
4324                 }
4325                 if ($diff->{'from_mode'} ne ('0' x 6)) {
4326                         $from_mode_oct = oct $diff->{'from_mode'};
4327                         if (S_ISREG($to_mode_oct)) { # only for regular file
4328                                 $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
4329                         }
4330                         $from_file_type = file_type($diff->{'from_mode'});
4331                 }
4332
4333                 if ($diff->{'status'} eq "A") { # created
4334                         my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
4335                         $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
4336                         $mode_chng   .= "]</span>";
4337                         print "<td>";
4338                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4339                                                      hash_base=>$hash, file_name=>$diff->{'file'}),
4340                                       -class => "list"}, esc_path($diff->{'file'}));
4341                         print "</td>\n";
4342                         print "<td>$mode_chng</td>\n";
4343                         print "<td class=\"link\">";
4344                         if ($action eq 'commitdiff') {
4345                                 # link to patch
4346                                 $patchno++;
4347                                 print $cgi->a({-href => "#patch$patchno"}, "patch");
4348                                 print " | ";
4349                         }
4350                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4351                                                      hash_base=>$hash, file_name=>$diff->{'file'})},
4352                                       "blob");
4353                         print "</td>\n";
4354
4355                 } elsif ($diff->{'status'} eq "D") { # deleted
4356                         my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
4357                         print "<td>";
4358                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4359                                                      hash_base=>$parent, file_name=>$diff->{'file'}),
4360                                        -class => "list"}, esc_path($diff->{'file'}));
4361                         print "</td>\n";
4362                         print "<td>$mode_chng</td>\n";
4363                         print "<td class=\"link\">";
4364                         if ($action eq 'commitdiff') {
4365                                 # link to patch
4366                                 $patchno++;
4367                                 print $cgi->a({-href => "#patch$patchno"}, "patch");
4368                                 print " | ";
4369                         }
4370                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
4371                                                      hash_base=>$parent, file_name=>$diff->{'file'})},
4372                                       "blob") . " | ";
4373                         if ($have_blame) {
4374                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
4375                                                              file_name=>$diff->{'file'})},
4376                                               "blame") . " | ";
4377                         }
4378                         print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
4379                                                      file_name=>$diff->{'file'})},
4380                                       "history");
4381                         print "</td>\n";
4382
4383                 } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
4384                         my $mode_chnge = "";
4385                         if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4386                                 $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
4387                                 if ($from_file_type ne $to_file_type) {
4388                                         $mode_chnge .= " from $from_file_type to $to_file_type";
4389                                 }
4390                                 if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
4391                                         if ($from_mode_str && $to_mode_str) {
4392                                                 $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
4393                                         } elsif ($to_mode_str) {
4394                                                 $mode_chnge .= " mode: $to_mode_str";
4395                                         }
4396                                 }
4397                                 $mode_chnge .= "]</span>\n";
4398                         }
4399                         print "<td>";
4400                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4401                                                      hash_base=>$hash, file_name=>$diff->{'file'}),
4402                                       -class => "list"}, esc_path($diff->{'file'}));
4403                         print "</td>\n";
4404                         print "<td>$mode_chnge</td>\n";
4405                         print "<td class=\"link\">";
4406                         if ($action eq 'commitdiff') {
4407                                 # link to patch
4408                                 $patchno++;
4409                                 print $cgi->a({-href => "#patch$patchno"}, "patch") .
4410                                       " | ";
4411                         } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4412                                 # "commit" view and modified file (not only mode changed)
4413                                 print $cgi->a({-href => href(action=>"blobdiff",
4414                                                              hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4415                                                              hash_base=>$hash, hash_parent_base=>$parent,
4416                                                              file_name=>$diff->{'file'})},
4417                                               "diff") .
4418                                       " | ";
4419                         }
4420                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4421                                                      hash_base=>$hash, file_name=>$diff->{'file'})},
4422                                        "blob") . " | ";
4423                         if ($have_blame) {
4424                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4425                                                              file_name=>$diff->{'file'})},
4426                                               "blame") . " | ";
4427                         }
4428                         print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4429                                                      file_name=>$diff->{'file'})},
4430                                       "history");
4431                         print "</td>\n";
4432
4433                 } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
4434                         my %status_name = ('R' => 'moved', 'C' => 'copied');
4435                         my $nstatus = $status_name{$diff->{'status'}};
4436                         my $mode_chng = "";
4437                         if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
4438                                 # mode also for directories, so we cannot use $to_mode_str
4439                                 $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
4440                         }
4441                         print "<td>" .
4442                               $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
4443                                                      hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
4444                                       -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
4445                               "<td><span class=\"file_status $nstatus\">[$nstatus from " .
4446                               $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
4447                                                      hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
4448                                       -class => "list"}, esc_path($diff->{'from_file'})) .
4449                               " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
4450                               "<td class=\"link\">";
4451                         if ($action eq 'commitdiff') {
4452                                 # link to patch
4453                                 $patchno++;
4454                                 print $cgi->a({-href => "#patch$patchno"}, "patch") .
4455                                       " | ";
4456                         } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
4457                                 # "commit" view and modified file (not only pure rename or copy)
4458                                 print $cgi->a({-href => href(action=>"blobdiff",
4459                                                              hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
4460                                                              hash_base=>$hash, hash_parent_base=>$parent,
4461                                                              file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
4462                                               "diff") .
4463                                       " | ";
4464                         }
4465                         print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
4466                                                      hash_base=>$parent, file_name=>$diff->{'to_file'})},
4467                                       "blob") . " | ";
4468                         if ($have_blame) {
4469                                 print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
4470                                                              file_name=>$diff->{'to_file'})},
4471                                               "blame") . " | ";
4472                         }
4473                         print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
4474                                                     file_name=>$diff->{'to_file'})},
4475                                       "history");
4476                         print "</td>\n";
4477
4478                 } # we should not encounter Unmerged (U) or Unknown (X) status
4479                 print "</tr>\n";
4480         }
4481         print "</tbody>" if $has_header;
4482         print "</table>\n";
4483 }
4484
# Print the HTML "patchset" section: every patch read from $fd, wrapped in
# <div class="patch"> elements whose ids ("patch1", "patch2", ...) follow the
# 1-based position of the matching entry in @$difftree.
#
# Parameters:
#   $fd           - filehandle the patch text is read from, one line at a time
#   $difftree     - array reference of raw difftree entries; each entry is
#                   handed to parsed_difftree_line()
#   $hash         - accepted for interface compatibility, not read here
#   @hash_parents - parent hashes; more than one selects combined-diff handling
#
# When no patch was printed at all, a "No differences found" (or, with more
# than one parent, "Trivial merge") notice is printed instead.
sub git_patchset_body {
	my ($fd, $difftree, $hash, @hash_parents) = @_;

	my $is_combined = (@hash_parents > 1);
	my $patch_idx = 0;     # index into @$difftree of the current raw line
	my $patch_number = 0;  # number of patches printed so far
	my $patch_line;
	my $diffinfo;
	my $to_name;
	my (%from, %to);

	print "<div class=\"patchset\">\n";

	# skip to first patch
	while ($patch_line = <$fd>) {
		chomp $patch_line;

		last if ($patch_line =~ m/^diff /);
	}

 PATCH:
	while ($patch_line) {

		# parse "git diff" header line
		if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
			# $1 is from_name, which we do not use
			$to_name = unquote($2);
			$to_name =~ s!^b/!!;
		} elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
			# $1 is 'cc' or 'combined', which we do not use
			$to_name = unquote($2);
		} else {
			$to_name = undef;
		}

		# check if current patch belong to current raw line
		# and parse raw git-diff line if needed
		if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
			# this is continuation of a split patch
			print "<div class=\"patch cont\">\n";
		} else {
			# advance raw git-diff output if needed
			$patch_idx++ if defined $diffinfo;

			# read and prepare patch information
			$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

			# compact combined diff output can have some patches skipped
			# find which patch (using pathname of result) we are at now;
			if ($is_combined) {
				while ($to_name ne $diffinfo->{'to_file'}) {
					print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
					      format_diff_cc_simplified($diffinfo, @hash_parents) .
					      "</div>\n";  # class="patch"

					$patch_idx++;
					$patch_number++;

					last if $patch_idx > $#$difftree;
					$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
				}
			}

			# modifies %from, %to hashes
			parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

			# this is first patch for raw difftree line with $patch_idx index
			# we index @$difftree array from 0, but number patches from 1
			print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
		}

		# git diff header
		#assert($patch_line =~ m/^diff /) if DEBUG;
		#assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
		$patch_number++;
		# print "git diff" header
		print format_git_diff_header_line($patch_line, $diffinfo,
		                                  \%from, \%to);

		# print extended diff header
		print "<div class=\"diff extended_header\">\n";
	EXTENDED_HEADER:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

			print format_extended_diff_header_line($patch_line, $diffinfo,
			                                       \%from, \%to);
		}
		print "</div>\n"; # class="diff extended_header"

		# from-file/to-file diff header
		if (! $patch_line) {
			# input ended inside the extended header: close the patch here,
			# because 'last' does not run the 'continue' block below
			print "</div>\n"; # class="patch"
			last PATCH;
		}
		next PATCH if ($patch_line =~ m/^diff /);
		#assert($patch_line =~ m/^---/) if DEBUG;

		my $last_patch_line = $patch_line;
		$patch_line = <$fd>;
		# the input may end right after the "---" line (truncated diff),
		# in which case there is nothing to chomp
		chomp $patch_line if defined $patch_line;
		#assert($patch_line =~ m/^\+\+\+/) if DEBUG;

		print format_diff_from_to_header($last_patch_line, $patch_line,
		                                 $diffinfo, \%from, \%to,
		                                 @hash_parents);

		# the patch itself
	LINE:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			next PATCH if ($patch_line =~ m/^diff /);

			print format_diff_line($patch_line, \%from, \%to);
		}

	} continue {
		# runs on 'next PATCH' and when the loop body falls off its end
		print "</div>\n"; # class="patch"
	}

	# for compact combined (--cc) format, with chunk and patch simplification
	# the patchset might be empty, but there might be unprocessed raw lines
	for (++$patch_idx if $patch_number > 0;
	     $patch_idx < @$difftree;
	     ++$patch_idx) {
		# read and prepare patch information
		$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

		# generate anchor for "patch" links in difftree / whatchanged part
		print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
		      format_diff_cc_simplified($diffinfo, @hash_parents) .
		      "</div>\n";  # class="patch"

		$patch_number++;
	}

	if ($patch_number == 0) {
		if (@hash_parents > 1) {
			print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
		} else {
			print "<div class=\"diff nodifferences\">No differences found</div>\n";
		}
	}

	print "</div>\n"; # class="patchset"
}
4635
4636 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4637
# Collects per-project display data (age, description, owner, forks and,
# when the 'ctags' feature is enabled, ctags) for each entry of $projlist.
# Projects for which git_get_last_activity() returns nothing are left out
# of the returned list.
# NOTE: the project hashes are updated in place, but no entry is removed
# from $projlist itself
sub fill_project_list_info {
	my ($projlist, $check_forks) = @_;
	my @filled;

	my $show_ctags = gitweb_check_feature('ctags');
	foreach my $proj (@$projlist) {
		my @activity = git_get_last_activity($proj->{'path'});
		# no activity information: leave this project out
		next unless @activity;
		@{$proj}{'age', 'age_string'} = @activity;

		unless (defined $proj->{'descr'}) {
			my $long_descr =
				to_utf8(git_get_project_description($proj->{'path'}) || "");
			$proj->{'descr_long'} = $long_descr;
			$proj->{'descr'} =
				chop_str($long_descr, $projects_list_description_width, 5);
		}

		$proj->{'owner'} = git_get_project_owner("$proj->{'path'}") || ""
			unless defined $proj->{'owner'};

		if ($check_forks) {
			# forks are looked for in the directory named like the
			# project path with its ".git" suffix stripped
			my $fork_dir = $proj->{'path'};
			my $has_forks = $fork_dir =~ s/\.git$//
				&& $fork_dir !~ m{/$}
				&& -d "$projectroot/$fork_dir";
			$proj->{'forks'} = $has_forks ? "-d $projectroot/$fork_dir" : 0;
		}

		if ($show_ctags) {
			$proj->{'ctags'} = git_get_project_ctags($proj->{'path'});
		}
		push @filled, $proj;
	}

	return @filled;
}
4678
# Print the 'sort by' <th> element built by format_sort_th(); all
# arguments are passed on to it unchanged.
sub print_sort_th {
	my @th_args = @_;
	print format_sort_th(@th_args);
}
4684
# Return the HTML for one 'sort by' <th> element.
#   $name   - sort order this column stands for
#   $order  - sort order currently in effect
#   $header - column caption; defaults to ucfirst($name)
# The caption is a plain cell when $order equals $name, otherwise it is
# wrapped in a replay link that selects order $name.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header ||= ucfirst($name);

	# column already selected: nothing to link to
	return "<th>$header</th>\n" if $order eq $name;

	my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
	                         -class => "header"}, $header);
	return "<th>" . $sort_link . "</th>\n";
}
4701
# Print the projects table for the projects in $projlist, preceded by the
# tag cloud when the 'ctags' feature is enabled.
#
# Parameters:
#   $projlist  - array reference of project hashes; passed through
#                fill_project_list_info() first
#   $order     - sort column ('project', 'descr', 'owner' or 'age');
#                $default_projects_order is used when it is false
#   $from, $to - first and last index into the sorted list to print;
#                $from defaults to 0, $to is limited to the last index
#   $extra     - optional HTML printed in a closing table row
#   $no_header - when true, the header row with sort links is omitted
#
# Rows are filtered by the 'by_tag' CGI parameter and by $searchtext.
sub git_project_list_body {
	# actually uses global variable $project
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;

	my $check_forks = gitweb_check_feature('forks');
	my @projects = fill_project_list_info($projlist, $check_forks);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects unless (defined $to && $to <= $#projects);

	# which hash key each sort order compares, and how
	my %order_info = (
		project => { key => 'path', type => 'str' },
		descr => { key => 'descr_long', type => 'str' },
		owner => { key => 'owner', type => 'str' },
		age => { key => 'age', type => 'num' }
	);
	my $oi = $order_info{$order};
	@projects = ($oi->{'type'} eq 'str')
		? (sort { $a->{$oi->{'key'}} cmp $b->{$oi->{'key'}} } @projects)
		: (sort { $a->{$oi->{'key'}} <=> $b->{$oi->{'key'}} } @projects);

	my $show_ctags = gitweb_check_feature('ctags');
	if ($show_ctags) {
		# add up the per-project tag counts for the tag cloud
		my %tag_total;
		foreach my $proj (@projects) {
			$tag_total{$_} += $proj->{'ctags'}->{$_}
				for keys %{$proj->{'ctags'}};
		}
		my $cloud = git_populate_project_tagcloud(\%tag_total);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	if (!$no_header) {
		my @sort_columns = (
			[ 'project', 'Project' ],
			[ 'descr',   'Description' ],
			[ 'owner',   'Owner' ],
			[ 'age',     'Last Change' ],
		);
		print "<tr>\n";
		print "<th></th>\n" if $check_forks;
		foreach my $column (@sort_columns) {
			print_sort_th($column->[0], $order, $column->[1]);
		}
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}

	# prefix pattern used to weed out forks; it does not depend on the row
	my $forkbase = '';
	if ($check_forks) {
		$forkbase = $project || '';
		$forkbase =~ s#\.git$#/#;
		$forkbase = "^$forkbase" if $forkbase;
	}

	my $alternate = 1;
	my $tagfilter = $cgi->param('by_tag');
	foreach my $idx ($from .. $to) {
		my $pr = $projects[$idx];

		if ($tagfilter and $show_ctags) {
			next unless grep { lc $_ eq lc $tagfilter } keys %{$pr->{'ctags'}};
		}
		if ($searchtext) {
			next unless $pr->{'path'} =~ /$searchtext/
				or $pr->{'descr_long'} =~ /$searchtext/;
		}
		# Weed out forks or non-matching entries of search
		next if $check_forks
			and not $searchtext and not $tagfilter and $show_ctags
			and $pr->{'path'} =~ m#$forkbase.*/.*#; # regexp-safe

		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;
		if ($check_forks) {
			print "<td>";
			if ($pr->{'forks'}) {
				print "<!-- $pr->{'forks'} -->\n";
				print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "+");
			}
			print "</td>\n";
		}

		my $path_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		                         -class => "list"}, esc_html($pr->{'path'}));
		my $descr_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
		                          -class => "list", -title => $pr->{'descr_long'}},
		                         esc_html($pr->{'descr'}));
		my $owner_html = chop_and_escape_str($pr->{'owner'}, 15);
		print "<td>" . $path_link . "</td>\n" .
		      "<td>" . $descr_link . "</td>\n" .
		      "<td><i>" . $owner_html . "</i></td>\n";

		my $age_css = age_class($pr->{'age'});
		my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";

		# per-project navigation links, joined with " | "
		my @links;
		foreach my $view (qw(summary shortlog log tree)) {
			push @links,
				scalar($cgi->a({-href => href(project=>$pr->{'path'}, action=>$view)}, $view));
		}
		if ($pr->{'forks'}) {
			push @links,
				scalar($cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks"));
		}
		print "<td class=\"" . $age_css . "\">" . $age_text . "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n";
		print "<td></td>\n" if $check_forks;
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4808
# Print the body of the "log" view: for each selected commit a header,
# navigation links, authorship and the commit message.
#
# Parameters:
#   $commitlist - array reference of commit hashes (keys read here: 'id',
#                 'age_string', 'title', 'comment')
#   $from, $to  - first and last index into @$commitlist to print;
#                 $from defaults to 0, $to is limited to the last index
#   $refs       - passed to format_ref_marker() together with the commit id
#   $extra      - optional HTML printed in a trailing "page_nav" div
sub git_log_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# start at $from rather than 0, so that a caller-supplied offset is
	# honoured, as in the other *_body routines
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
4848
# Print the "shortlog" table: one row per selected commit with date,
# author, subject and navigation links.
#
# Parameters:
#   $commitlist - array reference of commit hashes
#   $from, $to  - first and last index into @$commitlist to print;
#                 $from defaults to 0, $to is limited to the last index
#   $refs       - passed to format_ref_marker() together with the commit id
#   $extra      - optional HTML printed in a closing table row
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	my $last_idx = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"shortlog\">\n";
	my $alternate = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		# rows alternate between the "dark" and "light" classes
		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		# git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
		my $author_cell = format_author_html('td', \%co, 10);
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $commit_link =
			$cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
		my $commitdiff_link =
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		my $tree_link =
			$cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      join(" | ", $commit_link, $commitdiff_link, $tree_link);

		my $snapshot_links = format_snapshot_links($commit);
		print " | " . $snapshot_links if defined $snapshot_links;

		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4892
# Print the "history" table for one path: one row per selected commit
# with date, author, subject and navigation links.
#
# Parameters:
#   $commitlist - array reference of commit hashes; empty hashes are skipped
#   $from, $to  - first and last index into @$commitlist to print;
#                 $from defaults to 0, $to is limited to the last index
#   $refs       - passed to format_ref_marker() together with the commit id
#   $extra      - optional HTML printed in a closing table row
#   $file_name  - path whose history is shown
#   $file_hash  - hash of the current version of the file; for blobs it is
#                 compared with the file's hash in each listed commit
#   $ftype      - used both as the action and as the text of the first link;
#                 'blob' additionally enables the "diff to current" link
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	my $last_idx = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"history\">\n";
	my $alternate = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		# rows alternate between the "dark" and "light" classes
		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		# shortlog:   format_author_html('td', \%co, 10)
		my $author_cell = format_author_html('td', \%co, 15, 3);
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      $author_cell . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $type_link =
			$cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
		my $commitdiff_link =
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $type_link . " | " . $commitdiff_link;

		if ($ftype eq 'blob') {
			# offer a diff against the current version only when the file
			# content in this commit differs from it
			my $blob_parent = git_get_hash_by_path($commit, $file_name);
			if (defined $file_hash && defined $blob_parent &&
			    $file_hash ne $blob_parent) {
				my $diff_link =
					$cgi->a({-href => href(action=>"blobdiff",
					                       hash=>$file_hash, hash_parent=>$blob_parent,
					                       hash_base=>$hash_base, hash_parent_base=>$commit,
					                       file_name=>$file_name)},
					        "diff to current");
				print " | " . $diff_link;
			}
		}
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
4952
# Print the "tags" table: one row per selected tag with age, name,
# subject, a link to the tag object itself and navigation links.
#
# Parameters:
#   $taglist   - array reference of tag hashes (keys read here: 'subject',
#                'age', 'reftype', 'refid', 'name', 'id', 'type', 'fullname')
#   $from, $to - first and last index into @$taglist to print;
#                $from defaults to 0, $to is limited to the last index
#   $extra     - optional HTML printed in a closing table row
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;
	my $last_idx = $#{$taglist};
	$from = 0 unless defined $from;
	$to = $last_idx unless (defined $to && $to <= $last_idx);

	print "<table class=\"tags\">\n";
	my $alternate = 1;
	foreach my $idx ($from .. $to) {
		my %tag = %{$taglist->[$idx]};
		my $comment = $tag{'subject'};
		my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

		# rows alternate between the "dark" and "light" classes
		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		my $age_cell = defined $tag{'age'}
			? "<td><i>$tag{'age'}</i></td>\n"
			: "<td></td>\n";
		print $age_cell;

		my $name_link =
			$cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
			         -class => "list name"}, esc_html($tag{'name'}));
		print "<td>" . $name_link . "</td>\n" .
		      "<td>";
		if (defined $comment) {
			print format_subject_html($comment, $comment_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}

		# entries of type "tag" get a link to the tag object itself
		print "</td>\n" .
		      "<td class=\"selflink\">";
		if ($tag{'type'} eq "tag") {
			print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
		} else {
			print "&nbsp;";
		}

		my $target_link =
			$cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
		print "</td>\n" .
		      "<td class=\"link\"> | " . $target_link;
		if ($tag{'reftype'} eq "commit") {
			my $shortlog_link =
				$cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
			my $log_link =
				$cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
			print " | " . $shortlog_link .
			      " | " . $log_link;
		} elsif ($tag{'reftype'} eq "blob") {
			print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		print "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5015
# Print the "heads" table: one row per branch in @$headlist[$from..$to].
#
# Parameters:
#   $headlist - reference to an array of hash references; the keys 'id',
#               'age', 'name' and 'fullname' of each entry are used
#   $head     - object id of the current head; a row whose 'id' equals it
#               gets the "current_head" CSS class.  May be undef, in which
#               case no row is marked
#   $from     - index of the first entry to show (defaults to 0)
#   $to       - index of the last entry to show (defaults to, and is clamped
#               to, the last index of @$headlist)
#   $extra    - optional HTML fragment printed in a final row spanning all
#               three columns
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

        print "<table class=\"heads\">\n";
        my $alternate = 1;
        for (my $i = $from; $i <= $to; $i++) {
                my $entry = $headlist->[$i];
                my %ref = %$entry;
                # $head is undef when the caller could not resolve HEAD;
                # guard the comparison so it does not warn and simply marks
                # no row as current
                my $curr = defined $head && $ref{'id'} eq $head;
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td><i>$ref{'age'}</i></td>\n" .
                      ($curr ? "<td class=\"current_head\">" : "<td>") .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                               -class => "list name"},esc_html($ref{'name'})) .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
                      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5053
# Print the "commit_search" table for the commits found by a search.
#
# For entries $from..$to of @$commitlist one row is printed holding the
# commit date, the author, the linked subject followed by every line of the
# commit message that matches the global $search_regexp (case-insensitively,
# with the match highlighted and its context shortened), and links to the
# commit, commitdiff and tree views.  Entries that are empty hashes are
# skipped.  $from defaults to 0; $to defaults to, and is clamped to, the last
# index of @$commitlist.  A defined $extra is printed as a final table row.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;
        $from = 0 unless defined $from;
        my $last_index = $#{$commitlist};
        $to = $last_index if (!defined $to || $last_index < $to);

        print "<table class=\"commit_search\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                # rows alternate between the two classes, starting with "dark"
                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = !$dark_row;
                print "<tr class=\"$row_class\">\n";

                my $age_cell =
                        "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n";
                my $author_cell = format_author_html('td', \%co, 15, 5);
                my $subject_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                 -class => "list subject"},
                                chop_and_escape_str($co{'title'}, 50) . "<br/>");
                print $age_cell . $author_cell . "<td>" . $subject_link;

                my $comment_lines = $co{'comment'};
                foreach my $line (@$comment_lines) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        $match = chop_str($match, 70, 5, 'center');
                        # whatever an 80 character budget leaves after the
                        # match is split evenly between leading and trailing
                        # context, capped at 30 characters per side
                        my $contextlen = int((80 - length($match))/2);
                        $contextlen = 30 if ($contextlen > 30);
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        print esc_html($lead) .
                              "<span class=\"match\">" . esc_html($match) . "</span>" .
                              esc_html($trail) . "<br />";
                }

                my $commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit");
                my $commitdiff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff");
                my $tree_link =
                        $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", $commit_link, $commitdiff_link, $tree_link);
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5113
5114 ## ======================================================================
5115 ## ======================================================================
5116 ## actions
5117
# Print the HTML page that lists all projects.
#
# The optional sort order is read from $input_params{'order'}; a value other
# than none, project, descr, owner or age is rejected with a 400 error.  A
# 404 error is reported when git_get_projects_list() returns nothing.  The
# page consists of the optional $home_text include, a project search form
# and the list printed by git_project_list_body().
sub git_project_list {
        my $order = $input_params{'order'};
        # The pattern is anchored so that only the listed keywords are
        # accepted; an unanchored match would also let through any value
        # that merely contains one of them.
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        # start_form() is the supported spelling and pairs with end_form()
        # below; the startform() alias is deprecated in CGI.pm
        print $cgi->start_form(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
5143
# Print the HTML page that lists the forks of the current project.
#
# The optional sort order is read from $input_params{'order'}; a value other
# than none, project, descr, owner or age is rejected with a 400 error.  A
# 404 error is reported when git_get_projects_list($project) returns
# nothing.
sub git_forks {
        my $order = $input_params{'order'};
        # The pattern is anchored so that only the listed keywords are
        # accepted; an unanchored match would also let through any value
        # that merely contains one of them.
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
5161
# Print a plain-text index of projects, one "<path> <owner>" line each.
#
# The list comes from git_get_projects_list($project); an entry without an
# 'owner' key has it filled in through git_get_project_owner().  Both fields
# are percent-encoded, except that '/' is kept and a space becomes '+'.
sub git_project_index {
        my @projects = git_get_projects_list($project);

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                # work on copies so the project entry itself stays unencoded
                my @fields = ($pr->{'path'}, $pr->{'owner'});
                foreach my $field (@fields) {
                        # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                        $field =~ s/ /\+/g;
                }

                print "$fields[0] $fields[1]\n";
        }
}
5185
# Print the summary page of the current project.
#
# The page shows a metadata table (description, owner, last change, clone
# URLs and, when the 'ctags' feature is on, the content tag cloud), the
# project's README.html unless $prevent_xss is set, and then shortened
# shortlog, tags, heads, remotes and forks sections.  Each section lists
# entries 0..15 and gets a "..." link to the full view when more exist.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # The get_*_list functions return one entry more than asked for,
        # which lets us tell whether there is more than what gets displayed.
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my @remotelist;
        @remotelist = git_get_heads_list(16, 'remotes') if $remote_heads;
        my @forklist;
        @forklist = git_get_projects_list($project)
                if gitweb_check_feature('forks');

        # Builds the "..." link to the full $target view, or yields undef
        # when a list whose last index is $last_index fits in 0..15.
        my $more_link = sub {
                my ($last_index, $target) = @_;
                return if $last_index <= 15;
                return $cgi->a({-href => href(action=>$target)}, "...");
        };

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n";
        print "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
        print "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        print "<tr id=\"metadata_lchange\"><td>last change</td><td>$cd{'rfc2822'}</td></tr>\n"
                if defined $cd{'rfc2822'};

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        if (!@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        # only the first URL printed carries the "URL" label
        my $url_tag = "URL";
        foreach my $git_url (grep { $_ } @url_list) {
                print format_repo_url($url_tag, $git_url);
                $url_tag = "";
        }

        # Tag cloud
        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my $ctags = git_get_project_ctags($project);
                my $cloud = git_populate_project_tagcloud($ctags);
                my $add_form = "<form action=\"$show_ctags\" method=\"post\"><input type=\"hidden\" name=\"p\" value=\"$project\" />Add: <input type=\"text\" name=\"t\" size=\"8\" /></form>";
                my $next_cell = "</td>\n<td>";

                print "<tr id=\"metadata_ctags\"><td>Content tags:<br />";
                # with existing tags the form stays in the label cell and the
                # cloud gets the second cell; without tags the form itself
                # goes into the second cell
                if (%$ctags) {
                        print $add_form . $next_cell;
                } else {
                        print $next_cell . $add_form;
                }
                print git_show_project_tagcloud($cloud, 48);
                print "</td></tr>";
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme) {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file($readme);
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                my $more = $more_link->($#commitlist, "shortlog");
                git_shortlog_body(\@commitlist, 0, 15, $refs, $more);
        }

        if (@taglist) {
                git_print_header_div('tags');
                my $more = $more_link->($#taglist, "tags");
                git_tags_body(\@taglist, 0, 15, $more);
        }

        if (@headlist) {
                git_print_header_div('heads');
                my $more = $more_link->($#headlist, "heads");
                git_heads_body(\@headlist, $head, 0, 15, $more);
        }

        if (@remotelist) {
                git_print_header_div('remotes');
                my $more = $more_link->($#remotelist, "remotes");
                git_heads_body(\@remotelist, $head, 0, 15, $more);
        }

        if (@forklist) {
                git_print_header_div('forks');
                my $more = $more_link->($#forklist, "forks");
                git_project_list_body(\@forklist, 'age', 0, 15, $more,
                                      'no_header');
        }

        git_footer_html();
}
5295
# Print the page for the tag object named by the global $hash.
#
# The tag is parsed with parse_tag(); a 404 error is reported when that
# yields nothing.  The page shows a header table with a link to the tagged
# object and, when an author is recorded, the authorship rows, followed by
# the tag message with one HTML line per message line.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # the tagged object is linked twice: once by its id, once by its type
        my ($obj_type, $obj_id) = @tag{'type', 'object'};
        my $id_link =
                $cgi->a({-class => "list", -href => href(action=>$obj_type, hash=>$obj_id)},
                        $obj_id);
        my $type_link =
                $cgi->a({-href => href(action=>$obj_type, hash=>$obj_id)},
                        $obj_type);

        print "<div class=\"title_text\">\n";
        print "<table class=\"object_header\">\n";
        print "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $id_link . "</td>\n" .
              "<td class=\"link\">" . $type_link . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n";

        print "<div class=\"page_body\">";
        foreach my $line (@{$tag{'comment'}}) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
5330
# Common implementation of the blame views.
#
# The single optional argument selects the output format:
#   'porcelain'   (default) ordinary blame page, built from the output of
#                 "git blame -p"
#   'incremental' page holding the plain file contents (read with
#                 "git cat-file blob") in the blame table with empty commit
#                 cells, plus progress elements and a <noscript> notice
#   'data'        text/plain stream of "git blame --incremental" output,
#                 terminated by an "END" line; the sub returns right after
# A 'porcelain' request with a true 'js' CGI parameter is handled as
# 'incremental'.
#
# Reads the globals $file_name and $project, and may set $action, $hash and
# $hash_base.  Problems are reported through die_error().
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $cgi->param('js')) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # compare for equality rather than pattern-matching the type
                # name, and treat a type that could not be determined as
                # "not a blob" without triggering an undef warning
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                print while <$fd>;
                close $fd
                        or print "ERROR $!\n";

                # the END marker optionally carries the elapsed time and the
                # number of git commands run
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              Time::HiRes::tv_interval($t0, [Time::HiRes::gettimeofday()]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        # offer a link to the other flavour of the blame view
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit cell and line-number link are left empty here
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        # read the "<key> <value>" lines that follow the header
                        # up to the TAB-prefixed line holding the file contents;
                        # the first value seen for a key of a commit is kept
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a header carrying a group size starts a new group of
                        # lines, so switch to the next row colour
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        # the commit cell is printed once per group and spans
                        # all of its rows
                        if ($group_size) {
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent
                        # commit when one is known, else of the commit itself
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
5560
# Blame view in the default format of git_blame_common().
sub git_blame {
        return git_blame_common();
}
5564
# Blame view in the 'incremental' format of git_blame_common().
sub git_blame_incremental {
        return git_blame_common('incremental');
}
5568
# Blame output in the 'data' format of git_blame_common().
sub git_blame_data {
        return git_blame_common('data');
}
5572
# Print the page listing all tags of the current project.  The tags table
# is left out when git_get_tags_list() returns nothing.
sub git_tags {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head_hash,undef,$head_hash,format_ref_views('tags'));
        git_print_header_div('summary', $project);

        my @all_tags = git_get_tags_list();
        git_tags_body(\@all_tags) if @all_tags;

        git_footer_html();
}
5585
# Print the page listing all heads of the current project.  The heads table
# is left out when git_get_heads_list() returns nothing.
sub git_heads {
        my $head_hash = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head_hash,undef,$head_hash,format_ref_views('heads'));
        git_print_header_div('summary', $project);

        my @all_heads = git_get_heads_list();
        git_heads_body(\@all_heads, $head_hash) if @all_heads;

        git_footer_html();
}
5598
# Print the page listing remote heads.
#
# Requires the 'remote_heads' feature, otherwise a 403 error is reported.
# When $input_params{'hash'} names a remote, only the heads below
# "remotes/<remote>" are listed and the "<remote>/" prefix is stripped from
# their names; otherwise all heads below "remotes" are listed.
sub git_remotes {
        gitweb_check_feature('remote_heads')
                or die_error(403, "Remote heads view is disabled");

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my @remotelist;

        if (defined $remote) {
                # only display the heads in a given remote, stripping the
                # remote name which is already visible elsewhere
                @remotelist = map {
                        my $ref = $_ ;
                        # \Q...\E: the remote name comes from the request and
                        # has to match literally; unquoted, a character such
                        # as '.' or '+' in it would be read as regex syntax
                        $ref->{'name'} =~ s!^\Q$remote\E/!!;
                        $ref
                } git_get_heads_list(undef, "remotes/$remote");
        } else {
                @remotelist = git_get_heads_list(undef, 'remotes');
        }

        git_header_html(undef, undef, -action_extra => $remote);
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($remote ? '' : 'remotes'));

        if (defined $remote) {
                git_print_header_div('remotes', "$remote remote for $project");
        } else {
                git_print_header_div('summary', "$project remotes");
        }

        if (@remotelist) {
                git_heads_body(\@remotelist, $head);
        }

        git_footer_html();
}
5636
# Send the raw contents of a blob to the client.
#
# The optional argument is a content type that is handed on to
# blob_contenttype().  The blob is named by the global $hash or, when that
# is undefined, looked up from $file_name in $hash_base (falling back to the
# project's head).  A 400 error is reported when neither is given, 404 when
# the file cannot be found and 500 when git-cat-file cannot be started.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name is sent as a quoted-string, in which a double quote or a
        # backslash has to be backslash-escaped; left as is, such a
        # character in the file name would end the value early.
        (my $quoted_name = $save_as) =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        #
        # $type can carry parameters (e.g. a charset) after the media type,
        # so the safe types are matched up to a ' ' or ';' separator or the
        # end of the string instead of against the whole value.
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $quoted_name . '"');
        # slurp the blob and pass it through unencoded
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
5689
# 'blob' view: show the contents of a single blob as an HTML page.
#
# Works on the request globals $hash, $hash_base, $file_name and $project.
# When $hash is missing it is looked up from $file_name in $hash_base (or in
# the project's HEAD).  Content that is neither text/* nor an inline image
# type, and that the -B test reports as binary, is delegated to
# git_blob_plain().  Images are rendered as an <img> element pointing at the
# 'blob_plain' view; everything else is printed line by line with numbered
# anchors, optionally after being piped through the highlighter.
sub git_blob {
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	my $have_blame = gitweb_check_feature('blame');
	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Couldn't cat $file_name, $hash");
	my $mimetype = blob_mimetype($fd, $file_name);
	# use 'blob_plain' (aka 'raw') view for files that cannot be displayed
	if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
		close $fd;
		return git_blob_plain($mimetype);
	}
	# we can have blame only for text/* mimetype
	$have_blame &&= ($mimetype =~ m!^text/!);

	my $highlight = gitweb_check_feature('highlight');
	my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
	$fd = run_highlighter($fd, $highlight, $syntax)
		if $syntax;

	git_header_html(undef, $expires);
	my $formats_nav = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		if (defined $file_name) {
			if ($have_blame) {
				$formats_nav .=
					$cgi->a({-href => href(action=>"blame", -replay=>1)},
					        "blame") .
					" | ";
			}
			$formats_nav .=
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history") .
				" | " .
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw") .
				" | " .
				$cgi->a({-href => href(action=>"blob",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		} else {
			$formats_nav .=
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw");
		}
		git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
		git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
	} else {
		# $hash comes from the request; escape it before echoing it back
		print "<div class=\"page_nav\">\n" .
		      "<br/><br/></div>\n" .
		      "<div class=\"title\">" . esc_html($hash) . "</div>\n";
	}
	git_print_page_path($file_name, "blob", $hash_base);
	print "<div class=\"page_body\">\n";
	if ($mimetype =~ m!^image/!) {
		print qq!<img type="$mimetype"!;
		if ($file_name) {
			# file names are arbitrary repository/request data: escape
			# them so quotes or markup cannot break out of the attribute
			my $name_attr = esc_html($file_name);
			print qq! alt="$name_attr" title="$name_attr"!;
		}
		print qq! src="! .
		      href(action=>"blob_plain", hash=>$hash,
		           hash_base=>$hash_base, file_name=>$file_name) .
		      qq!" />\n!;
	} else {
		my $nr = 0;
		while (my $line = <$fd>) {
			chomp $line;
			$nr++;
			$line = untabify($line);
			# highlighter output is already HTML, plain lines are escaped here
			printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
			       $nr, href(-replay => 1), $nr, $nr, $syntax ? $line : esc_html($line, -nbsp=>1);
		}
	}
	close $fd
		or print "Reading blob failed.\n";
	print "</div>";
	git_footer_html();
}
5781
# 'tree' view: list the entries of a tree object as an HTML table.
#
# Works on the request globals $hash, $hash_base and $file_name.  $hash_base
# defaults to "HEAD"; when $hash is missing it is resolved from $file_name
# inside $hash_base, or taken to be $hash_base itself.  A '..' row linking to
# the parent directory is added when a base commit and a path are known.
sub git_tree {
	if (!defined $hash_base) {
		$hash_base = "HEAD";
	}
	if (!defined $hash) {
		if (defined $file_name) {
			$hash = git_get_hash_by_path($hash_base, $file_name, "tree");
		} else {
			$hash = $hash_base;
		}
	}
	die_error(404, "No such tree") unless defined($hash);

	my $show_sizes = gitweb_check_feature('show-sizes');
	my $have_blame = gitweb_check_feature('blame');

	my @entries = ();
	{
		# 'ls-tree -z' separates records with NUL bytes
		local $/ = "\0";
		open my $fd, "-|", git_cmd(), "ls-tree", '-z',
			($show_sizes ? '-l' : ()), @extra_options, $hash
			or die_error(500, "Open git-ls-tree failed");
		@entries = map { chomp; $_ } <$fd>;
		close $fd
			or die_error(404, "Reading tree failed");
	}

	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $hash_base);
	git_header_html();
	my $basedir = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		my @views_nav = ();
		if (defined $file_name) {
			push @views_nav,
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history"),
				$cgi->a({-href => href(action=>"tree",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD"),
		}
		my $snapshot_links = format_snapshot_links($hash);
		if (defined $snapshot_links) {
			# FIXME: Should be available when we have no hash base as well.
			push @views_nav, $snapshot_links;
		}
		git_print_page_nav('tree','', $hash_base, undef, undef,
		                   join(' | ', @views_nav));
		git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
	} else {
		# no usable base commit: forget it so that no '..' row or
		# base-relative links are generated below
		undef $hash_base;
		print "<div class=\"page_nav\">\n";
		print "<br/><br/></div>\n";
		# $hash comes from the request; escape it before echoing it back
		print "<div class=\"title\">" . esc_html($hash) . "</div>\n";
	}
	if (defined $file_name) {
		$basedir = $file_name;
		if ($basedir ne '' && substr($basedir, -1) ne '/') {
			$basedir .= '/';
		}
		git_print_page_path($file_name, 'tree', $hash_base);
	}
	print "<div class=\"page_body\">\n";
	print "<table class=\"tree\">\n";
	# rows alternate between the "dark" and "light" classes, dark first
	my $alternate = 1;
	# '..' (top directory) link if possible
	if (defined $hash_base &&
	    defined $file_name && $file_name =~ m![^/]+$!) {
		print '<tr class="' . ($alternate ? 'dark' : 'light') . "\">\n";
		$alternate ^= 1;

		# strip the last path component; an empty result means the top tree
		my $up = $file_name;
		$up =~ s!/?[^/]+$!!;
		undef $up unless $up;
		# based on git_print_tree_entry
		print '<td class="mode">' . mode_str('040000') . "</td>\n";
		print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
		print '<td class="list">';
		print $cgi->a({-href => href(action=>"tree",
		                             hash_base=>$hash_base,
		                             file_name=>$up)},
		              "..");
		print "</td>\n";
		print "<td class=\"link\"></td>\n";

		print "</tr>\n";
	}
	foreach my $line (@entries) {
		my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

		print '<tr class="' . ($alternate ? 'dark' : 'light') . "\">\n";
		$alternate ^= 1;

		git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

		print "</tr>\n";
	}
	print "</table>\n" .
	      "</div>";
	git_footer_html();
}
5891
# Build the base name used for a snapshot of $hash in $project, in the form
# "<project>-<version>".
#
# Parameters: ($project, $hash)
# Returns: the name in scalar context; in list context the pair
#          ($name, $name), which git_snapshot() unpacks as name and prefix.
sub snapshot_name {
	my ($project, $hash) = @_;

	# path/to/project.git  -> project
	# path/to/project/.git -> project
	my $name = to_utf8($project);
	$name =~ s,([^/])/*\.git$,$1,;
	$name = basename($name);
	# sanitize name
	$name =~ s/[[:cntrl:]]/?/g;

	my $ver = $hash;
	if ($hash =~ /^[0-9a-fA-F]+$/) {
		# shorten SHA-1 hash
		my $full_hash = git_get_full_hash($project, $hash);
		# guard against an unresolved hash, and quote $hash so that it is
		# always matched literally
		if (defined $full_hash && length($hash) > 7 &&
		    $full_hash =~ /^\Q$hash\E/) {
			$ver = git_get_short_hash($project, $hash);
		}
	} elsif ($hash =~ m!^refs/tags/(.*)$!) {
		# tags don't need shortened SHA-1 hash
		$ver = $1;
	} else {
		# branches and other need shortened SHA-1 hash
		if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!) {
			$ver = $1;
		}
		$ver .= '-' . git_get_short_hash($project, $hash);
	}
	# in case of hierarchical branch names
	$ver =~ s!/!.!g;

	# name = project-version_string
	$name = "$name-$ver";

	return wantarray ? ($name, $name) : $name;
}
5928
# 'snapshot' action: send an archive of the tree-ish $hash to the client.
#
# The format comes from the 'snapshot_format' request parameter, defaulting
# to the first entry of @snapshot_fmts, and must be known, not disabled and
# listed in @snapshot_fmts.  The archive is produced by 'git archive',
# optionally piped through the format's compressor, and copied to STDOUT in
# raw mode.
sub git_snapshot {
	my $format = $input_params{'snapshot_format'};
	if (!@snapshot_fmts) {
		die_error(403, "Snapshots not allowed");
	}
	# default to first supported snapshot format
	$format ||= $snapshot_fmts[0];
	if ($format !~ m/^[a-z0-9]+$/) {
		die_error(400, "Invalid snapshot format parameter");
	} elsif (!exists($known_snapshot_formats{$format})) {
		die_error(400, "Unknown snapshot format");
	} elsif ($known_snapshot_formats{$format}{'disabled'}) {
		die_error(403, "Snapshot format not allowed");
	} elsif (!grep($_ eq $format, @snapshot_fmts)) {
		die_error(403, "Unsupported snapshot format");
	}

	# peel tags etc. so that the type of the underlying object is checked
	my $type = git_get_type("$hash^{}");
	if (!$type) {
		die_error(404, 'Object does not exist');
	}  elsif ($type eq 'blob') {
		die_error(400, 'Object is not a tree-ish');
	}

	my ($name, $prefix) = snapshot_name($project, $hash);
	my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
	my $cmd = quote_command(
		git_cmd(), 'archive',
		"--format=$known_snapshot_formats{$format}{'format'}",
		"--prefix=$prefix/", $hash);
	if (exists $known_snapshot_formats{$format}{'compressor'}) {
		$cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
	}

	# escape characters that are special inside a quoted header value
	$filename =~ s/(["\\])/\\$1/g;

	# Start the archiver before any header is sent, so that a failure to
	# launch it can still be reported with its own error status.
	open my $fd, "-|", $cmd
		or die_error(500, "Execute git-archive failed");

	print $cgi->header(
		-type => $known_snapshot_formats{$format}{'type'},
		-content_disposition => 'inline; filename="' . $filename . '"',
		-status => '200 OK');

	binmode STDOUT, ':raw';
	# copy in fixed-size chunks instead of reading the whole archive into
	# memory first
	my $chunk;
	while (read($fd, $chunk, 65536)) {
		print $chunk;
	}
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
5976
# Shared driver for log-like views.
#
# Parameters:
#   $fmt_name   - view name, passed to format_paging_nav / git_print_page_nav
#   $body_subr  - code reference that prints the body; it is called as
#                 $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                              $file_name, $file_hash, $ftype)
#   $base       - commit to start from (defaults to the project's HEAD)
#   $parent     - optional; when defined the range "$parent..$base" is listed
#   $file_name  - optional; limits the log to a path (with --full-history)
#   $file_hash  - optional; id of the object at $file_name
#
# Shows up to 100 commits per page (101 are requested to detect whether a
# next page exists); the global $page selects the page and defaults to 0.
sub git_log_generic {
	my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

	# resolve HEAD only when no base was given; the lookup runs git
	if (!defined $base) {
		$base = git_get_head_hash($project);
	}
	if (!defined $page) {
		$page = 0;
	}
	my $refs = git_get_references();

	my $commit_hash = $base;
	if (defined $parent) {
		$commit_hash = "$parent..$base";
	}
	my @commitlist =
		parse_commits($commit_hash, 101, (100 * $page),
		              defined $file_name ? ($file_name, "--full-history") : ());

	my $ftype;
	if (!defined $file_hash && defined $file_name) {
		# some commits could have deleted file in question,
		# and not have it in tree, but one of them has to have it
		foreach my $commit (@commitlist) {
			$file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
			last if defined $file_hash;
		}
	}
	if (defined $file_hash) {
		$ftype = git_get_type($file_hash);
	}
	if (defined $file_name && !defined $ftype) {
		die_error(500, "Unknown type of object");
	}
	my %co;
	if (defined $file_name) {
		%co = parse_commit($base)
			or die_error(404, "Unknown commit object");
	}


	# a 101st commit means that there is at least one more page
	my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
	my $next_link = '';
	if ($#commitlist >= 100) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
	}
	my $patch_max = gitweb_get_feature('patches');
	if ($patch_max && !defined $file_name) {
		# negative limit: the link is always shown
		if ($patch_max < 0 || @commitlist <= $patch_max) {
			$paging_nav .= " &sdot; " .
				$cgi->a({-href => href(action=>"patches", -replay=>1)},
				        "patches");
		}
	}

	git_header_html();
	git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
	if (defined $file_name) {
		git_print_header_div('commit', esc_html($co{'title'}), $base);
	} else {
		git_print_header_div('summary', $project);
	}
	git_print_page_path($file_name, $ftype, $hash_base)
		if (defined $file_name);

	$body_subr->(\@commitlist, 0, 99, $refs, $next_link,
	             $file_name, $file_hash, $ftype);

	git_footer_html();
}
6050
# 'log' view: git_log_generic() with the git_log_body renderer, listing
# commits from $hash (optionally limited to the range $hash_parent..$hash).
sub git_log {
	my @log_args = ('log', \&git_log_body, $hash, $hash_parent);
	return git_log_generic(@log_args);
}
6055
# 'commit' view: commit header (authorship rows, commit id, tree and parent
# links), the commit message, and the list of changes from git-diff-tree.
# Works on the global $hash, which defaults to $hash_base and then "HEAD".
sub git_commit {
	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
		or die_error(404, "Unknown commit object");

	my $parent  = $co{'parent'};
	my $parents = $co{'parents'}; # listref

	# link to the 'commit' view of a commit, labelled with its 7-char id
	my $short_commit_link = sub {
		my ($id) = @_;
		return $cgi->a({-href => href(action=>"commit",
		                              hash=>$id)},
		               esc_html(substr($id, 0, 7)));
	};

	# we need to prepare $formats_nav before any parameter munging
	my $formats_nav;
	if (!defined $parent) {
		# --root commitdiff
		$formats_nav = '(initial)';
	} elsif (@$parents == 1) {
		# single parent commit
		$formats_nav = '(parent: ' . $short_commit_link->($parent) . ')';
	} else {
		# merge commit
		$formats_nav = '(merge: ' .
			join(' ', map { $short_commit_link->($_) } @$parents) .
			')';
	}
	if (gitweb_check_feature('patches') && @$parents <= 1) {
		my $patch_link =
			$cgi->a({-href => href(action=>"patch", -replay=>1)},
			        "patch");
		$formats_nav .= " | " . $patch_link;
	}

	# what to diff against: the only parent, the empty tree for a root
	# commit, or a combined diff for merges
	my $diff_base = (@$parents <= 1)
		? (defined $parent ? $parent : "--root")
		: '-c';
	open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
		@diff_opts,
		$diff_base,
		$hash, "--"
		or die_error(500, "Open git-diff-tree failed");
	chomp(my @difftree = <$fd>);
	close $fd or die_error(404, "Reading git-diff-tree failed");

	# non-textual hash id's can be cached
	my $expires;
	$expires = "+1d" if $hash =~ m/^[0-9a-fA-F]{40}$/;

	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $co{'id'});

	git_header_html(undef, $expires);
	git_print_page_nav('commit', '',
	                   $hash, $co{'tree'}, $hash,
	                   $formats_nav);

	if (defined $co{'parent'}) {
		git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
	} else {
		git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
	}

	# object header table
	print "<div class=\"title_text\">\n" .
	      "<table class=\"object_header\">\n";
	git_print_authorship_rows(\%co);
	print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

	# tree row; the closing cells follow the optional snapshot links
	my $tree_href = href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
	my $tree_id_link = $cgi->a({-href => $tree_href, class => "list"}, $co{'tree'});
	my $tree_link    = $cgi->a({-href => $tree_href}, "tree");
	print "<tr>" .
	      "<td>tree</td>" .
	      "<td class=\"sha1\">" . $tree_id_link . "</td>" .
	      "<td class=\"link\">" . $tree_link;
	my $snapshot_links = format_snapshot_links($hash);
	print " | " . $snapshot_links
		if defined $snapshot_links;
	print "</td>" .
	      "</tr>\n";

	# one row per parent commit
	foreach my $par (@$parents) {
		my $par_href    = href(action=>"commit", hash=>$par);
		my $par_id_link = $cgi->a({-href => $par_href, class => "list"}, $par);
		my $par_link    = $cgi->a({-href => $par_href}, "commit");
		my $diff_link   =
			$cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
		print "<tr>" .
		      "<td>parent</td>" .
		      "<td class=\"sha1\">" . $par_id_link . "</td>" .
		      "<td class=\"link\">" . $par_link . " | " . $diff_link . "</td>" .
		      "</tr>\n";
	}
	print "</table>".
	      "</div>\n";

	print "<div class=\"page_body\">\n";
	git_print_log($co{'comment'});
	print "</div>\n";

	git_difftree_body(\@difftree, $hash, @$parents);

	git_footer_html();
}
6169
# 'object' action: find out the type of the requested object and redirect
# (302) to the view named after that type.
#
# The object is defined by:
# - hash or hash_base alone
# - hash_base and file_name
sub git_object {
	my $type;

	# - hash or hash_base alone
	if ($hash || ($hash_base && !defined $file_name)) {
		my $object_id = $hash || $hash_base;

		open my $fd, "-|", quote_command(
			git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
			or die_error(404, "Object does not exist");
		$type = <$fd>;
		# nothing is read when the object does not exist; the failure
		# itself is reported by the close() check below
		chomp $type if defined $type;
		close $fd
			or die_error(404, "Object does not exist");

	# - hash_base and file_name
	} elsif ($hash_base && defined $file_name) {
		$file_name =~ s,/+$,,;

		system(git_cmd(), "cat-file", '-e', $hash_base) == 0
			or die_error(404, "Base object does not exist");

		# here errors should not happen
		open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
			or die_error(500, "Open git-ls-tree failed");
		my $line = <$fd>;
		close $fd;

		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
		unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
			die_error(404, "File or directory for given base does not exist");
		}
		$type = $2;
		$hash = $3;
	} else {
		die_error(400, "Not enough information to find object");
	}

	# the object type doubles as the name of the action to redirect to
	print $cgi->redirect(-uri => href(action=>$type, -full=>1,
	                                  hash=>$hash, hash_base=>$hash_base,
	                                  file_name=>$file_name),
	                     -status => '302 Found');
}
6216
# 'blobdiff' view: show the difference between two versions of one file.
#
# Parameter: $format - 'html' (default) or 'plain'.
#
# Works on the request globals $hash_base/$hash_parent_base (the two commits)
# plus either $file_name (and optionally $file_parent) or a 40-hex blob $hash
# from which the file name is recovered.  The matching raw diff-tree line is
# parsed into %diffinfo, then the patch is either rendered as HTML or sent as
# text/plain with an "X-Git-Url" line in front.
sub git_blobdiff {
	my $format = shift || 'html';

	my $fd;
	my @difftree;
	my %diffinfo;
	my $expires;

	# preparing $fd and %diffinfo for git_patchset_body
	# new style URI
	if (defined $hash_base && defined $hash_parent_base) {
		if (defined $file_name) {
			# read raw output
			open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
				$hash_parent_base, $hash_base,
				"--", (defined $file_parent ? $file_parent : ()), $file_name
				or die_error(500, "Open git-diff-tree failed");
			@difftree = map { chomp; $_ } <$fd>;
			close $fd
				or die_error(404, "Reading git-diff-tree failed");
			@difftree
				or die_error(404, "Blob diff not found");

		} elsif (defined $hash &&
		         $hash =~ /[0-9a-fA-F]{40}/) {
			# try to find filename from $hash

			# read filtered raw output
			open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
				$hash_parent_base, $hash_base, "--"
				or die_error(500, "Open git-diff-tree failed");
			@difftree =
				# ':100644 100644 03b21826... 3b93d5e7... M	ls-files.c'
				# $hash == to_id
				# (\Q..\E: $hash is request data and must match literally)
				grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
				map { chomp; $_ } <$fd>;
			close $fd
				or die_error(404, "Reading git-diff-tree failed");
			@difftree
				or die_error(404, "Blob diff not found");

		} else {
			die_error(400, "Missing one of the blob diff parameters");
		}

		if (@difftree > 1) {
			die_error(400, "Ambiguous blob diff specification");
		}

		# fill in whatever the request left out from the raw diff line
		%diffinfo = parse_difftree_raw_line($difftree[0]);
		$file_parent ||= $diffinfo{'from_file'} || $file_name;
		$file_name   ||= $diffinfo{'to_file'};

		$hash_parent ||= $diffinfo{'from_id'};
		$hash        ||= $diffinfo{'to_id'};

		# non-textual hash id's can be cached
		if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
		    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
			$expires = '+1d';
		}

		# open patch output
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			'-p', ($format eq 'html' ? "--full-index" : ()),
			$hash_parent_base, $hash_base,
			"--", (defined $file_parent ? $file_parent : ()), $file_name
			or die_error(500, "Open git-diff-tree failed");
	}

	# old/legacy style URI -- not generated anymore since 1.4.3.
	if (!%diffinfo) {
		# NOTE(review): every other die_error() call in this part of the
		# file passes a bare numeric status, so the former string
		# '404 Not Found' is passed as 404 here -- confirm against die_error.
		die_error(404, "Missing one of the blob diff parameters");
	}

	# header
	if ($format eq 'html') {
		my $formats_nav =
			$cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
			        "raw");
		git_header_html(undef, $expires);
		if (defined $hash_base && (my %co = parse_commit($hash_base))) {
			git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
			git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
		} else {
			print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
			# the ids may come straight from the request: escape them
			print "<div class=\"title\">" . esc_html($hash) . " vs " .
			      esc_html($hash_parent) . "</div>\n";
		}
		if (defined $file_name) {
			git_print_page_path($file_name, "blob", $hash_base);
		} else {
			print "<div class=\"page_path\"></div>\n";
		}

	} elsif ($format eq 'plain') {
		# escape characters that are special inside a quoted header
		# value, as git_snapshot() does for its file name
		my $save_as = "$file_name.patch";
		$save_as =~ s/(["\\])/\\$1/g;
		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => 'inline; filename="' . $save_as . '"');

		print "X-Git-Url: " . $cgi->self_url() . "\n\n";

	} else {
		die_error(400, "Unknown blobdiff format");
	}

	# patch
	if ($format eq 'html') {
		print "<div class=\"page_body\">\n";

		git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
		close $fd;

		print "</div>\n"; # class="page_body"
		git_footer_html();

	} else {
		# rewrite object ids in the patch header lines (up to and
		# including the '+++' line) into file names, then copy the rest
		while (my $line = <$fd>) {
			$line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
			$line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

			print $line;

			last if $line =~ m!^\+\+\+!;
		}
		local $/ = undef;
		print <$fd>;
		close $fd;
	}
}
6348
# 'blobdiff_plain' action: the blob diff in its 'plain' output format.
sub git_blobdiff_plain {
	my $output_format = 'plain';
	return git_blobdiff($output_format);
}
6352
6353 sub git_commitdiff {
6354         my %params = @_;
6355         my $format = $params{-format} || 'html';
6356
6357         my ($patch_max) = gitweb_get_feature('patches');
6358         if ($format eq 'patch') {
6359                 die_error(403, "Patch view not allowed") unless $patch_max;
6360         }
6361
6362         $hash ||= $hash_base || "HEAD";
6363         my %co = parse_commit($hash)
6364             or die_error(404, "Unknown commit object");
6365
6366         # choose format for commitdiff for merge
6367         if (! defined $hash_parent && @{$co{'parents'}} > 1) {
6368                 $hash_parent = '--cc';
6369         }
6370         # we need to prepare $formats_nav before almost any parameter munging
6371         my $formats_nav;
6372         if ($format eq 'html') {
6373                 $formats_nav =
6374                         $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
6375                                 "raw");
6376                 if ($patch_max && @{$co{'parents'}} <= 1) {
6377                         $formats_nav .= " | " .
6378                                 $cgi->a({-href => href(action=>"patch", -replay=>1)},
6379                                         "patch");
6380                 }
6381
6382                 if (defined $hash_parent &&
6383                     $hash_parent ne '-c' && $hash_parent ne '--cc') {
6384                         # commitdiff with two commits given
6385                         my $hash_parent_short = $hash_parent;
6386                         if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
6387                                 $hash_parent_short = substr($hash_parent, 0, 7);
6388                         }
6389                         $formats_nav .=
6390                                 ' (from';
6391                         for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
6392                                 if ($co{'parents'}[$i] eq $hash_parent) {
6393                                         $formats_nav .= ' parent ' . ($i+1);
6394                                         last;
6395                                 }
6396                         }
6397                         $formats_nav .= ': ' .
6398                                 $cgi->a({-href => href(action=>"commitdiff",
6399                                                        hash=>$hash_parent)},
6400                                         esc_html($hash_parent_short)) .
6401                                 ')';
6402                 } elsif (!$co{'parent'}) {
6403                         # --root commitdiff
6404                         $formats_nav .= ' (initial)';
6405                 } elsif (scalar @{$co{'parents'}} == 1) {
6406                         # single parent commit
6407                         $formats_nav .=
6408                                 ' (parent: ' .
6409                                 $cgi->a({-href => href(action=>"commitdiff",
6410                                                        hash=>$co{'parent'})},
6411                                         esc_html(substr($co{'parent'}, 0, 7))) .
6412                                 ')';
6413                 } else {
6414                         # merge commit
6415                         if ($hash_parent eq '--cc') {
6416                                 $formats_nav .= ' | ' .
6417                                         $cgi->a({-href => href(action=>"commitdiff",
6418                                                                hash=>$hash, hash_parent=>'-c')},
6419                                                 'combined');
6420                         } else { # $hash_parent eq '-c'
6421                                 $formats_nav .= ' | ' .
6422                                         $cgi->a({-href => href(action=>"commitdiff",
6423                                                                hash=>$hash, hash_parent=>'--cc')},
6424                                                 'compact');
6425                         }
6426                         $formats_nav .=
6427                                 ' (merge: ' .
6428                                 join(' ', map {
6429                                         $cgi->a({-href => href(action=>"commitdiff",
6430                                                                hash=>$_)},
6431                                                 esc_html(substr($_, 0, 7)));
6432                                 } @{$co{'parents'}} ) .
6433                                 ')';
6434                 }
6435         }
6436
6437         my $hash_parent_param = $hash_parent;
6438         if (!defined $hash_parent_param) {
6439                 # --cc for multiple parents, --root for parentless
6440                 $hash_parent_param =
6441                         @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
6442         }
6443
6444         # read commitdiff
6445         my $fd;
6446         my @difftree;
6447         if ($format eq 'html') {
6448                 open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
6449                         "--no-commit-id", "--patch-with-raw", "--full-index",
6450                         $hash_parent_param, $hash, "--"
6451                         or die_error(500, "Open git-diff-tree failed");
6452
6453                 while (my $line = <$fd>) {
6454                         chomp $line;
6455                         # empty line ends raw part of diff-tree output
6456                         last unless $line;
6457                         push @difftree, scalar parse_difftree_raw_line($line);
6458                 }
6459
6460         } elsif ($format eq 'plain') {
6461                 open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
6462                         '-p', $hash_parent_param, $hash, "--"
6463                         or die_error(500, "Open git-diff-tree failed");
6464         } elsif ($format eq 'patch') {
6465                 # For commit ranges, we limit the output to the number of
6466                 # patches specified in the 'patches' feature.
6467                 # For single commits, we limit the output to a single patch,
6468                 # diverging from the git-format-patch default.
6469                 my @commit_spec = ();
6470                 if ($hash_parent) {
6471                         if ($patch_max > 0) {
6472                                 push @commit_spec, "-$patch_max";
6473                         }
6474                         push @commit_spec, '-n', "$hash_parent..$hash";
6475                 } else {
6476                         if ($params{-single}) {
6477                                 push @commit_spec, '-1';
6478                         } else {
6479                                 if ($patch_max > 0) {
6480                                         push @commit_spec, "-$patch_max";
6481                                 }
6482                                 push @commit_spec, "-n";
6483                         }
6484                         push @commit_spec, '--root', $hash;
6485                 }
6486                 open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
6487                         '--encoding=utf8', '--stdout', @commit_spec
6488                         or die_error(500, "Open git-format-patch failed");
6489         } else {
6490                 die_error(400, "Unknown commitdiff format");
6491         }
6492
6493         # non-textual hash id's can be cached
6494         my $expires;
6495         if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
6496                 $expires = "+1d";
6497         }
6498
6499         # write commit message
6500         if ($format eq 'html') {
6501                 my $refs = git_get_references();
6502                 my $ref = format_ref_marker($refs, $co{'id'});
6503
6504                 git_header_html(undef, $expires);
6505                 git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
6506                 git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
6507                 print "<div class=\"title_text\">\n" .
6508                       "<table class=\"object_header\">\n";
6509                 git_print_authorship_rows(\%co);
6510                 print "</table>".
6511                       "</div>\n";
6512                 print "<div class=\"page_body\">\n";
6513                 if (@{$co{'comment'}} > 1) {
6514                         print "<div class=\"log\">\n";
6515                         git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
6516                         print "</div>\n"; # class="log"
6517                 }
6518
6519         } elsif ($format eq 'plain') {
6520                 my $refs = git_get_references("tags");
6521                 my $tagname = git_get_rev_name_tags($hash);
6522                 my $filename = basename($project) . "-$hash.patch";
6523
6524                 print $cgi->header(
6525                         -type => 'text/plain',
6526                         -charset => 'utf-8',
6527                         -expires => $expires,
6528                         -content_disposition => 'inline; filename="' . "$filename" . '"');
6529                 my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
6530                 print "From: " . to_utf8($co{'author'}) . "\n";
6531                 print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
6532                 print "Subject: " . to_utf8($co{'title'}) . "\n";
6533
6534                 print "X-Git-Tag: $tagname\n" if $tagname;
6535                 print "X-Git-Url: " . $cgi->self_url() . "\n\n";
6536
6537                 foreach my $line (@{$co{'comment'}}) {
6538                         print to_utf8($line) . "\n";
6539                 }
6540                 print "---\n\n";
6541         } elsif ($format eq 'patch') {
6542                 my $filename = basename($project) . "-$hash.patch";
6543
6544                 print $cgi->header(
6545                         -type => 'text/plain',
6546                         -charset => 'utf-8',
6547                         -expires => $expires,
6548                         -content_disposition => 'inline; filename="' . "$filename" . '"');
6549         }
6550
6551         # write patch
6552         if ($format eq 'html') {
6553                 my $use_parents = !defined $hash_parent ||
6554                         $hash_parent eq '-c' || $hash_parent eq '--cc';
6555                 git_difftree_body(\@difftree, $hash,
6556                                   $use_parents ? @{$co{'parents'}} : $hash_parent);
6557                 print "<br/>\n";
6558
6559                 git_patchset_body($fd, \@difftree, $hash,
6560                                   $use_parents ? @{$co{'parents'}} : $hash_parent);
6561                 close $fd;
6562                 print "</div>\n"; # class="page_body"
6563                 git_footer_html();
6564
6565         } elsif ($format eq 'plain') {
6566                 local $/ = undef;
6567                 print <$fd>;
6568                 close $fd
6569                         or print "Reading git-diff-tree failed\n";
6570         } elsif ($format eq 'patch') {
6571                 local $/ = undef;
6572                 print <$fd>;
6573                 close $fd
6574                         or print "Reading git-format-patch failed\n";
6575         }
6576 }
6577
# Action handler for 'commitdiff_plain': delegates to git_commitdiff(),
# requesting the 'plain' output format.
sub git_commitdiff_plain {
        return git_commitdiff(
                -format => 'plain',
        );
}
6581
6582 # format-patch-style patches
# Action handler for 'patch': delegates to git_commitdiff() with the
# 'patch' format and the -single flag set.
sub git_patch {
        return git_commitdiff(
                -format => 'patch',
                -single => 1,
        );
}
6586
# Action handler for 'patches': delegates to git_commitdiff() with the
# 'patch' format and without the -single flag.
sub git_patches {
        return git_commitdiff(
                -format => 'patch',
        );
}
6590
# Action handler for 'history': hands the request over to git_log_generic(),
# using git_history_body() as the body renderer and passing the request
# globals $hash_base, $hash_parent_base, $file_name and $hash.
sub git_history {
        return git_log_generic(
                'history',
                \&git_history_body,
                $hash_base,
                $hash_parent_base,
                $file_name,
                $hash,
        );
}
6596
# Action handler for 'search': look for $searchtext starting from commit
# $hash (the project's head when $hash is not given) and print the result
# as an HTML page.
#
# Uses the request globals $searchtext, $searchtype, $search_use_regexp,
# $search_regexp, $hash, $page and $project.  $searchtype (default
# 'commit') selects what is searched:
#
#   commit, author, committer
#           commits selected through parse_commits() with --grep=,
#           --author= or --committer=; shown 100 per page with
#           first/prev/next navigation
#   pickaxe commits reported by "git log -S<text>" together with the
#           files they touched (requires the 'pickaxe' feature)
#   grep    lines reported by "git grep" in the tree of the commit,
#           trimmed after about 1000 matches (requires the 'grep' feature)
#
# Any other $searchtype produces a page with header and footer only.
#
# Errors are reported through die_error(): 403 when the required feature
# is disabled, 400 when no search text was given, 404 when $hash does not
# name a commit, 500 when the git command cannot be started.
sub git_search {
        gitweb_check_feature('search') or die_error(403, "Search is disabled");
        if (!defined $searchtext) {
                die_error(400, "Text field is empty");
        }
        if (!defined $hash) {
                $hash = git_get_head_hash($project);
        }
        my %co = parse_commit($hash);
        if (!%co) {
                die_error(404, "Unknown commit object");
        }
        if (!defined $page) {
                $page = 0;
        }

        $searchtype ||= 'commit';
        if ($searchtype eq 'pickaxe') {
                # pickaxe may take all resources of your box and run for several minutes
                # with every query - so decide by yourself how public you make this feature
                gitweb_check_feature('pickaxe')
                    or die_error(403, "Pickaxe is disabled");
        }
        if ($searchtype eq 'grep') {
                gitweb_check_feature('grep')
                    or die_error(403, "Grep is disabled");
        }

        # $searchtype is not modified below, so exactly one branch runs.
        if ($searchtype eq 'commit' or $searchtype eq 'author' or $searchtype eq 'committer') {
                git_header_html();

                my %greptype_for = (
                        'commit'    => "--grep=",
                        'author'    => "--author=",
                        'committer' => "--committer=",
                );
                my $greptype = $greptype_for{$searchtype} . $searchtext;

                # ask for 101 commits: the extra one only tells us
                # whether there is a next page
                my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                               $greptype, '--regexp-ignore-case',
                                               $search_use_regexp ? '--extended-regexp' : '--fixed-strings');

                my $paging_nav = '';
                if ($page > 0) {
                        $paging_nav .=
                                $cgi->a({-href => href(action=>"search", hash=>$hash,
                                                       searchtext=>$searchtext,
                                                       searchtype=>$searchtype)},
                                        "first");
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                         -accesskey => "p", -title => "Alt-p"}, "prev");
                } else {
                        $paging_nav .= "first";
                        $paging_nav .= " &sdot; prev";
                }
                my $next_link = '';
                if ($#commitlist >= 100) {
                        $next_link =
                                $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                         -accesskey => "n", -title => "Alt-n"}, "next");
                        $paging_nav .= " &sdot; $next_link";
                } else {
                        $paging_nav .= " &sdot; next";
                }

                git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);
                if ($page == 0 && !@commitlist) {
                        print "<p>No match.</p>\n";
                } else {
                        git_search_grep_body(\@commitlist, 0, 99, $next_link);
                }

        } elsif ($searchtype eq 'pickaxe') {
                # start git before any output is produced, so that a failure
                # can still be reported as a regular error page
                open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                        '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                        ($search_use_regexp ? '--pickaxe-regex' : ())
                        or die_error(500, "Open git-log failed");

                git_header_html();
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"pickaxe search\">\n";
                my $alternate = 1;
                local $/ = "\n";

                # from here on %co holds the commit whose table row is
                # currently open (empty until the first commit is seen)
                undef %co;

                # close the file list cell of the open row, add its links cell
                my $finish_commit_row = sub {
                        return unless %co;
                        print "</td>\n" .
                              "<td class=\"link\">" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
                              " | " .
                              $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                        print "</td>\n" .
                              "</tr>\n";
                };

                while (my $line = <$fd>) {
                        chomp $line;
                        next unless $line;

                        my %set = parse_difftree_raw_line($line);
                        if (defined $set{'commit'}) {
                                # a commit id line: finish previous commit, start a new row
                                $finish_commit_row->();

                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                $alternate ^= 1;
                                %co = parse_commit($set{'commit'});
                                my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                                      "<td><i>$author</i></td>\n" .
                                      "<td>" .
                                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                              -class => "list subject"},
                                              chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        } elsif (defined $set{'to_id'}) {
                                # a raw diff line: list the file, unless it was deleted
                                next if ($set{'to_id'} =~ m/^0{40}$/);

                                print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                              -class => "list"},
                                              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                                      "<br/>\n";
                        }
                }
                close $fd;

                # finish last commit
                $finish_commit_row->();

                print "</table>\n";

        } elsif ($searchtype eq 'grep') {
                # The pattern is passed with -e, so that search text starting
                # with '-' cannot be taken for a git-grep option.  As above,
                # git is started before any output is produced.
                open my $fd, "-|", git_cmd(), 'grep', '-n',
                        $search_use_regexp ? ('-E', '-i') : '-F',
                        '-e', $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

                git_header_html();
                git_print_page_nav('','', $hash,$co{'tree'},$hash);
                git_print_header_div('commit', esc_html($co{'title'}), $hash);

                print "<table class=\"grep_search\">\n";
                my $alternate = 1;
                my $matches = 0;
                local $/ = "\n";
                my $lastfile = '';
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($file, $lno, $ltext, $binary);
                        last if ($matches++ > 1000);
                        if ($line =~ /^Binary file (.+) matches$/) {
                                $file = $1;
                                $binary = 1;
                        } else {
                                # the first field (before the file name) is discarded
                                (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
                        }
                        if ($file ne $lastfile) {
                                # matches in a new file: close previous row, open next one
                                $lastfile and print "</td></tr>\n";
                                if ($alternate) {
                                        print "<tr class=\"dark\">\n";
                                } else {
                                        print "<tr class=\"light\">\n";
                                }
                                # toggle (not increment), so that rows really alternate
                                $alternate ^= 1;
                                # link to the file as of the searched commit
                                print "<td class=\"list\">".
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file"),
                                                -class => "list"}, esc_path($file));
                                print "</td><td>\n";
                                $lastfile = $file;
                        }
                        if ($binary) {
                                print "<div class=\"binary\">Binary file</div>\n";
                        } else {
                                $ltext = untabify($ltext);
                                if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                        # highlight the matching part of the line
                                        $ltext = esc_html($1, -nbsp=>1);
                                        $ltext .= '<span class="match">';
                                        $ltext .= esc_html($2, -nbsp=>1);
                                        $ltext .= '</span>';
                                        $ltext .= esc_html($3, -nbsp=>1);
                                } else {
                                        $ltext = esc_html($ltext, -nbsp=>1);
                                }
                                print "<div class=\"pre\">" .
                                        $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                               file_name=>"$file").'#l'.$lno,
                                                -class => "linenr"}, sprintf('%4i', $lno))
                                        . ' ' .  $ltext . "</div>\n";
                        }
                }
                if ($lastfile) {
                        print "</td></tr>\n";
                        if ($matches > 1000) {
                                print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                        }
                } else {
                        print "<div class=\"diff nodifferences\">No matches found</div>\n";
                }
                close $fd;

                print "</table>\n";

        } else {
                # unrecognized search type: nothing to show but the page frame
                git_header_html();
        }

        git_footer_html();
}
6813
# Action handler for 'search_help': prints an HTML page describing the
# search types.  The 'commit', 'author' and 'committer' entries are always
# shown; the 'grep' and 'pickaxe' entries appear only when the feature of
# the same name is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general introduction and the 'commit' entry
        print <<'HELP_INTRO';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        # optional 'grep' entry
        if (gitweb_check_feature('grep')) {
                print <<'HELP_GREP';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        # 'author' and 'committer' entries
        print <<'HELP_PEOPLE';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        # optional 'pickaxe' entry
        if (gitweb_check_feature('pickaxe')) {
                print <<'HELP_PICKAXE';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
6857
# Action handler for 'shortlog': hands the request over to git_log_generic(),
# using git_shortlog_body() as the body renderer and passing the request
# globals $hash and $hash_parent.
sub git_shortlog {
        return git_log_generic(
                'shortlog',
                \&git_shortlog_body,
                $hash,
                $hash_parent,
        );
}
6862
6863 ## ......................................................................
6864 ## feeds (RSS, Atom; OPML)
6865
6866 sub git_feed {
6867         my $format = shift || 'atom';
6868         my $have_blame = gitweb_check_feature('blame');
6869
6870         # Atom: http://www.atomenabled.org/developers/syndication/
6871         # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
6872         if ($format ne 'rss' && $format ne 'atom') {
6873                 die_error(400, "Unknown web feed format");
6874         }
6875
6876         # log/feed of current (HEAD) branch, log of given branch, history of file/directory
6877         my $head = $hash || 'HEAD';
6878         my @commitlist = parse_commits($head, 150, 0, $file_name);
6879
6880         my %latest_commit;
6881         my %latest_date;
6882         my $content_type = "application/$format+xml";
6883         if (defined $cgi->http('HTTP_ACCEPT') &&
6884                  $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
6885                 # browser (feed reader) prefers text/xml
6886                 $content_type = 'text/xml';
6887         }
6888         if (defined($commitlist[0])) {
6889                 %latest_commit = %{$commitlist[0]};
6890                 my $latest_epoch = $latest_commit{'committer_epoch'};
6891                 %latest_date   = parse_date($latest_epoch);
6892                 my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
6893                 if (defined $if_modified) {
6894                         my $since;
6895                         if (eval { require HTTP::Date; 1; }) {
6896                                 $since = HTTP::Date::str2time($if_modified);
6897                         } elsif (eval { require Time::ParseDate; 1; }) {
6898                                 $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
6899                         }
6900                         if (defined $since && $latest_epoch <= $since) {
6901                                 print $cgi->header(
6902                                         -type => $content_type,
6903                                         -charset => 'utf-8',
6904                                         -last_modified => $latest_date{'rfc2822'},
6905                                         -status => '304 Not Modified');
6906                                 return;
6907                         }
6908                 }
6909                 print $cgi->header(
6910                         -type => $content_type,
6911                         -charset => 'utf-8',
6912                         -last_modified => $latest_date{'rfc2822'});
6913         } else {
6914                 print $cgi->header(
6915                         -type => $content_type,
6916                         -charset => 'utf-8');
6917         }
6918
6919         # Optimization: skip generating the body if client asks only
6920         # for Last-Modified date.
6921         return if ($cgi->request_method() eq 'HEAD');
6922
6923         # header variables
6924         my $title = "$site_name - $project/$action";
6925         my $feed_type = 'log';
6926         if (defined $hash) {
6927                 $title .= " - '$hash'";
6928                 $feed_type = 'branch log';
6929                 if (defined $file_name) {
6930                         $title .= " :: $file_name";
6931                         $feed_type = 'history';
6932                 }
6933         } elsif (defined $file_name) {
6934                 $title .= " - $file_name";
6935                 $feed_type = 'history';
6936         }
6937         $title .= " $feed_type";
6938         my $descr = git_get_project_description($project);
6939         if (defined $descr) {
6940                 $descr = esc_html($descr);
6941         } else {
6942                 $descr = "$project " .
6943                          ($format eq 'rss' ? 'RSS' : 'Atom') .
6944                          " feed";
6945         }
6946         my $owner = git_get_project_owner($project);
6947         $owner = esc_html($owner);
6948
6949         #header
6950         my $alt_url;
6951         if (defined $file_name) {
6952                 $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
6953         } elsif (defined $hash) {
6954                 $alt_url = href(-full=>1, action=>"log", hash=>$hash);
6955         } else {
6956                 $alt_url = href(-full=>1, action=>"summary");
6957         }
6958         print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
6959         if ($format eq 'rss') {
6960                 print <<XML;
6961 <rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
6962 <channel>
6963 XML
6964                 print "<title>$title</title>\n" .
6965                       "<link>$alt_url</link>\n" .
6966                       "<description>$descr</description>\n" .
6967                       "<language>en</language>\n" .
6968                       # project owner is responsible for 'editorial' content
6969                       "<managingEditor>$owner</managingEditor>\n";
6970                 if (defined $logo || defined $favicon) {
6971                         # prefer the logo to the favicon, since RSS
6972                         # doesn't allow both
6973                         my $img = esc_url($logo || $favicon);
6974                         print "<image>\n" .
6975                               "<url>$img</url>\n" .
6976                               "<title>$title</title>\n" .
6977                               "<link>$alt_url</link>\n" .
6978                               "</image>\n";
6979                 }
6980                 if (%latest_date) {
6981                         print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
6982                         print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
6983                 }
6984                 print "<generator>gitweb v.$version/$git_version</generator>\n";
6985         } elsif ($format eq 'atom') {
6986                 print <<XML;
6987 <feed xmlns="http://www.w3.org/2005/Atom">
6988 XML
6989                 print "<title>$title</title>\n" .
6990                       "<subtitle>$descr</subtitle>\n" .
6991                       '<link rel="alternate" type="text/html" href="' .
6992                       $alt_url . '" />' . "\n" .
6993                       '<link rel="self" type="' . $content_type . '" href="' .
6994                       $cgi->self_url() . '" />' . "\n" .
6995                       "<id>" . href(-full=>1) . "</id>\n" .
6996                       # use project owner for feed author
6997                       "<author><name>$owner</name></author>\n";
6998                 if (defined $favicon) {
6999                         print "<icon>" . esc_url($favicon) . "</icon>\n";
7000                 }
7001                 if (defined $logo_url) {
7002                         # not twice as wide as tall: 72 x 27 pixels
7003                         print "<logo>" . esc_url($logo) . "</logo>\n";
7004                 }
7005                 if (! %latest_date) {
7006                         # dummy date to keep the feed valid until commits trickle in:
7007                         print "<updated>1970-01-01T00:00:00Z</updated>\n";
7008                 } else {
7009                         print "<updated>$latest_date{'iso-8601'}</updated>\n";
7010                 }
7011                 print "<generator version='$version/$git_version'>gitweb</generator>\n";
7012         }
7013
7014         # contents
7015         for (my $i = 0; $i <= $#commitlist; $i++) {
7016                 my %co = %{$commitlist[$i]};
7017                 my $commit = $co{'id'};
7018                 # we read 150, we always show 30 and the ones more recent than 48 hours
7019                 if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
7020                         last;
7021                 }
7022                 my %cd = parse_date($co{'author_epoch'});
7023
7024                 # get list of changed files
7025                 open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7026                         $co{'parent'} || "--root",
7027                         $co{'id'}, "--", (defined $file_name ? $file_name : ())
7028                         or next;
7029                 my @difftree = map { chomp; $_ } <$fd>;
7030                 close $fd
7031                         or next;
7032
7033                 # print element (entry, item)
7034                 my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
7035                 if ($format eq 'rss') {
7036                         print "<item>\n" .
7037                               "<title>" . esc_html($co{'title'}) . "</title>\n" .
7038                               "<author>" . esc_html($co{'author'}) . "</author>\n" .
7039                               "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
7040                               "<guid isPermaLink=\"true\">$co_url</guid>\n" .
7041                               "<link>$co_url</link>\n" .
7042                               "<description>" . esc_html($co{'title'}) . "</description>\n" .
7043                               "<content:encoded>" .
7044                               "<![CDATA[\n";
7045                 } elsif ($format eq 'atom') {
7046                         print "<entry>\n" .
7047                               "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
7048                               "<updated>$cd{'iso-8601'}</updated>\n" .
7049                               "<author>\n" .
7050                               "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
7051                         if ($co{'author_email'}) {
7052                                 print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
7053                         }
7054                         print "</author>\n" .
7055                               # use committer for contributor
7056                               "<contributor>\n" .
7057                               "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
7058                         if ($co{'committer_email'}) {
7059                                 print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
7060                         }
7061                         print "</contributor>\n" .
7062                               "<published>$cd{'iso-8601'}</published>\n" .
7063                               "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
7064                               "<id>$co_url</id>\n" .
7065                               "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
7066                               "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
7067                 }
7068                 my $comment = $co{'comment'};
7069                 print "<pre>\n";
7070                 foreach my $line (@$comment) {
7071                         $line = esc_html($line);
7072                         print "$line\n";
7073                 }
7074                 print "</pre><ul>\n";
7075                 foreach my $difftree_line (@difftree) {
7076                         my %difftree = parse_difftree_raw_line($difftree_line);
7077                         next if !$difftree{'from_id'};
7078
7079                         my $file = $difftree{'file'} || $difftree{'to_file'};
7080
7081                         print "<li>" .
7082                               "[" .
7083                               $cgi->a({-href => href(-full=>1, action=>"blobdiff",
7084                                                      hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
7085                                                      hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
7086                                                      file_name=>$file, file_parent=>$difftree{'from_file'}),
7087                                       -title => "diff"}, 'D');
7088                         if ($have_blame) {
7089                                 print $cgi->a({-href => href(-full=>1, action=>"blame",
7090                                                              file_name=>$file, hash_base=>$commit),
7091                                               -title => "blame"}, 'B');
7092                         }
7093                         # if this is not a feed of a file history
7094                         if (!defined $file_name || $file_name ne $file) {
7095                                 print $cgi->a({-href => href(-full=>1, action=>"history",
7096                                                              file_name=>$file, hash=>$commit),
7097                                               -title => "history"}, 'H');
7098                         }
7099                         $file = esc_path($file);
7100                         print "] ".
7101                               "$file</li>\n";
7102                 }
7103                 if ($format eq 'rss') {
7104                         print "</ul>]]>\n" .
7105                               "</content:encoded>\n" .
7106                               "</item>\n";
7107                 } elsif ($format eq 'atom') {
7108                         print "</ul>\n</div>\n" .
7109                               "</content>\n" .
7110                               "</entry>\n";
7111                 }
7112         }
7113
7114         # end of feed
7115         if ($format eq 'rss') {
7116                 print "</channel>\n</rss>\n";
7117         } elsif ($format eq 'atom') {
7118                 print "</feed>\n";
7119         }
7120 }
7121
# Emit the feed in RSS format.
# Delegates all the work to git_feed(), selecting its 'rss' output branch.
sub git_rss {
        return git_feed('rss');
}
7125
# Emit the feed in Atom format.
# Delegates all the work to git_feed(), selecting its 'atom' output branch.
sub git_atom {
        return git_feed('atom');
}
7129
# Print an OPML 1.0 document with one <outline> entry per project, each
# pointing at the project's RSS feed (xmlUrl) and summary page (htmlUrl).
#
# Takes no arguments.  Prints the HTTP header followed by the XML body.
# Projects for which git_get_head_hash() returns undef, or whose head
# commit parse_commit() cannot parse, are silently left out of the list.
#
# Side effect: the global $git_dir is reassigned for every project that
# has a head, and is left pointing at the last such project.
sub git_opml {
        my @list = git_get_projects_list();

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        # The site name is free-form text; escape it so that characters such
        # as '&' or '<' cannot make the generated XML ill-formed.
        my $title = esc_html($site_name);

        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;

                # no head: nothing to offer a feed for
                my $head = git_get_head_hash($proj{'path'});
                next if !defined $head;

                # NOTE(review): parse_commit() presumably reads the global
                # $git_dir, so it has to be set before the call -- confirm.
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                next if !%co;

                # shortened, escaped project path serves as both text and title
                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}