Merge branch 'kk/maint-gitweb-missing-owner'
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8'; # everything printed to STDOUT goes through the :utf8 layer
22
23 our $t0 = [ gettimeofday() ]; # time at script start, in the [sec, usec] form Time::HiRes uses
24 our $number_of_git_cmds = 0; # counter, bumped after each git invocation (see evaluate_git_version)
25
26 BEGIN {
27         CGI->compile() if $ENV{'MOD_PERL'}; # only when MOD_PERL is set in the environment
28 }
29
30 our $version = "++GIT_VERSION++"; # "++...++" placeholder - presumably substituted at build time
31
our ($my_url, $my_uri, $base_url, $path_info, $home_link);

# Compute the URL-related globals for the current request.
#
# Takes no arguments; reads the global CGI object $cgi and %ENV, and sets:
#   $my_url    - URL of the script as reported by $cgi->url(), PATH_INFO stripped
#   $my_uri    - absolute path part of that URL, PATH_INFO stripped
#   $base_url  - base URL for relative URLs in gitweb ($logo, $favicon, ...),
#                needed and used only for URLs with nonempty PATH_INFO
#   $path_info - PATH_INFO decoded as UTF-8 (undef or empty when absent)
#   $home_link - target of the home link on top of all pages
sub evaluate_uri {
        our $cgi;

        our $my_url = $cgi->url();
        our $my_uri = $cgi->url(-absolute => 1);

        # Until we know better, the script URL doubles as the base URL.
        our $base_url = $my_url;

        # When the script is used as DirectoryIndex, the URL does not contain the name
        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
        # have to do it ourselves. We make $path_info global because it's also used
        # later on.
        #
        # Another issue with the script being the DirectoryIndex is that the resulting
        # $my_url data is not the full script URL: this is good, because we want
        # generated links to keep implying the script name if it wasn't explicitly
        # indicated in the URL we're handling, but it means that $my_url cannot be used
        # as base URL.
        # Therefore, if we needed to strip PATH_INFO, then we know that we have
        # to build the base URL ourselves:
        our $path_info = decode_utf8($ENV{"PATH_INFO"});
        if ($path_info) {
                # PATH_INFO reaches us already URL-decoded by the web server, while
                # $my_url and $my_uri are still URL-encoded.  Decode them first,
                # otherwise a path containing escaped characters (spaces, non-ASCII,
                # ...) never matches and is silently left in place.
                $my_url = unescape($my_url);
                $my_uri = unescape($my_uri);
                if ($my_url =~ s,\Q$path_info\E$,, &&
                    $my_uri =~ s,\Q$path_info\E$,, &&
                    defined $ENV{'SCRIPT_NAME'}) {
                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                }
        }

        # target of the home link on top of all pages
        our $home_link = $my_uri || "/";
}
67
68 # core git executable to use
69 # this can just be "git" if your webserver has a sensible PATH
70 our $GIT = "++GIT_BINDIR++/git";
71
72 # absolute fs-path which will be prepended to the project path
73 #our $projectroot = "/pub/scm";
74 our $projectroot = "++GITWEB_PROJECTROOT++";
75
76 # filesystem traversal depth limit used when collecting the project list;
77 # the depth is counted relative to $projectroot
78 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
79
80 # string of the home link on top of all pages
81 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
82
83 # name of your site or organization to appear in page titles; when empty it
84 # falls back to "<SERVER_NAME> Git", or "Untitled Git" without SERVER_NAME
85 our $site_name = "++GITWEB_SITENAME++"
86                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
87
88 # html snippet to include in the <head> section of each page
89 our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
90 # filename of html text to include at top of each page
91 our $site_header = "++GITWEB_SITE_HEADER++";
92 # html text to include at home page
93 our $home_text = "++GITWEB_HOMETEXT++";
94 # filename of html text to include at bottom of each page
95 our $site_footer = "++GITWEB_SITE_FOOTER++";
96
97 # URI of stylesheets
98 our @stylesheets = ("++GITWEB_CSS++");
99 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
100 our $stylesheet = undef;
101 # URI of GIT logo (72x27 size)
102 our $logo = "++GITWEB_LOGO++";
103 # URI of GIT favicon, assumed to be image/png type
104 our $favicon = "++GITWEB_FAVICON++";
105 # URI of gitweb.js (JavaScript code for gitweb)
106 our $javascript = "++GITWEB_JS++";
107
108 # URI and label (title) of GIT logo link
109 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
110 #our $logo_label = "git documentation";
111 our $logo_url = "http://git-scm.com/";
112 our $logo_label = "git homepage";
113
114 # source of projects list
115 our $projects_list = "++GITWEB_LIST++";
116
117 # the width (in characters) of the projects list "Description" column
118 our $projects_list_description_width = 25;
119
120 # group projects by category on the projects list
121 # (enabled if this variable evaluates to true)
122 our $projects_list_group_categories = 0;
123
124 # default category if none specified
125 # (leave the empty string for no category)
126 our $project_list_default_category = "";
127
128 # default order of projects list
129 # valid values are none, project, descr, owner, and age
130 our $default_projects_order = "project";
131
132 # show repository only if this file exists
133 # (only effective if this variable evaluates to true)
134 our $export_ok = "++GITWEB_EXPORT_OK++";
135
136 # show repository only if this subroutine returns true
137 # when given the path to the project, for example:
138 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
139 our $export_auth_hook = undef;
140
141 # only allow viewing of repositories also shown on the overview page
142 our $strict_export = "++GITWEB_STRICT_EXPORT++";
143
144 # list of git base URLs used to build the URLs a project can be fetched from,
145 # i.e. full URL is "$git_base_url/$project"; empty entries are dropped
146 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
147
148 # default blob_plain mimetype and default charset for text/plain blob
149 our $default_blob_plain_mimetype = 'text/plain';
150 our $default_text_plain_charset  = undef;
151
152 # file to use for guessing MIME types before trying /etc/mime.types
153 # (relative to the current git repository)
154 our $mimetypes_file = undef;
155
156 # assume this charset if a line contains non-UTF-8 characters;
157 # it should be a valid encoding (see Encode::Supported(3pm) for the list)
158 # in which every byte sequence is valid, for example
159 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
160 # could even be 'utf-8' for the old behavior)
161 our $fallback_encoding = 'latin1';
162
163 # rename detection options for git-diff and git-diff-tree
164 # - default is '-M', with the cost proportional to
165 #   (number of removed files) * (number of new files).
166 # - more costly is '-C' (which implies '-M'), with the cost proportional to
167 #   (number of changed files + number of removed files) * (number of new files)
168 # - even more costly is '-C', '--find-copies-harder' with cost
169 #   (number of files in the original tree) * (number of new files)
170 # - one might want to include '-B' option, e.g. '-B', '-M'
171 our @diff_opts = ('-M'); # taken from git_commit
172
173 # Disables features that would allow repository owners to inject script into
174 # the gitweb domain.
175 our $prevent_xss = 0;
176
177 # Path to the highlight executable to use (must be the one from
178 # http://www.andre-simon.de due to assumptions about parameters and output).
179 # Useful if highlight is not installed on your webserver's PATH.
180 # [Default: highlight]
181 our $highlight_bin = "++HIGHLIGHT_BIN++";
182
183 # information about snapshot formats that gitweb is capable of serving
184 our %known_snapshot_formats = (
185         # name => {
186         #       'display' => display name,
187         #       'type' => mime type,
188         #       'suffix' => filename suffix,
189         #       'format' => --format for git-archive,
190         #       'compressor' => [compressor command and arguments]
191         #                       (array reference, optional)
192         #       'disabled' => boolean (optional; true entries are removed by filter_snapshot_fmts)}
193         #
194         'tgz' => {
195                 'display' => 'tar.gz',
196                 'type' => 'application/x-gzip',
197                 'suffix' => '.tar.gz',
198                 'format' => 'tar',
199                 'compressor' => ['gzip', '-n']},
200
201         'tbz2' => {
202                 'display' => 'tar.bz2',
203                 'type' => 'application/x-bzip2',
204                 'suffix' => '.tar.bz2',
205                 'format' => 'tar',
206                 'compressor' => ['bzip2']},
207
208         'txz' => {
209                 'display' => 'tar.xz',
210                 'type' => 'application/x-xz',
211                 'suffix' => '.tar.xz',
212                 'format' => 'tar',
213                 'compressor' => ['xz'],
214                 'disabled' => 1},
215
216         'zip' => {
217                 'display' => 'zip',
218                 'type' => 'application/x-zip',
219                 'suffix' => '.zip',
220                 'format' => 'zip'},
221 );
222
223 # Aliases so that old gitweb.snapshot values found in repository
224 # configuration are still understood (applied by filter_snapshot_fmts).
225 our %known_snapshot_format_aliases = (
226         'gzip'  => 'tgz',
227         'bzip2' => 'tbz2',
228         'xz'    => 'txz',
229
230         # backward compatibility: legacy config values, mapped to undef (no format)
231         'x-gzip' => undef, 'gz' => undef,
232         'x-bzip2' => undef, 'bz2' => undef,
233         'x-zip' => undef, '' => undef,
234 );
235
236 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
237 # are changed, it may be appropriate to change these values too via
238 # $GITWEB_CONFIG.
239 our %avatar_size = (
240         'default' => 16,
241         'double'  => 32
242 );
243
244 # Used to set the maximum load that we will still respond to gitweb queries.
245 # If the server load exceeds this value then a "503 server busy" error is returned.
246 # If gitweb cannot determine the server load, it is taken to be 0.
247 # Leave it undefined (or set to 'undef') to turn off load checking.
248 our $maxload = 300;
249
250 # configuration for 'highlight' (http://www.andre-simon.de/)
251 # match by basename
252 our %highlight_basename = (
253         #'Program' => 'py',
254         #'Library' => 'py',
255         'SConstruct' => 'py', # SCons equivalent of Makefile
256         'Makefile' => 'make',
257 );
258 # match by extension
259 our %highlight_ext = (
260         # main extensions, defining name of syntax (each maps to itself);
261         # see files in /usr/share/highlight/langDefs/ directory
262         map { $_ => $_ }
263                 qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
264         # alternate extensions, see /etc/highlight/filetypes.conf
265         'h' => 'c',
266         map { $_ => 'sh'  } qw(bash zsh ksh),
267         map { $_ => 'cpp' } qw(cxx c++ cc),
268         map { $_ => 'php' } qw(php3 php4 php5 phps),
269         map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
270         map { $_ => 'make'} qw(mak mk),
271         map { $_ => 'xml' } qw(xhtml html htm),
272 );
273
274 # You define site-wide feature defaults here; override them with
275 # $GITWEB_CONFIG as necessary.
276 our %feature = (
277         # feature => {
278         #       'sub' => feature-sub (subroutine),
279         #       'override' => allow-override (boolean),
280         #       'default' => [ default options...] (array reference)}
281         #
282         # if feature is overridable (it means that allow-override has true value),
283         # then feature-sub will be called with default options as parameters;
284         # the return value of feature-sub is used as the value of the feature
285         #
286         # if there is no 'sub' key (no feature-sub), then feature cannot be
287         # overridden
288         #
289         # use gitweb_get_feature(<feature>) to retrieve the <feature> value
290         # (an array) or gitweb_check_feature(<feature>) to check if <feature>
291         # is enabled
292
293         # Enable the 'blame' blob view, showing the last commit that modified
294         # each line in the file. This can be very CPU-intensive.
295
296         # To enable system wide have in $GITWEB_CONFIG
297         # $feature{'blame'}{'default'} = [1];
298         # To have project specific config enable override in $GITWEB_CONFIG
299         # $feature{'blame'}{'override'} = 1;
300         # and in project config gitweb.blame = 0|1;
301         'blame' => {
302                 'sub' => sub { feature_bool('blame', @_) },
303                 'override' => 0,
304                 'default' => [0]},
305
306         # Enable the 'snapshot' link, providing a compressed archive of any
307         # tree. This can potentially generate high traffic if you have large
308         # projects.
309
310         # Value is a list of formats defined in %known_snapshot_formats that
311         # you wish to offer.
312         # To disable system wide have in $GITWEB_CONFIG
313         # $feature{'snapshot'}{'default'} = [];
314         # To have project specific config enable override in $GITWEB_CONFIG
315         # $feature{'snapshot'}{'override'} = 1;
316         # and in project config, a comma-separated list of formats or "none"
317         # to disable.  Example: gitweb.snapshot = tbz2,zip;
318         'snapshot' => {
319                 'sub' => \&feature_snapshot,
320                 'override' => 0,
321                 'default' => ['tgz']},
322
323         # Enable text search, which will list the commits which match author,
324         # committer or commit text to a given string.  Enabled by default.
325         # Project specific override is not supported.
326         #
327         # Note that this controls all search features, which means that if
328         # it is disabled, then 'grep' and 'pickaxe' search would also be
329         # disabled.
330         'search' => {
331                 'override' => 0,
332                 'default' => [1]},
333
334         # Enable grep search, which will list the files in currently selected
335         # tree containing the given string. Enabled by default. This can be
336         # potentially CPU-intensive, of course.
337         # Note that you need to have 'search' feature enabled too.
338
339         # To enable system wide have in $GITWEB_CONFIG
340         # $feature{'grep'}{'default'} = [1];
341         # To have project specific config enable override in $GITWEB_CONFIG
342         # $feature{'grep'}{'override'} = 1;
343         # and in project config gitweb.grep = 0|1;
344         'grep' => {
345                 'sub' => sub { feature_bool('grep', @_) },
346                 'override' => 0,
347                 'default' => [1]},
348
349         # Enable the pickaxe search, which will list the commits that modified
350         # a given string in a file. This can be a practical and considerably faster
351         # alternative to 'blame', but still potentially CPU-intensive.
352         # Note that you need to have 'search' feature enabled too.
353
354         # To enable system wide have in $GITWEB_CONFIG
355         # $feature{'pickaxe'}{'default'} = [1];
356         # To have project specific config enable override in $GITWEB_CONFIG
357         # $feature{'pickaxe'}{'override'} = 1;
358         # and in project config gitweb.pickaxe = 0|1;
359         'pickaxe' => {
360                 'sub' => sub { feature_bool('pickaxe', @_) },
361                 'override' => 0,
362                 'default' => [1]},
363
364         # Enable showing size of blobs in a 'tree' view, in a separate
365         # column, similar to what 'ls -l' does.  This costs a bit of I/O.
366
367         # To disable system wide have in $GITWEB_CONFIG
368         # $feature{'show-sizes'}{'default'} = [0];
369         # To have project specific config enable override in $GITWEB_CONFIG
370         # $feature{'show-sizes'}{'override'} = 1;
371         # and in project config gitweb.showsizes = 0|1;
372         'show-sizes' => {
373                 'sub' => sub { feature_bool('showsizes', @_) },
374                 'override' => 0,
375                 'default' => [1]},
376
377         # Make gitweb use an alternative format of the URLs which can be
378         # more readable and natural-looking: project name is embedded
379         # directly in the path and the query string contains other
380         # auxiliary information. All gitweb installations recognize
381         # URL in either format; this configures in which formats gitweb
382         # generates links.
383
384         # To enable system wide have in $GITWEB_CONFIG
385         # $feature{'pathinfo'}{'default'} = [1];
386         # Project specific override is not supported.
387
388         # Note that you will need to change the default location of CSS,
389         # favicon, logo and possibly other files to an absolute URL. Also,
390         # if gitweb.cgi serves as your indexfile, you will need to force
391         # $my_uri to contain the script name in your $GITWEB_CONFIG.
392         'pathinfo' => {
393                 'override' => 0,
394                 'default' => [0]},
395
396         # Make gitweb consider projects in project root subdirectories
397         # to be forks of existing projects. Given project $projname.git,
398         # projects matching $projname/*.git will not be shown in the main
399         # projects list, instead a '+' mark will be added to $projname
400         # there and a 'forks' view will be enabled for the project, listing
401         # all the forks. If project list is taken from a file, forks have
402         # to be listed after the main project.
403
404         # To enable system wide have in $GITWEB_CONFIG
405         # $feature{'forks'}{'default'} = [1];
406         # Project specific override is not supported.
407         'forks' => {
408                 'override' => 0,
409                 'default' => [0]},
410
411         # Insert custom links to the action bar of all project pages.
412         # This enables you mainly to link to third-party scripts integrating
413         # into gitweb; e.g. git-browser for graphical history representation
414         # or custom web-based repository administration interface.
415
416         # The 'default' value consists of a list of triplets in the form
417         # (label, link, position) where position is the label after which
418         # to insert the link and link is a format string where %n expands
419         # to the project name, %f to the project path within the filesystem,
420         # %h to the current hash (h gitweb parameter) and %b to the current
421         # hash base (hb gitweb parameter); %% expands to %.
422
423         # To enable system wide have in $GITWEB_CONFIG e.g.
424         # $feature{'actions'}{'default'} = [('graphiclog',
425         #       '/git-browser/by-commit.html?r=%n', 'summary')];
426         # Project specific override is not supported.
427         'actions' => {
428                 'override' => 0,
429                 'default' => []},
430
431         # Allow gitweb to scan the project content tags of a project repository,
432         # and display the popular Web 2.0-ish "tag cloud" near the projects
433         # list.  Note that this is something COMPLETELY different from the
434         # normal Git tags.
435
436         # gitweb by itself can show existing tags, but it does not handle
437         # tagging itself; you need to do it externally, outside gitweb.
438         # The format is described in git_get_project_ctags() subroutine.
439         # You may want to install the HTML::TagCloud Perl module to get
440         # a pretty tag cloud instead of just a list of tags.
441
442         # To enable system wide have in $GITWEB_CONFIG
443         # $feature{'ctags'}{'default'} = [1];
444         # Project specific override is not supported.
445
446         # In the future whether ctags editing is enabled might depend
447         # on the value, but using 1 should always mean no editing of ctags.
448         'ctags' => {
449                 'override' => 0,
450                 'default' => [0]},
451
452         # The maximum number of patches in a patchset generated in patch
453         # view. Set this to 0 or undef to disable patch view, or to a
454         # negative number to remove any limit.
455
456         # To disable system wide have in $GITWEB_CONFIG
457         # $feature{'patches'}{'default'} = [0];
458         # To have project specific config enable override in $GITWEB_CONFIG
459         # $feature{'patches'}{'override'} = 1;
460         # and in project config gitweb.patches = 0|n;
461         # where n is the maximum number of patches allowed in a patchset.
462         'patches' => {
463                 'sub' => \&feature_patches,
464                 'override' => 0,
465                 'default' => [16]},
466
467         # Avatar support. When this feature is enabled, views such as
468         # shortlog or commit will display an avatar associated with
469         # the email of the committer(s) and/or author(s).
470
471         # Currently available providers are gravatar and picon.
472         # If an unknown provider is specified, the feature is disabled.
473
474         # Gravatar depends on Digest::MD5.
475         # Picon currently relies on the indiana.edu database.
476
477         # To enable system wide have in $GITWEB_CONFIG
478         # $feature{'avatar'}{'default'} = ['<provider>'];
479         # where <provider> is either gravatar or picon.
480         # To have project specific config enable override in $GITWEB_CONFIG
481         # $feature{'avatar'}{'override'} = 1;
482         # and in project config gitweb.avatar = <provider>;
483         'avatar' => {
484                 'sub' => \&feature_avatar,
485                 'override' => 0,
486                 'default' => ['']},
487
488         # Enable displaying how much time and how many git commands
489         # it took to generate and display the page.  Disabled by default.
490         # Project specific override is not supported.
491         'timed' => {
492                 'override' => 0,
493                 'default' => [0]},
494
495         # Enable turning some links into links to actions which require
496         # JavaScript to run (like 'blame_incremental').  Not enabled by
497         # default.  Project specific override is currently not supported.
498         'javascript-actions' => {
499                 'override' => 0,
500                 'default' => [0]},
501
502         # Enable and configure ability to change common timezone for dates
503         # in gitweb output via JavaScript.  Enabled by default.
504         # Project specific override is not supported.
505         'javascript-timezone' => {
506                 'override' => 0,
507                 'default' => [
508                         'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
509                                      # or undef to turn off this feature
510                         'gitweb_tz', # name of cookie where to store selected timezone
511                         'datetime',  # CSS class used to mark up dates for manipulation
512                 ]},
513
514         # Syntax highlighting support. This is based on Daniel Svensson's
515         # and Sham Chukoury's work in gitweb-xmms2.git.
516         # It requires the 'highlight' program present in $PATH,
517         # and therefore is disabled by default.
518
519         # To enable system wide have in $GITWEB_CONFIG
520         # $feature{'highlight'}{'default'} = [1];
521         # (per project: set $feature{'highlight'}{'override'} = 1; the sub then reads gitweb.highlight)
522         'highlight' => {
523                 'sub' => sub { feature_bool('highlight', @_) },
524                 'override' => 0,
525                 'default' => [0]},
526
527         # Enable displaying of remote heads in the heads list
528
529         # To enable system wide have in $GITWEB_CONFIG
530         # $feature{'remote_heads'}{'default'} = [1];
531         # To have project specific config enable override in $GITWEB_CONFIG
532         # $feature{'remote_heads'}{'override'} = 1;
533         # and in project config gitweb.remote_heads = 0|1;
534         'remote_heads' => {
535                 'sub' => sub { feature_bool('remote_heads', @_) },
536                 'override' => 0,
537                 'default' => [0]},
538 );
539
# Return the effective value (a list) of the feature called $name.
#
# Unknown feature: returns nothing.  Otherwise the site-wide 'default' list
# is returned, unless the feature has a true 'override' flag and a
# repository is selected ($git_dir defined); then the feature's 'sub' is
# called with the defaults and its result is returned instead.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $spec     = $feature{$name};
        my @defaults = @{$spec->{'default'}};

        # project specific override is possible only if we have project
        our $git_dir; # global variable, declared later
        return @defaults
                unless $spec->{'override'} && defined $git_dir;

        my $override_sub = $spec->{'sub'};
        if (defined $override_sub) {
                return $override_sub->(@defaults);
        }

        # 'override' was switched on for a feature that has no feature-sub
        warn "feature $name is not overridable";
        return @defaults;
}
558
# Convenience wrapper: yield only the first element of a feature's value,
# so that boolean-like features can be tested directly:
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# which replaces the more verbose
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
        my @settings = gitweb_get_feature(@_);
        # list slice on purpose: it yields nothing for an empty value
        return (@settings)[0];
}
573
574
# Feature-sub for on/off features.
#   $key     - name of the gitweb.<key> project config variable
#   $default - site-wide default, used when the project does not set the key
# Returns a one-element list: (1) for 'true', (0) for 'false', or the
# default when git_get_project_config() reports no value.
sub feature_bool {
        my ($key, $default) = @_;
        my ($configured) = git_get_project_config($key, '--bool');

        # the project says nothing: keep the site-wide default
        return ($default) unless defined $configured;

        if ($configured eq 'true') {
                return (1);
        } elsif ($configured eq 'false') {
                return (0);
        }
}
587
# Feature-sub for 'snapshot': the list of offered snapshot formats.
# Receives the site-wide default formats; a true gitweb.snapshot value in
# the project config replaces them ("none" means no formats at all, anything
# else is split on commas and/or whitespace).
sub feature_snapshot {
        my @defaults = @_;

        my ($configured) = git_get_project_config('snapshot');
        return @defaults unless $configured;

        my @formats = $configured eq 'none'
                ? ()
                : split(/\s*[,\s]\s*/, $configured);
        return @formats;
}
599
# Feature-sub for 'patches': maximum number of patches in a patchset.
# Whatever git_get_project_config('patches', '--int') returns wins; only
# when it returns nothing is the first default passed in used.
sub feature_patches {
        my ($default_limit) = @_;
        my @configured = git_get_project_config('patches', '--int');

        return @configured ? @configured : ($default_limit);
}
609
# Feature-sub for 'avatar': the project's gitweb.avatar setting if
# git_get_project_config() returns one, otherwise the defaults passed in.
sub feature_avatar {
        my @configured = git_get_project_config('avatar');

        if (@configured) {
                return @configured;
        }
        return @_;
}
615
# Tell whether $dir has a usable HEAD.
# A plain existence test is not enough: in a repository initialized long
# ago HEAD can be a symlink, and after pack-refs + prune its target file is
# gone, so -e fails.  Such a dangling symlink is still accepted as long as
# it points below refs/heads/.
sub check_head_link {
        my ($dir) = @_;
        my $headfile = "$dir/HEAD";

        return 1 if -e $headfile;
        return (-l $headfile && readlink($headfile) =~ /^refs\/heads\//);
}
625
# Decide whether the repository in $dir may be shown.  All of these must hold:
#   - it has a valid HEAD (check_head_link),
#   - $export_ok is unset, or the file "$dir/$export_ok" exists,
#   - $export_auth_hook is unset, or the hook returns true for $dir.
# The checks short-circuit, so the hook runs only if the earlier ones pass.
sub check_export_ok {
        my ($dir) = @_;
        return (check_head_link($dir)
                && ($export_ok ? -e "$dir/$export_ok" : 1)
                && ($export_auth_hook ? $export_auth_hook->($dir) : 1));
}
632
# Normalize a list of snapshot format names.
#   - alternate names are translated through %known_snapshot_format_aliases
#     (backward compatibility);
#   - unknown and disabled formats are filtered out.
# Takes the format names as a list and returns the surviving names.
sub filter_snapshot_fmts {
        my @fmts = @_;

        # Legacy aliases map to undef: they are recognized but select nothing.
        @fmts = map {
                defined $_ && exists $known_snapshot_format_aliases{$_} ?
                       $known_snapshot_format_aliases{$_} : $_} @fmts;
        # Drop the undefs first, so they are never used as a hash key
        # (which would emit "uninitialized value" warnings).
        @fmts = grep {
                defined $_ &&
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}} @fmts;

        return @fmts;
}
645
646 # If this is set to a code reference, that code is run once per
647 # request, which allows updating configuration that changes with each request
648 # while the rest of the config file is still run only once.
649 #
650 # Otherwise, if it is false then gitweb processes the config file only once;
651 # if it is true then the gitweb config is run for each request.
652 our $per_request_config = 1;
653
# Read and run the gitweb config file $filename.
#
# Returns true if the file exists and was run, false (empty list / undef)
# if $filename is undefined or no such file exists - a recoverable
# situation, which lets callers chain this subroutine and use the first
# file that exists.  Dies with the parser's message if the file fails to
# compile (or itself dies), as that is unrecoverable.
sub read_config_file {
        my $filename = shift;
        return unless defined $filename;
        return unless -e $filename;

        # "do FILE" looks a bare relative name up in @INC rather than in the
        # current directory (and "." is no longer in @INC since Perl 5.26).
        # Anchor such names explicitly, so the file that -e just found is
        # the file that gets executed.
        require File::Spec;
        if (!File::Spec->file_name_is_absolute($filename) &&
            $filename !~ m{^\.\.?[/\\]}) {
                $filename = "./$filename";
        }

        do $filename;
        # die if there are errors parsing config file
        die $@ if $@;
        return 1;
}
669
our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);

# Work out the config file names (environment first, built-in value as
# fallback) and load them: the common file always, then the per-instance
# file if it exists, otherwise the system-wide one.
sub evaluate_gitweb_config {
        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

        # Protect against duplicated file names, so that no config is read twice.
        # Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM is used, so a
        # duplicate between those two does not matter.
        for my $candidate ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                $candidate = "" if ($candidate eq $GITWEB_CONFIG_COMMON);
        }

        # Common system-wide settings for convenience.
        # Those settings can be overridden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
        read_config_file($GITWEB_CONFIG_COMMON);

        # Use first config file that exists.  This means use the per-instance
        # GITWEB_CONFIG if exists, otherwise use GITWEB_CONFIG_SYSTEM.
        return if read_config_file($GITWEB_CONFIG);
        return read_config_file($GITWEB_CONFIG_SYSTEM);
}
691
# Get loadavg of system, to compare against $maxload.
# The value is the first field of '/proc/loadavg'.  When that file does not
# exist, cannot be opened, or yields no usable first field, 0 is returned,
# which means no load checking.
sub get_loadavg {
        my $proc_file = '/proc/loadavg';

        # additional checks for load average should go here for things that
        # don't export /proc/loadavg
        return 0 unless -e $proc_file;

        open my $fd, '<', $proc_file
                or return 0;
        my $line = <$fd>;
        close $fd;

        # The first three columns measure CPU and IO utilization of the last one,
        # five, and 10 minute periods.  The fourth column shows the number of
        # currently running processes and the total number of processes in the m/n
        # format.  The last column displays the last process ID used.
        my @load = split(/\s+/, $line);
        return $load[0] || 0;
}
713
# version of the core git binary
our $git_version;

# Run "$GIT --version" once and store the reported version string in
# $git_version ("unknown" if the output does not look like a version
# line); the invocation is counted in $number_of_git_cmds.
sub evaluate_git_version {
        my $banner = qx("$GIT" --version);
        our $git_version = ($banner =~ m/git version (.*)$/) ? $1 : "unknown";
        $number_of_git_cmds++;
}
720
# Refuse the request with a 503 error when load checking is enabled
# ($maxload defined) and the current load average is above $maxload.
sub check_loadavg {
        die_error(503, "The load average on the server is too high")
                if (defined $maxload && get_loadavg() > $maxload);
}
726
727 # ======================================================================
728 # input validation and dispatch
729
730 # input parameters can be collected from a variety of sources (presently, CGI
731 # and PATH_INFO), so we define an %input_params hash that collects them all
732 # together during validation: this allows subsequent uses (e.g. href()) to be
733 # agnostic of the parameter origin
734
735 our %input_params = ();
736
737 # input parameters are stored with the long parameter name as key. This will
738 # also be used in the href subroutine to convert parameters to their CGI
739 # equivalent, and since the href() usage is the most frequent one, we store
740 # the name -> CGI key mapping here, instead of the reverse.
741 #
742 # XXX: Warning: if you change this list, check whether the search form
743 # needs updating, too.
744
745 our @cgi_param_mapping = (
746         project => "p",
747         action => "a",
748         file_name => "f",
749         file_parent => "fp",
750         hash => "h",
751         hash_parent => "hp",
752         hash_base => "hb",
753         hash_parent_base => "hpb",
754         page => "pg",
755         order => "o",
756         searchtext => "s",
757         searchtype => "st",
758         snapshot_format => "sf",
759         extra_options => "opt",
760         search_use_regexp => "sr",
761         ctag => "by_tag",
762         diff_style => "ds",
763         project_filter => "pf",
764         # this must be last entry (for manipulation from JavaScript)
765         javascript => "js"
766 );
767 our %cgi_param_mapping = @cgi_param_mapping; # same pairs as a hash, for lookup by long name
768
# Dispatch table: every known action name mapped to the subroutine that
# implements it.  It is also used to validate the action parameter.
our %actions = (
	'blame'             => \&git_blame,
	'blame_incremental' => \&git_blame_incremental,
	'blame_data'        => \&git_blame_data,
	'blobdiff'          => \&git_blobdiff,
	'blobdiff_plain'    => \&git_blobdiff_plain,
	'blob'              => \&git_blob,
	'blob_plain'        => \&git_blob_plain,
	'commitdiff'        => \&git_commitdiff,
	'commitdiff_plain'  => \&git_commitdiff_plain,
	'commit'            => \&git_commit,
	'forks'             => \&git_forks,
	'heads'             => \&git_heads,
	'history'           => \&git_history,
	'log'               => \&git_log,
	'patch'             => \&git_patch,
	'patches'           => \&git_patches,
	'remotes'           => \&git_remotes,
	'rss'               => \&git_rss,
	'atom'              => \&git_atom,
	'search'            => \&git_search,
	'search_help'       => \&git_search_help,
	'shortlog'          => \&git_shortlog,
	'summary'           => \&git_summary,
	'tag'               => \&git_tag,
	'tags'              => \&git_tags,
	'tree'              => \&git_tree,
	'snapshot'          => \&git_snapshot,
	'object'            => \&git_object,

	# those below don't need $project
	'opml'              => \&git_opml,
	'project_list'      => \&git_project_list,
	'project_index'     => \&git_project_index,
);
804
# Allowed values of the extra_options ('opt') parameter, each mapped to the
# list of actions that accept it.
our %allowed_options = (
	'--no-merges' => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
);
810
# Fill %input_params from the CGI query: for every long name in
# %cgi_param_mapping, store the UTF-8 decoded value of the corresponding
# CGI key.  All values are single values, except for 'opt' which may be
# given several times and is therefore stored as an array reference (it is
# the only multi-valued parameter for the time being, so it is simply
# singled out here).
sub evaluate_query_params {
	our $cgi;

	foreach my $name (keys %cgi_param_mapping) {
		my $symbol = $cgi_param_mapping{$name};

		$input_params{$name} = ($symbol eq 'opt')
			? [ map { decode_utf8($_) } $cgi->param($symbol) ]
			: decode_utf8($cgi->param($symbol));
	}
}
826
# now read PATH_INFO and update the parameter list for missing parameters
#
# Nothing is done if the project was already given (e.g. in the query
# string) or if PATH_INFO is empty.  Otherwise the longest leading part of
# PATH_INFO for which check_head_link() succeeds becomes the project, and
# (unless an action was given in the query string) the remainder is parsed as
#
#   [action/][parent_ref[:parent_path]..][ref][:path]
#
# to fill in 'action', 'hash', 'hash_base', 'file_name', 'hash_parent',
# 'hash_parent_base', 'file_parent' and 'snapshot_format' in %input_params.
# Parameters are filled in with ||=, so values that are already set are kept.
#
# Side effects: strips leading slashes, the project and the action from the
# global $path_info, and may change the 'suffix' of an entry in
# %known_snapshot_formats (see the snapshot handling at the end).
sub evaluate_path_info {
	return if defined $input_params{'project'};
	return if !$path_info;
	$path_info =~ s,^/+,,;
	return if !$path_info;

	# find which part of PATH_INFO is project
	my $project = $path_info;
	$project =~ s,/+$,,;
	while ($project && !check_head_link("$projectroot/$project")) {
		# drop the last path component and try again
		$project =~ s,/*[^/]*$,,;
	}
	return unless $project;
	$input_params{'project'} = $project;

	# do not change any parameters if an action is given using the query string
	return if $input_params{'action'};
	$path_info =~ s,^\Q$project\E/*,,;

	# next, check if we have an action
	my $action = $path_info;
	$action =~ s,/.*$,,;
	if (exists $actions{$action}) {
		$path_info =~ s,^\Q$action\E/*,,;
		$input_params{'action'} = $action;
	}

	# list of actions that want hash_base instead of hash, but can have no
	# pathname (f) parameter
	my @wants_base = (
		'tree',
		'history',
	);

	# we want to catch, among others
	# [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
	my ($parentrefname, $parentpathname, $refname, $pathname) =
		($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

	# first, analyze the 'current' part
	if (defined $pathname) {
		# we got "branch:filename" or "branch:dir/"
		# we could use git_get_type(branch:pathname), but:
		# - it needs $git_dir
		# - it does a git() call
		# - the convention of terminating directories with a slash
		#   makes it superfluous
		# - embedding the action in the PATH_INFO would make it even
		#   more superfluous
		$pathname =~ s,^/+,,;
		if (!$pathname || substr($pathname, -1) eq "/") {
			$input_params{'action'} ||= "tree";
			$pathname =~ s,/$,,;
		} else {
			# the default action depends on whether we had parent info
			# or not
			if ($parentrefname) {
				$input_params{'action'} ||= "blobdiff_plain";
			} else {
				$input_params{'action'} ||= "blob_plain";
			}
		}
		$input_params{'hash_base'} ||= $refname;
		$input_params{'file_name'} ||= $pathname;
	} elsif (defined $refname) {
		# we got "branch". In this case we have to choose if we have to
		# set hash or hash_base.
		#
		# Most of the actions without a pathname only want hash to be
		# set, except for the ones specified in @wants_base that want
		# hash_base instead. It should also be noted that hand-crafted
		# links having 'history' as an action and no pathname or hash
		# set will fail, but that happens regardless of PATH_INFO.
		if (defined $parentrefname) {
			# if there is parent let the default be 'shortlog' action
			# (for http://git.example.com/repo.git/A..B links); if there
			# is no parent, dispatch will detect type of object and set
			# action appropriately if required (if action is not set)
			$input_params{'action'} ||= "shortlog";
		}
		if ($input_params{'action'} &&
		    grep { $_ eq $input_params{'action'} } @wants_base) {
			$input_params{'hash_base'} ||= $refname;
		} else {
			$input_params{'hash'} ||= $refname;
		}
	}

	# next, handle the 'parent' part, if present
	if (defined $parentrefname) {
		# a missing pathspec defaults to the 'current' filename, allowing e.g.
		# someproject/blobdiff/oldrev..newrev:/filename
		if ($parentpathname) {
			$parentpathname =~ s,^/+,,;
			$parentpathname =~ s,/$,,;
			$input_params{'file_parent'} ||= $parentpathname;
		} else {
			$input_params{'file_parent'} ||= $input_params{'file_name'};
		}
		# we assume that hash_parent_base is wanted if a path was specified,
		# or if the action wants hash_base instead of hash.
		# The action can still be undefined here (e.g. for "project/A.."
		# where neither a ref nor a path follows the ".."), so it is
		# checked before being compared.
		if (defined $input_params{'file_parent'} ||
		    (defined $input_params{'action'} &&
		     grep { $_ eq $input_params{'action'} } @wants_base)) {
			$input_params{'hash_parent_base'} ||= $parentrefname;
		} else {
			$input_params{'hash_parent'} ||= $parentrefname;
		}
	}

	# for the snapshot action, we allow URLs in the form
	# $project/snapshot/$hash.ext
	# where .ext determines the snapshot and gets removed from the
	# passed $refname to provide the $hash.
	#
	# To be able to tell that $refname includes the format extension, we
	# require the following two conditions to be satisfied:
	# - the hash input parameter MUST have been set from the $refname part
	#   of the URL (i.e. they must be equal)
	# - the snapshot format MUST NOT have been defined already (e.g. from
	#   CGI parameter sf)
	# It's also useless to try any matching unless $refname has a dot,
	# so we check for that too
	if (defined $input_params{'action'} &&
		$input_params{'action'} eq 'snapshot' &&
		defined $refname && index($refname, '.') != -1 &&
		defined $input_params{'hash'} &&
		$refname eq $input_params{'hash'} &&
		!defined $input_params{'snapshot_format'}) {
		# We loop over the known snapshot formats, checking for
		# extensions. Allowed extensions are both the defined suffix
		# (which includes the initial dot already) and the snapshot
		# format key itself, with a prepended dot.
		#
		# The loop is left early with 'last', so it iterates over keys()
		# rather than each(): each() would leave the iterator of the
		# global hash in the middle, and in a process that serves more
		# than one request the next each() loop over this hash would
		# then start from there and could miss formats.
		foreach my $fmt (keys %known_snapshot_formats) {
			my $opt = $known_snapshot_formats{$fmt};
			my $hash = $refname;
			unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
				next;
			}
			my $sfx = $1;
			# a valid suffix was found, so set the snapshot format
			# and reset the hash parameter
			$input_params{'snapshot_format'} = $fmt;
			$input_params{'hash'} = $hash;
			# we also set the format suffix to the one requested
			# in the URL: this way a request for e.g. .tgz returns
			# a .tgz instead of a .tar.gz
			$known_snapshot_formats{$fmt}{'suffix'} = $sfx;
			last;
		}
	}
}
977
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp, $project_filter);

# Copy the collected %input_params into the corresponding global variables,
# validating each one on the way.  An invalid value ends the request via
# die_error(): 404 for a bad project or project_filter, 403 for a too short
# search text, 400 for everything else.
#
# Besides the plain copies, $search_regexp is derived from $searchtext:
# the text itself when regexp search was requested (after checking that it
# compiles), its quotemeta()-ed form otherwise.
sub evaluate_and_validate_params {
	our $action = $input_params{'action'};
	if (defined $action) {
		if (!validate_action($action)) {
			die_error(400, "Invalid action parameter");
		}
	}

	# parameters which are pathnames
	our $project = $input_params{'project'};
	if (defined $project) {
		if (!validate_project($project)) {
			# make sure the error page does not refer to the bogus project
			undef $project;
			die_error(404, "No such project");
		}
	}

	our $project_filter = $input_params{'project_filter'};
	if (defined $project_filter) {
		if (!validate_pathname($project_filter)) {
			die_error(404, "Invalid project_filter parameter");
		}
	}

	our $file_name = $input_params{'file_name'};
	if (defined $file_name) {
		if (!validate_pathname($file_name)) {
			die_error(400, "Invalid file parameter");
		}
	}

	our $file_parent = $input_params{'file_parent'};
	if (defined $file_parent) {
		if (!validate_pathname($file_parent)) {
			die_error(400, "Invalid file parent parameter");
		}
	}

	# parameters which are refnames
	our $hash = $input_params{'hash'};
	if (defined $hash) {
		if (!validate_refname($hash)) {
			die_error(400, "Invalid hash parameter");
		}
	}

	our $hash_parent = $input_params{'hash_parent'};
	if (defined $hash_parent) {
		if (!validate_refname($hash_parent)) {
			die_error(400, "Invalid hash parent parameter");
		}
	}

	our $hash_base = $input_params{'hash_base'};
	if (defined $hash_base) {
		if (!validate_refname($hash_base)) {
			die_error(400, "Invalid hash base parameter");
		}
	}

	# extra_options can (currently) only be set from CGI, where it is stored
	# as an array reference; fall back to an empty list so that a missing
	# entry does not abort with a dereference error
	our @extra_options = @{ $input_params{'extra_options'} || [] };
	foreach my $opt (@extra_options) {
		if (not exists $allowed_options{$opt}) {
			die_error(400, "Invalid option parameter");
		}
		# the action may be undefined at this point (it can be left for
		# dispatch to work out), in which case no option is acceptable;
		# compare with 'eq' instead of interpolating it into a regexp
		if (not (defined $action &&
		         grep { $_ eq $action } @{$allowed_options{$opt}})) {
			die_error(400, "Invalid option parameter for this action");
		}
	}

	our $hash_parent_base = $input_params{'hash_parent_base'};
	if (defined $hash_parent_base) {
		if (!validate_refname($hash_parent_base)) {
			die_error(400, "Invalid hash parent base parameter");
		}
	}

	# other parameters
	our $page = $input_params{'page'};
	if (defined $page) {
		if ($page =~ m/[^0-9]/) {
			die_error(400, "Invalid page parameter");
		}
	}

	our $searchtype = $input_params{'searchtype'};
	if (defined $searchtype) {
		if ($searchtype =~ m/[^a-z]/) {
			die_error(400, "Invalid searchtype parameter");
		}
	}

	our $search_use_regexp = $input_params{'search_use_regexp'};

	our $searchtext = $input_params{'searchtext'};
	# reset explicitly: like every other parameter, it must not keep the
	# value of a previous request when this one has no search text
	our $search_regexp = undef;
	if (defined $searchtext) {
		if (length($searchtext) < 2) {
			die_error(403, "At least two characters are required for search parameter");
		}
		if ($search_use_regexp) {
			$search_regexp = $searchtext;
			# compile once just to find out whether the regexp is valid
			if (!eval { qr/$search_regexp/; 1; }) {
				# strip the "at FILE line N" location from the message
				(my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
				die_error(400, "Invalid search regexp '$search_regexp'",
				          esc_html($error));
			}
		} else {
			$search_regexp = quotemeta $searchtext;
		}
	}
}
1096
# path to the current git repository
our $git_dir;

# Set $git_dir to the repository of the current $project (a path below
# $projectroot), or to undef when the request has no project.
#
# The value is always assigned: with a conditional assignment
# ("... if $project") a process that serves several requests would keep
# the $git_dir of the previous request for a request without project.
sub evaluate_git_dir {
	our $git_dir = $project ? "$projectroot/$project" : undef;
}
1102
our (@snapshot_fmts, $git_avatar);

# Work out the per-request feature settings kept in global variables:
# - @snapshot_fmts: the 'snapshot' feature value passed through
#   filter_snapshot_fmts()
# - $git_avatar: the 'avatar' feature value, or the empty string if it is
#   not a known provider or the provider's dependencies are not met
sub configure_gitweb_features {
	our (@snapshot_fmts, $git_avatar);

	# list of supported snapshot formats
	@snapshot_fmts = gitweb_get_feature('snapshot');
	@snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

	# the avatar feature must name a known provider, and the modules that
	# provider depends on must be loadable
	($git_avatar) = gitweb_get_feature('avatar');
	my $provider_usable =
		  $git_avatar eq 'gravatar' ? eval { require Digest::MD5; 1; }
		: $git_avatar eq 'picon'    ? 1   # no dependencies
		:                             0;  # unknown provider name
	$git_avatar = '' unless $provider_usable;
}
1122
# custom error handler: 'die <message>' is Internal Server Error
#
# Registered with CGI::Carp via set_message() below; receives the error
# message, which is already HTML escaped, and renders it with die_error().
sub handle_errors_html {
	my ($msg) = @_; # it is already HTML escaped

	# switch back to a plain message handler first: should an error occur
	# inside die_error itself, this subroutine must not be entered again
	# (that would loop forever)
	set_message("Error occured when inside die_error:\n$msg");

	# the subroutine set via CGI::Carp::set_message is called _after_
	# HTTP headers are already written, so die_error must not write them
	# itself; and since you cannot jump out of die_error when called as
	# error handler, it is told that it runs as one
	my @handler_opts = (-error_handler => 1, -no_http_header => 1);
	die_error(undef, undef, $msg, @handler_opts);
}
set_message(\&handle_errors_html);
1137
# dispatch
#
# Run the handler of the requested action.  When no action was given, one
# is chosen from the other parameters: the type of the object named by
# $hash, or by "$hash_base:$file_name", else 'summary' if there is a
# project and 'project_list' if there is none.
sub dispatch {
	unless (defined $action) {
		if (defined $hash) {
			$action = git_get_type($hash)
				or die_error(404, "Object does not exist");
		} elsif (defined $hash_base && defined $file_name) {
			$action = git_get_type("$hash_base:$file_name")
				or die_error(404, "File or directory does not exist");
		} else {
			$action = defined $project ? 'summary' : 'project_list';
		}
	}

	die_error(400, "Unknown action")
		unless defined($actions{$action});

	# every action except these three works on a project
	my $needs_project = $action !~ m/^(?:opml|project_list|project_index)$/;
	die_error(400, "Project needed")
		if $needs_project && !$project;

	$actions{$action}->();
}
1162
# Restart the per-request statistics: the start time $t0 (only if timing is
# in use, i.e. $t0 is defined) and the counter of git commands run.
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	if (defined $t0) {
		$t0 = [ gettimeofday() ];
	}
	$number_of_git_cmds = 0;
}
1168
our $first_request = 1;

# Serve a single request: (re)read configuration as needed, check the
# server load, collect and validate the input parameters, and dispatch to
# the requested action.
sub run_request {
	reset_timer();

	evaluate_uri();

	# configuration and git version are read once, on the first request
	if ($first_request) {
		evaluate_gitweb_config();
		evaluate_git_version();
	}
	# $per_request_config is either a subroutine to run on every request,
	# or a true value asking for the config to be re-read on every request
	# (the first request has just read it above)
	if (ref($per_request_config) eq 'CODE') {
		$per_request_config->();
	} elsif ($per_request_config && !$first_request) {
		evaluate_gitweb_config();
	}
	check_loadavg();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list = $projectroot
		unless $projects_list;

	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1199
# State of the request loop in run():
# - $is_last_request: called after every request, true when the loop
#   should end (by default after the first request)
# - the *_hook variables: optional subroutines called before listening
#   and before/after each request
# - $CGI: name of the class used to create request objects
# - $cgi: the current request object
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: request objects are created by CGI::Fast
# (loaded here), and the request loop keeps going for 100 requests.
sub configure_as_fcgi {
	require CGI::Fast;
	our $CGI = 'CGI::Fast';

	my $request_number = 0;
	# let each child service 100 requests: the check runs after a request
	# has been served, so the loop has to end once the counter reaches 100
	# (with '> 100' the child would serve 101 requests)
	our $is_last_request = sub { ++$request_number >= 100 };
}
# Configure the mode of operation from the script name and the command
# line:
# - a script name ending in '.fcgi', or the --fastcgi option (also --fcgi
#   and -f), selects FastCGI operation
# - --nproc=N (also -n) sets up FCGI::ProcManager with N processes, if
#   that module can be loaded; otherwise the option is ignored
sub evaluate_argv {
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return unless (@ARGV);

	# handler of the nproc option: hook the process manager into the
	# request loop
	my $use_proc_manager = sub {
		my ($option_name, $n_processes) = @_;
		return unless eval { require FCGI::ProcManager; 1; };

		my $proc_manager = FCGI::ProcManager->new({
			n_processes => $n_processes,
		});
		our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
		our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
		our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i'      => $use_proc_manager,
	);
}
1234
# Main loop: evaluate the command line, then create request objects of
# class $CGI and serve them with run_request() until there are no more
# requests or $is_last_request says to stop.  The optional hooks are called
# before the first request is awaited and around every request.
sub run {
	evaluate_argv();

	$first_request = 1;
	$pre_listen_hook and $pre_listen_hook->();

 REQUEST:
	while ($cgi = $CGI->new()) {
		$pre_dispatch_hook and $pre_dispatch_hook->();

		run_request();

		$post_dispatch_hook and $post_dispatch_hook->();
		$first_request = 0;

		if ($is_last_request->()) {
			last REQUEST;
		}
	}

	# this label is kept at the very end of the subroutine
 DONE_GITWEB:
	1;
}
1259
run();

# When there is a caller, the script is wrapped in a subroutine processing
# requests (e.g. mod_perl with ModPerl::Registry, or PSGI with
# Plack::App::WrapCGI) and control goes back to it; otherwise this is a
# pure CGI script, serving single request, and the process ends here.
return if defined caller;
exit;
1270
1271 ## ======================================================================
1272 ## action links
1273
# Build a gitweb URL from parameters given as name => value pairs, where
# the names are the long parameter names of %cgi_param_mapping ('project'
# defaults to the current $project).  Parameters are put into the PATH_INFO
# part of the URL where possible (if enabled, see -path_info), the rest
# goes into the query string; a value that is an array reference yields one
# query entry per element.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# Returns the URL as a string.
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	# implicit -replay, must be first of implicit params
	$params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		# take over every parameter of the current request that was not
		# given explicitly
		while (my ($name, $symbol) = each %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_path_info($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot;
		# the action may be missing, so check before comparing
		my $is_snapshot = defined $params{'action'} &&
		                  $params{'action'} eq 'snapshot';

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_path_info($params{'action'})
				unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
			|| $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_path_info($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# a name containing '..' is left for the query string
						$href .= ":/".esc_path_info($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_path_info($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_path_info($params{'hash_base'});
			# a name containing '..' is left for the query string
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_path_info($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_path_info($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly; this walks the ordered list
	# (not the hash), so that the query string has a stable order
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	# final transformation: trailing spaces must be escaped (URI-encoded)
	$href =~ s/(\s+)$/CGI::escape($1)/e;

	if ($params{-anchor}) {
		$href .= "#".esc_param($params{-anchor});
	}

	return $href;
}
1403
1404
1405 ## ======================================================================
1406 ## validation, quoting/unquoting and escaping
1407
# Return the given action name if it is one of the known %actions,
# undef otherwise (also for a missing or false name).
sub validate_action {
	my ($name) = @_;

	return undef unless $name;
	return exists $actions{$name} ? $name : undef;
}
1413
# Return the given project name if it may be shown, undef otherwise.
# A project is accepted when its name is a valid pathname, it is a
# directory below $projectroot, check_export_ok() agrees, and - with
# $strict_export set - it is in the list of projects.
sub validate_project {
	my ($name) = @_;
	return undef unless $name;

	my $project_path = "$projectroot/$name";

	return undef unless validate_pathname($name);
	return undef unless -d $project_path;
	return undef unless check_export_ok($project_path);
	return undef if $strict_export && !project_in_list($name);

	return $name;
}
1425
# Return the given pathname if it is acceptable, undef otherwise.
# NOTE(review): the truthiness test below also rejects the name "0";
# callers test the return value for truth, so this cannot be changed
# without changing what the function returns.
sub validate_pathname {
	my ($path) = @_;
	return undef unless $path;

	# no '.' or '..' as elements of path, i.e. no '.' nor '..'
	# at the beginning, at the end, and between slashes.
	# also this catches doubled slashes
	my $has_bad_element = ($path =~ m!(^|/)(|\.|\.\.)(/|$)!);

	# no null characters
	my $has_null = ($path =~ m!\0!);

	return ($has_bad_element || $has_null) ? undef : $path;
}
1441
# Return the given ref name if it is acceptable, undef otherwise.
# Accepted are 40 hexadecimal digits, and valid pathnames that do not
# break the restrictions checked below.
sub validate_refname {
	my ($ref) = @_;
	return undef unless $ref;

	# textual hashes are O.K.
	return $ref if $ref =~ m/^[0-9a-fA-F]{40}$/;

	# it must be correct pathname
	$ref = validate_pathname($ref);
	return undef unless $ref;

	# restrictions on ref name according to git-check-ref-format
	my $breaks_ref_format = ($ref =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!);

	return $breaks_ref_format ? undef : $ref;
}
1458
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# A string that is already flagged as utf8 is returned as it is; octets
# that are not valid utf8 are decoded using $fallback_encoding instead.
# Returns undef for an undefined argument.
sub to_utf8 {
	my ($text) = @_;
	return undef unless defined $text;

	# already in internal form
	return $text if utf8::is_utf8($text);

	# utf8::decode() converts in place and is true on success
	return $text if utf8::decode($text);

	return decode($fallback_encoding, $text, Encode::FB_DEFAULT);
}
1472
# Escape a value for use as a CGI query parameter.
# Unsafe characters are percent-encoded via CGI::escape and spaces become
# '+'.  The slash is deliberately left alone, even though that is not
# strictly correct: quoted slashes look too horrible in bookmarks.
# Returns undef for undefined input.
sub esc_param {
	my ($param) = @_;
	return undef unless defined $param;

	$param =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$param =~ tr/ /+/;
	return $param;
}
1482
# Escape a string for use in the path_info part of a URL.
# The rules differ slightly from esc_param: path_info does not treat '+'
# as a space, so both ' ' and '+' are passed through unchanged, while
# characters outside the allowed set (such as '?') are percent-encoded
# via CGI::escape.  Returns undef for undefined input.
sub esc_path_info {
	my ($fragment) = @_;

	if (defined $fragment) {
		$fragment =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;
		return $fragment;
	}
	return undef;
}
1493
# Escape unsafe characters in a whole URL.  Because the argument is a
# complete URL, its structural characters (';', '/', '?', ':', '@', '&',
# '=') are left unquoted; spaces become '+'.
# Returns undef for undefined input.
sub esc_url {
	my ($url) = @_;
	return undef unless defined $url;

	$url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$url =~ tr/ /+/;
	return $url;
}
1502
# Quote unsafe characters for use inside an HTML attribute value.
#
# For XHTML conformance escaping '"' to '&quot;' is not enough, so the
# string gets the same treatment as in esc_html: decoding with to_utf8,
# CGI's escapeHTML, optional '-nbsp' handling, and replacement of control
# characters other than tab.  Unlike esc_html, control characters are
# replaced by their plain escape text (quot_cec with -nohtml): an
# attribute value cannot contain a <span> element, and the double quotes
# of that markup would end the attribute early.
#
# Parameters: the string, followed by optional key/value options
#             (-nbsp => 1 turns spaces into &nbsp;).
# Returns:    the escaped string, or undef for undefined input.
sub esc_attr {
	my ($str, %opts) = @_;

	return undef unless defined $str;

	$str = to_utf8($str);
	$str = $cgi->escapeHTML($str);
	if ($opts{'-nbsp'}) {
		$str =~ s/ /&nbsp;/g;
	}
	$str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1, -nohtml => 1) : $1)|eg;
	return $str;
}
1509
# Escape a string for inclusion in HTML text.
# The string is decoded with to_utf8, run through CGI's escapeHTML, and
# every control character except tab is replaced by the markup produced
# by quot_cec.  With the option -nbsp => 1 spaces become &nbsp;.
# Returns undef for undefined input.
sub esc_html {
	my ($text, %opts) = @_;

	return undef unless defined $text;

	my $html = to_utf8($text);
	$html = $cgi->escapeHTML($html);
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};

	# tabs are kept literally; other control characters are made visible
	$html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;
	return $html;
}
1525
# Escape a filename for inclusion in HTML text.
# Works like esc_html, except that every control character -- tab
# included -- is replaced by the markup produced by quot_cec.
# With the option -nbsp => 1 spaces become &nbsp;.
# Returns undef for undefined input.
sub esc_path {
	my ($path, %opts) = @_;

	return undef unless defined $path;

	my $html = to_utf8($path);
	$html = $cgi->escapeHTML($html);
	$html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$html =~ s|([[:cntrl:]])|quot_cec($1)|eg;
	return $html;
}
1541
# Sanitize for use in XHTML + application/xml+xhtml (valid XML 1.0).
#
# The string is decoded with to_utf8; tab, line feed and carriage return
# are kept as they are, and every other control character is replaced by
# the markup produced by quot_cec.
# Returns undef for undefined input.
sub sanitize {
	my $str = shift;

	return undef unless defined $str;

	$str = to_utf8($str);
	# Use index() rather than a nested pattern match to test for the
	# allowed characters: a successful inner match would reset $1, and
	# the character that was meant to be kept would be lost.
	$str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
	return $str;
}
1552
# Make control characters "printable", using character escape codes (CEC).
#
# Parameters: a single control character, followed by optional key/value
#             options; -nohtml => 1 returns the bare escape text.
# Returns:    the escape text, wrapped in <span class="cntrl">...</span>
#             unless -nohtml is set.
# Characters without a named escape are shown as a backslash followed by
# their two-digit, zero-padded hexadecimal code.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# %02x (not %2x): codes below 0x10 must be zero-padded, otherwise
	# e.g. chr(1) would be rendered as backslash, space, '1'
	my $chr = ( (exists $es{$cntrl})
		    ? $es{$cntrl}
		    : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1577
# Alternatively use Unicode control pictures codepoints,
# Unicode "printable representation" (PR).
#
# Parameters: a single control character, followed by optional key/value
#             options; -nohtml => 1 returns the bare character reference.
# Returns:    a decimal numeric character reference, wrapped in
#             <span class="cntrl">...</span> unless -nohtml is set.
sub quot_upr {
	my $cntrl = shift;
	my %opts = @_;

	my $code = ord($cntrl);
	# The pictures for the C0 controls sit at 0x2400 + code, but the
	# picture for DEL (0x7f) is U+2421, not 0x2400 + 0x7f.
	my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

	my $chr = sprintf('&#%04d;', $picture);
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1591
# Translate the body of one backslash escape (the text after the
# backslash) into the character it stands for.  Used by unquote.
sub unq {
	my ($seq) = @_;
	my %char_for = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# octal char sequence
	return chr(oct($seq)) if ($seq =~ m/^[0-7]{1,3}$/);

	# C escape sequence (character escape code), or else a quoted
	# ordinary character, which stands for itself
	return (exists $char_for{$seq}) ? $char_for{$seq} : $seq;
}

# git may return quoted and escaped filenames.
# A string enclosed in double quotes has the quotes removed and its
# backslash escapes expanded; any other string is returned unchanged.
sub unquote {
	my ($name) = @_;

	# only names wrapped in double quotes need unquoting
	return $name unless ($name =~ m/^"(.*)"$/);

	my $inner = $1;
	$inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	return $inner;
}
1627
# Expand tabs into spaces, using tab stops at every 8th column.
# Returns the expanded line.
sub untabify {
	my ($line) = @_;

	# Handle one tab at a time, leftmost first, so that the position of
	# each later tab already reflects the expansion of the earlier ones.
	while ((my $tab_at = index($line, "\t")) != -1) {
		my $width = 8 - ($tab_at % 8);   # always between 1 and 8
		substr($line, $tab_at, 1, ' ' x $width);
	}

	return $line;
}
1641
# Tell whether $project appears in the list returned by
# git_get_projects_list().  Returns the number of list entries whose
# 'path' equals $project (0 when the list is empty or nothing matches).
sub project_in_list {
	my ($project) = @_;
	my @projects = git_get_projects_list();

	return 0 unless @projects;

	my $hits = grep { $_->{'path'} eq $project } @projects;
	return $hits;
}
1647
1648 ## ----------------------------------------------------------------------
1649 ## HTML aware string manipulation
1650
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Parameters: $str     - string to shorten
#             $len     - number of characters to keep
#             $add_len - extra word characters allowed (default 10)
#             $where   - 'left', 'center' or 'right' (default 'right'):
#                        which part of the string is chopped off
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right'; # 'left' | 'center' | 'right'

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# return early if chopping wouldn't make the string shorter;
	# the filler is 5 characters long in the middle, 4 at either end
	my $centered   = ($where eq 'center');
	my $filler_len = $centered ? 5 : 4;
	return $str if ($len + $filler_len >= length($str));

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if $centered;

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	if ($where eq 'left') {
		$str =~ m/^(.*?)($begre)$/;
		my ($lead, $kept) = ($1, $2);
		$lead = " ..." if (length($lead) > 4);
		return $lead . $kept;
	}

	if ($centered) {
		$str =~ m/^($endre)(.*)$/;
		my ($head, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($gap, $end) = ($1, $2);
		$gap = " ... " if (length($gap) > 5);
		return $head . $gap . $end;
	}

	# default: keep the beginning, chop on the right
	$str =~ m/^($endre)(.*)$/;
	my ($kept, $tail) = ($1, $2);
	$tail = "... " if (length($tail) > 4);
	return $kept . $tail;
}
1710
# Takes the same arguments as chop_str and returns the HTML-escaped,
# possibly shortened string.  If chopping changed the string, the result
# is wrapped in a <span> whose title attribute holds the full string,
# with control characters replaced by '?'.
sub chop_and_escape_str {
	my ($full) = @_;

	my $short = chop_str(@_);
	$full = to_utf8($full);

	# nothing was chopped: no title needed
	return esc_html($short) if ($short eq $full);

	$full =~ s/[[:cntrl:]]/?/g;
	return $cgi->span({-title=>$full}, esc_html($short));
}
1726
# Highlight selected fragments of string, using given CSS class,
# and escape HTML.  It is assumed that fragments do not overlap.
# Regions are passed as list of pairs (array references); any other
# trailing arguments are taken as options and handed on to esc_html.
#
# Example: esc_html_hl_regions("foobar", "mark", [ 0, 3 ]) returns
# '<span class="mark">foo</span>bar'
sub esc_html_hl_regions {
	my ($str, $css_class, @args) = @_;

	# separate the [begin, end] regions from the esc_html options
	my (@regions, @opt_list);
	for my $arg (@args) {
		if (ref($arg) eq 'ARRAY') {
			push @regions, $arg;
		} else {
			push @opt_list, $arg;
		}
	}
	my %opts = @opt_list;
	return esc_html($str, %opts) unless @regions;

	my $out = '';
	my $pos = 0;   # end of the previously emitted region

	for my $region (@regions) {
		my ($begin, $end) = @$region;

		# Don't create empty <span> elements.
		next if $end <= $begin;

		my $marked = esc_html(substr($str, $begin, $end - $begin),
		                      %opts);

		# plain text between the previous region and this one
		if ($begin - $pos > 0) {
			$out .= esc_html(substr($str, $pos, $begin - $pos), %opts);
		}
		$out .= $cgi->span({-class => $css_class}, $marked);

		$pos = $end;
	}

	# plain text after the last region
	if ($pos < length($str)) {
		$out .= esc_html(substr($str, $pos), %opts);
	}

	return $out;
}
1762
# Return the positions of the beginning and end of each match of
# $regexp in $str, as a list of [ begin, end ] array references.
# Returns nothing when either argument is undefined.
sub matchpos_list {
	my ($str, $regexp) = @_;
	return unless (defined $str && defined $regexp);

	my @spans;
	# $-[0] and $+[0] are the start and end offsets of the whole match
	push @spans, [ $-[0], $+[0] ]
		while ($str =~ /$regexp/g);

	return @spans;
}
1774
# Escape HTML in $str and highlight every match of $regexp (if any)
# with the CSS class 'match'.  Without a regexp, or without matches,
# the string is only escaped.
sub esc_html_match_hl {
	my ($str, $regexp) = @_;

	my @hits = (defined $regexp) ? matchpos_list($str, $regexp) : ();

	return @hits
		? esc_html_hl_regions($str, 'match', @hits)
		: esc_html($str);
}
1785
1786
# Highlight match (if any) of shortened string, and escape HTML.
# $str is the full string, $chopped its shortened form (see chop_str)
# and $regexp the pattern to highlight.  Matches are located in the full
# string and then mapped onto the shortened one; a match that lies in,
# or reaches into, the chopped-off part is shown by marking the trailing
# "... " filler.
sub esc_html_match_hl_chopped {
	my ($str, $chopped, $regexp) = @_;
	return esc_html_match_hl($str, $regexp) unless defined $chopped;

	my @matches = matchpos_list($str, $regexp);
	return esc_html($chopped) unless @matches;

	# split the chopped string into kept text and filler
	my $tail = "... "; # see chop_str
	$tail = '' unless ($chopped =~ s/\Q$tail\E$//);

	my $chop_len = length($chopped);
	my $mark_end = $chop_len + length($tail);
	my @filtered;

	# filter matches so that we mark chopped string
	for my $m (@matches) {
		my ($from, $to) = @$m;

		if ($from > $chop_len) {
			# match lies entirely in the chopped-off part:
			# mark the filler, if there is one
			push @filtered, [ $chop_len, $mark_end ]
				if ($mark_end > $chop_len);
			last;
		}
		if ($to > $chop_len) {
			# match straddles the cut: extend it over the filler
			push @filtered, [ $from, $mark_end ];
			last;
		}
		push @filtered, $m;
	}

	return esc_html_hl_regions($chopped . $tail, 'match', @filtered);
}
1817
1818 ## ----------------------------------------------------------------------
1819 ## functions returning short strings
1820
# CSS class for given age value (in seconds):
# "noage" for an undefined age, "age0" below two hours,
# "age1" below two days, "age2" for anything older.
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if ($age < 60*60*2);
	return "age1"  if ($age < 60*60*24*2);
	return "age2";
}
1835
# Convert age in seconds to "nn units ago" string.
#
# The largest unit of which the age holds more than two is used (years,
# months, weeks, days, hours, min, sec); the count is truncated to an
# integer.  An age of two seconds or less gives "right now".
sub age_string {
	my ($age) = @_;

	if ($age > 60*60*24*365*2) {
		return int($age/60/60/24/365) . " years ago";
	} elsif ($age > 60*60*24*(365/12)*2) {
		return int($age/60/60/24/(365/12)) . " months ago";
	} elsif ($age > 60*60*24*7*2) {
		return int($age/60/60/24/7) . " weeks ago";
	} elsif ($age > 60*60*24*2) {
		return int($age/60/60/24) . " days ago";
	} elsif ($age > 60*60*2) {
		return int($age/60/60) . " hours ago";
	} elsif ($age > 60*2) {
		return int($age/60) . " min ago";
	} elsif ($age > 2) {
		return int($age) . " sec ago";
	}

	# no count to prefix here, so no leading space either
	return "right now";
}
1867
# File-type bit patterns (octal) used in addition to those from Fcntl.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;
1872
# Tell whether a (numeric) file mode denotes a submodule/subproject,
# i.e. a commit object reference: true when the file-type bits of
# $mode equal S_IFGITLINK.
sub S_ISGITLINK {
	my ($mode) = @_;

	my $type_bits = ($mode & S_IFMT());
	return ($type_bits == S_IFGITLINK);
}
1879
# Convert file mode in octal to symbolic file mode string
# (ls -l style; 'm---------' is used for submodules).
sub mode_str {
	my ($octal) = @_;
	my $mode = oct $octal;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
	return 'lrwxrwxrwx' if S_ISLNK($mode);

	if (S_ISREG($mode)) {
		# git cares only about the executable bit
		return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
	}

	return '----------';
}
1901
# Convert file mode in octal to file type string: "submodule",
# "directory", "symlink", "file" or "unknown".  An argument that is not
# a string of octal digits is returned unchanged.
sub file_type {
	my ($mode) = @_;

	return $mode if ($mode !~ m/^[0-7]+$/);
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT());
	return "symlink"   if S_ISLNK($mode);
	return "file"      if S_ISREG($mode);
	return "unknown";
}
1924
# Convert file mode in octal to file type description string.
# Like file_type, but a regular file with the owner-executable bit set
# is reported as "executable".  An argument that is not a string of
# octal digits is returned unchanged.
sub file_type_long {
	my ($mode) = @_;

	return $mode if ($mode !~ m/^[0-7]+$/);
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT());
	return "symlink"   if S_ISLNK($mode);

	if (S_ISREG($mode)) {
		return ($mode & S_IXUSR) ? "executable" : "file";
	}

	return "unknown";
}
1951
1952
1953 ## ----------------------------------------------------------------------
1954 ## functions returning short HTML fragments, or transforming HTML fragments
1955 ## which don't belong to other sections
1956
# Format one line of a commit message as HTML: the line is escaped
# (spaces become &nbsp;) and every run of 8 to 40 hexadecimal digits
# standing on its own is turned into a link to the "object" action for
# that hash.
sub format_log_line_html {
	my ($line) = @_;

	my $html = esc_html($line, -nbsp=>1);
	$html =~ s{\b([0-9a-fA-F]{8,40})\b}{
		my $hash_text = $1;
		$cgi->a({-href => href(action=>"object", hash=>$hash_text),
					-class => "text"}, $hash_text);
	}eg;

	return $html;
}
1969
# Format marker of refs pointing to given object.
#
# $refs maps object ids to array references of ref names; $id is the
# object to produce markers for.  Returns an HTML fragment (a "refs"
# span containing one span per ref), or "" when nothing points to $id.
#
# The destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;

	return "" unless defined $refs->{$id};

	my $markers = '';
	foreach my $ref (@{$refs->{$id}}) {
		# This code exploits the fact that non-lightweight tags are the
		# only indirect objects, and that they are the only objects for
		# which we want to use tag instead of shortlog as action.
		# Note: $ref aliases the entry stored in $refs, so the "^{}"
		# suffix is removed from the stored name as well.
		my $indirect = ($ref =~ s/\^\{\}$//);

		# e.g. tags/v2.6.11 or heads/next
		my ($type, $name);
		if ($ref =~ m!^(.*?)s?/(.*)$!) {
			($type, $name) = ($1, $2);
		} else {
			($type, $name) = ("ref", $ref);
		}

		my $class = $indirect ? "$type indirect" : $type;

		my $dest_action;
		if ($indirect) {
			$dest_action = ($action eq "tag") ? "shortlog" : "tag";
		} elsif ($action =~ /^(history|(short)?log)$/) {
			$dest_action = $action;
		} else {
			$dest_action = "shortlog";
		}

		my $dest = ($ref =~ m!^refs/!) ? $ref : "refs/" . $ref;

		my $link = $cgi->a({
			-href => href(
				action=>$dest_action,
				hash=>$dest
			)}, $name);

		$markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
			$link . "</span>";
	}

	return $markers ? ' <span class="refs">'. $markers . '</span>' : "";
}
2029
# Format title line, perhaps shortened and with markers.
#
# $long is the full subject, $short its possibly shortened form, $href
# the link target and $extra optional HTML appended after the link.
# When $short is shorter than $long, the link shows $short and carries
# the full subject (control characters replaced by '?') as its title.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr = (-href => $href, -class => "list subject");
	my $shown = $long;

	if (length($short) < length($long)) {
		$long =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($long);
		$shown = $short;
	}

	return $cgi->a(\%attr, esc_html($shown)) . $extra;
}
2045
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is keyed by the lowercased email address and is shared by all
# avatar engines (gravatar and picon), which are free to use it as preferred.
# Since only one avatar engine is used for any given page, there's no risk
# for cache conflicts.
our %avatar_cache = ();
2053
# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first; the resulting url is kept in
# %avatar_cache and reused on later calls.
sub picon_url {
	my ($address) = @_;
	my $email = lc $address;

	unless ($avatar_cache{$email}) {
		my ($user, $domain) = split('@', $email);
		$avatar_cache{$email} = join('',
			"http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/",
			"$domain/$user/",
			"users+domains+unknown/up/single");
	}
	return $avatar_cache{$email};
}
2067
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
# The email is lowercased before it is hashed; $size is appended as the
# value of the "s" query parameter.
sub gravatar_url {
	my ($address, $size) = @_;
	my $email = lc $address;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
			Digest::MD5::md5_hex($email) . "?s=";
	}
	return $avatar_cache{$email} . $size;
}
2080
# Return the <img> element showing the avatar for the given $email, or
# an empty string when no avatar provider is selected in $git_avatar.
#
# Options: -size       => key into %avatar_size (default 'default')
#          -pad_before => true to put &nbsp; before the image
#          -pad_after  => true to put &nbsp; after the image
sub git_get_avatar {
	my ($email, %opts) = @_;
	my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
	my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
	$opts{-size} ||= 'default';
	my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

	# Other providers can be added by extending this chain, defining $url
	# as needed. If no variant puts something in $url, we assume avatars
	# are completely disabled/unavailable.
	my $url = ($git_avatar eq 'gravatar') ? gravatar_url($email, $size)
	        : ($git_avatar eq 'picon')    ? picon_url($email)
	        :                               "";

	return "" unless $url;

	return $pre_white .
	       qq{<img width="$size" class="avatar" src="} .
	       esc_url($url) .
	       qq{" alt="" />} .
	       $post_white;
}
2109
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype ('author' or 'committer') selects the kind of search and
# the wording of the link title.  When the 'search' feature is not
# enabled, $displaytext is returned as it is.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;

	return $displaytext unless gitweb_check_feature('search');

	my $performed = ($searchtype eq 'author')    ? "authored"
	              : ($searchtype eq 'committer') ? "committed"
	              :                                "";

	my $target = href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype);

	return $cgi->a({-href => $target, class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
2132
# Format the author name of the given commit with the given tag.
# The author name is chopped and escaped according to the other
# optional parameters (see chop_str), preceded by the author's avatar,
# and wrapped in an author search link (see format_search_author).
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $name   = $co->{'author_name'};
	my $author = chop_and_escape_str($name, @chop_args);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);

	return "<$tag class=\"author\">" .
	       format_search_author($name, "author", $avatar . $author) .
	       "</$tag>";
}
2146
# Format git diff header line, i.e. "diff --(git|combined|cc) ...".
#
# The file names at the end of $line are replaced by escaped names taken
# from $from and $to, each linked to its 'href' when it has one.
# $diffinfo->{'nparents'} being true marks a combined diff, which shows
# only the "to" name; an ordinary diff shows "a/<from> b/<to>".
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# escaped, prefixed file name of one side; a link if the side has
	# an href (a file that was added or deleted has none)
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $label = $prefix . esc_path($side->{'file'});
		return $label unless $side->{'href'};
		return $cgi->a({-href => $side->{'href'}, -class => "path"},
		               $label);
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2182
# Format extended diff header line, before patch itself.
#
# $line is one extended header line; $diffinfo, $from and $to describe
# the diff it belongs to.  Depending on what the line contains:
#  - "copy/rename from|to <path>": the path is replaced by a link built
#    from $from / $to (when that side has an href)
#  - a line ending in a six-digit mode gets the file type description
#    appended
#  - "index <hash>,<hash>..." (combined diff) and "index <hash>..<hash>"
#    (ordinary diff): the hashes are replaced by 7-character
#    abbreviations linked to the blobs, or by '0000000' for a side
#    without an href
# Returns the formatted line followed by "<br/>\n".
sub format_extended_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
		                 esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                 esc_path($to->{'file'}));
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		my @parent_links;
		for my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $link;
			if ($from->{'href'}[$i]) {
				$link = $cgi->a({-href=>$from->{'href'}[$i],
				                 -class=>"hash"},
				                substr($diffinfo->{'from_id'}[$i],0,7));
			} else {
				$link = '0' x 7;
			}
			push @parent_links, $link;
		}
		$line = 'index ' . join(',', @parent_links) . '..';
		if ($to->{'href'}) {
			$line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                 substr($diffinfo->{'to_id'},0,7));
		} else {
			$line .= '0' x 7;
		}

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff; the two dots are matched
		# literally, not as "any two characters"
		my ($from_link, $to_link);
		if ($from->{'href'}) {
			$from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
			                     substr($diffinfo->{'from_id'},0,7));
		} else {
			$from_link = '0' x 7;
		}
		if ($to->{'href'}) {
			$to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
			                   substr($diffinfo->{'to_id'},0,7));
		} else {
			$to_link = '0' x 7;
		}
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		# \Q...\E: the ids are data, not patterns
		$line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2248
# Format the from-file/to-file ("--- a/..." and "+++ b/...") header lines of
# a patch as HTML.
#
# $from_line and $to_line are the raw header lines; $diffinfo, $from and $to
# describe the compared files.  When $diffinfo->{'nparents'} is set (combined
# diff of a merge commit), $from->{'href'}, $from->{'file'} and
# $diffinfo->{'from_id'} are indexed per parent and @parents supplies the
# hash_parent_base for each per-parent "blobdiff" link.
#
# Returns one <div class="diff from_file"> per from-file line followed by a
# single <div class="diff to_file">.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my $result = '';

	#assert($from_line =~ m/^---/) if DEBUG;
	if ($diffinfo->{'nparents'}) {
		# combined diff (merge commit): one from-file line per parent
		foreach my $idx (0 .. $diffinfo->{'nparents'} - 1) {
			my $num = $idx + 1;
			my $from_html = '--- /dev/null';

			if ($from->{'href'}[$idx]) {
				# "<N>" links to the diff against parent N ...
				my $diff_link =
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$idx],
					                     hash_parent_base=>$parents[$idx],
					                     file_parent=>$from->{'file'}[$idx],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff$num"},
					        $num);
				# ... and the file name links to the file in that parent
				my $file_link =
					$cgi->a({-href=>$from->{'href'}[$idx], -class=>"path"},
					        esc_path($from->{'file'}[$idx]));
				$from_html = '--- ' . $diff_link . '/' . $file_link;
			}
			$result .= qq!<div class="diff from_file">$from_html</div>\n!;
		}

	} else {
		# ordinary (single parent) diff
		my $from_html = $from_line;
		# no extra formatting for "^--- /dev/null"
		if ($from_html =~ m!^--- "?a/!) {
			my $name = esc_path($from->{'file'});
			$from_html = '--- a/' .
				($from->{'href'}
					? $cgi->a({-href=>$from->{'href'}, -class=>"path"}, $name)
					: $name);
		}
		$result .= qq!<div class="diff from_file">$from_html</div>\n!;
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	my $to_html = $to_line;
	# no extra formatting for "^+++ /dev/null"
	if ($to_html =~ m!^\+\+\+ "?b/!) {
		my $name = esc_path($to->{'file'});
		$to_html = '+++ b/' .
			($to->{'href'}
				? $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $name)
				: $name);
	}
	$result .= qq!<div class="diff to_file">$to_html</div>\n!;

	return $result;
}
2314
# Create the note shown for a patch that combined diff simplified away:
# a "diff --cc <file>" header followed by a "Simple merge" notice.
# The file name is linked to its blob unless is_deleted() reports the file
# as deleted.  @parents is accepted but not used here.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $file_html;
	if (is_deleted($diffinfo)) {
		$file_html = esc_path($diffinfo->{'to_file'});
	} else {
		$file_html = $cgi->a({-href => href(action=>"blob",
		                                    hash_base=>$hash,
		                                    hash=>$diffinfo->{'to_id'},
		                                    file_name=>$diffinfo->{'to_file'}),
		                      -class => "path"},
		                     esc_path($diffinfo->{'to_file'}));
	}

	return join('',
		'<div class="diff header">', 'diff --cc ', $file_html, "</div>\n",
		'<div class="diff nodifferences">', 'Simple merge', "</div>\n");
}
2339
# Return the CSS class name for a line of patch body: "chunk_header",
# "incomplete", "ctx", "add", "rem", or "" when nothing matches.
# When $from->{'href'} is an array reference (combined diff) the number of
# leading sign columns equals the number of its elements; otherwise it is 1.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
		? scalar @{$from->{'href'}}   # combined diff
		: 1;                          # ordinary diff

	# Order matters: the context rule must come before the add/rem rules,
	# or we would have to use a more complicated regexp, for example
	# qr/(?= {0,$m}\+)[+ ]{$num_sign}/, where $m = $num_sign - 1;
	my @rules = (
		[ qr/^\@\@{$num_sign} /,  "chunk_header" ],
		[ qr/^\\/,                "incomplete"   ],
		[ qr/^ {$num_sign}/,      "ctx"          ],
		[ qr/^[+ ]{$num_sign}/,   "add"          ],
		[ qr/^[- ]{$num_sign}/,   "rem"          ],
	);
	foreach my $rule (@rules) {
		my ($regexp, $class) = @$rule;
		return $class if ($line =~ $regexp);
	}

	# fallback
	return "";
}
2368
# Format a unified diff chunk header ("@@ -a,b +c,d @@ section") as HTML.
# Assumes that $from and $to are defined and correctly filled, and that
# $line holds a chunk header line of a unified diff.
# Each range is linked to the "#l<start>" anchor of the corresponding file
# when that file has an 'href'; the trailing section text is escaped.
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# the line counts (3rd and 6th capture) are not needed for the output
	my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	$from_text = $cgi->a({-href=>$from->{'href'} . '#l' . $from_start,
	                      -class=>"list"}, $from_text)
		if ($from->{'href'});
	$to_text = $cgi->a({-href=>$to->{'href'} . '#l' . $to_start,
	                    -class=>"list"}, $to_text)
		if ($to->{'href'});

	return '<span class="chunk_info">@@ ' . $from_text . ' ' . $to_text . ' @@</span>' .
	       '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
}
2392
# Format a combined diff chunk header ("@@@ -a,b -c,d +e,f @@@ section")
# as HTML.
# Assumes that $from and $to are defined and correctly filled, and that
# $line holds a chunk header line of a combined diff.
# The last range belongs to the result ("to") file, all preceding ones to
# the parents; each is linked to "#l<start>" when an 'href' is available.
sub format_cc_diff_chunk_header {
	my ($line, $from, $to) = @_;

	my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

	# split into individual ranges and extract the start line of each one
	# (the leading '-' or '+' sign is dropped before splitting on ',')
	my @range_text = split(' ', $ranges);
	my @range_start;
	foreach my $text (@range_text) {
		my ($start) = (split(',', substr($text, 1)), 0);
		push @range_start, $start;
	}

	# the last range describes the "to" file
	my $to_text  = pop @range_text;
	my $to_start = pop @range_start;

	my @pieces = ($prefix);
	foreach my $idx (0 .. $#range_text) {
		my $piece = $range_text[$idx];
		if ($from->{'href'}[$idx]) {
			$piece = $cgi->a({-href=>$from->{'href'}[$idx] . '#l' . $range_start[$idx],
			                  -class=>"list"}, $range_text[$idx]);
		}
		push @pieces, $piece;
	}

	my $to_piece = $to_text;
	if ($to->{'href'}) {
		$to_piece = $cgi->a({-href=>$to->{'href'} . '#l' . $to_start,
		                     -class=>"list"}, $to_text);
	}
	push @pieces, $to_piece, $prefix;

	return '<span class="chunk_info">' . join(' ', @pieces) . '</span>' .
	       '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
}
2431
# Process a patch (diff) line (not to be used for diff headers), returning
# the line wrapped in <div class="diff [$diff_class]">.
# If the line is passed as a reference, it is treated as ready-made HTML
# and is not esc_html()'ed.  Otherwise it is chomped and untabified; chunk
# headers get their dedicated formatting when both $from and $to are given,
# and everything else is HTML-escaped.
sub format_diff_line {
	my ($line, $diff_class, $from, $to) = @_;

	my $html;
	if (ref($line)) {
		$html = $$line;
	} else {
		chomp $line;
		$line = untabify($line);

		my $have_files = ($from && $to);
		if ($have_files && $line =~ m/^\@{2} /) {
			$html = format_unidiff_chunk_header($line, $from, $to);
		} elsif ($have_files && $line =~ m/^\@{3}/) {
			$html = format_cc_diff_chunk_header($line, $from, $to);
		} else {
			$html = esc_html($line, -nbsp=>1);
		}
	}

	my $classes = $diff_class ? "diff $diff_class" : "diff";

	return qq!<div class="$classes">$html</div>\n!;
}
2460
# Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
# linked.  Pass the hash of the tree/commit to snapshot.
# Which form is produced depends on how many entries @snapshot_fmts has.
sub format_snapshot_links {
	my ($hash) = @_;

	# no snapshot formats at all: nothing to link to
	return undef unless @snapshot_fmts;

	if (@snapshot_fmts == 1) {
		# A single "snapshot" link whose tooltip bears the format name.
		# i.e. "_snapshot_"
		my ($fmt) = @snapshot_fmts;
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
			}, "snapshot");
	}

	# A parenthesized list of links bearing format names.
	# e.g. "snapshot (_tar.gz_ _zip_)"
	my @links;
	foreach my $fmt (@snapshot_fmts) {
		push @links,
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				)
			}, $known_snapshot_formats{$fmt}{'display'});
	}
	return "snapshot (" . join(' ', @links) . ")";
}
2495
2496 ## ......................................................................
2497 ## functions returning values to be passed, perhaps after some
2498 ## transformation, to other functions; e.g. returning arguments to href()
2499
# Returns a hash to be passed to href() to generate the gitweb feed URL for
# the current view; the -title key holds a description of the link.
# $format (default 'Atom') is lowercased to form the 'action'.
# Returns nothing when no project is selected, or when the current action
# has no specific feed.
sub get_feed_info {
	my $format = shift || 'Atom';
	my %res = (action => lc($format));

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branch refs use the 'refs/heads/' prefix (fullname) to differentiate
	# them from tag links; this also makes it possible to detect branch
	# links.  $hash_base takes precedence over $hash.
	my $branch;
	foreach my $ref ($hash_base, $hash) {
		next unless defined $ref;
		if ($ref =~ m!^refs/heads/(.*)$!) {
			$branch = $1;
			last;
		}
	}

	# find log type for feed description (title)
	my $type;
	if (defined $file_name) {
		$type  = "history of $file_name";
		$type .= "/" if ($action eq 'tree');
		$type .= " on '$branch'" if (defined $branch);
	} elsif (defined $branch) {
		$type = "log of $branch";
	} else {
		$type = 'log';
	}

	$res{-title} = $type;
	$res{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
	$res{'file_name'} = $file_name;

	return %res;
}
2535
2536 ## ----------------------------------------------------------------------
2537 ## git utility subroutines, invoking git commands
2538
# Returns, as a list, the path to the core git executable and the
# --git-dir parameter for the current $git_dir.
# Every call also bumps the $number_of_git_cmds counter.
sub git_cmd {
	$number_of_git_cmds += 1;
	return ($GIT, "--git-dir=" . $git_dir);
}
2544
# Quote the given arguments for passing them to the shell, joined by spaces:
# quote_command("command", "arg 1", "arg with ' and ! characters")
# => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $arg (@_) {
		# work on a copy so the caller's values are left untouched
		(my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$escaped'";
	}
	return join(' ', @quoted);
}
2553
# Get the HEAD ref of the given project as a full hash.
sub git_get_head_hash {
	my ($project) = @_;
	return git_get_full_hash($project, 'HEAD');
}
2558
# Resolve a revision of a project to its full hash.
# All arguments are handed to git_get_hash() unchanged.
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2562
# Resolve a revision of a project to an abbreviated hash.
# All arguments are handed to git_get_hash(), with '--short=7' appended.
sub git_get_short_hash {
	my @args = @_;
	return git_get_hash(@args, '--short=7');
}
2566
# Run "git rev-parse --verify -q [@options] $hash" in the repository of
# $project (under $projectroot) and return the first line of its output,
# chomped, or undef when the command could not be started or printed
# nothing.
# The global $git_dir is pointed at the project for the duration of the
# call; it is restored afterwards only if it was defined beforehand.
sub git_get_hash {
	my ($project, $hash, @options) = @_;

	my $saved_git_dir = $git_dir;
	$git_dir = "$projectroot/$project";

	my $retval = undef;
	my $opened = open(my $fd, '-|', git_cmd(), 'rev-parse',
	                  '--verify', '-q', @options, $hash);
	if ($opened) {
		$retval = <$fd>;
		chomp $retval if defined $retval;
		close $fd;
	}

	$git_dir = $saved_git_dir if (defined $saved_git_dir);

	return $retval;
}
2583
# Get the type of the given object, as printed by "git cat-file -t".
# Returns nothing when the command cannot be started or when closing the
# pipe reports failure.
sub git_get_type {
	my ($hash) = @_;

	my $fd;
	unless (open $fd, "-|", git_cmd(), "cat-file", '-t', $hash) {
		return;
	}
	my $type = <$fd>;
	unless (close $fd) {
		return;
	}

	chomp $type;
	return $type;
}
2594
# Repository configuration cache: %config holds the parsed configuration,
# and $config_file the path of the config file it was loaded for (empty
# string until something has been loaded).
our ($config_file, %config);
$config_file = '';
2598
# Add $value under $key in the hash referenced by $hash.
# Multiple values for a single key are stored as an anonymous array
# reference; a single value is stored directly in the hash, not as
# [ <value> ].
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key}) {
		my $current = $hash->{$key};
		if (ref $current) {
			# already multi-valued: append
			push @$current, $value;
		} else {
			# second value for this key: promote to array reference
			$hash->{$key} = [ $current, $value ];
		}
	} else {
		# first value for this key
		$hash->{$key} = $value;
	}
}
2612
# Return the hash of git project configuration, as reported by
# "git config -z -l" for the current $git_dir.
# Optionally limited to some section, e.g. 'gitweb': $section_regexp is a
# regexp fragment matched against the part of the key before the first dot.
# Keys occurring more than once get an array reference as value (see
# hash_set_multi); a key without a value maps to undef.
# Returns nothing if the git command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compile the section filter once per call.  (The /o modifier must not
	# be used here: it would freeze the pattern built from the first
	# $section_regexp ever passed, for all later calls.)
	my $section_re = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	# 'git config -z' terminates each entry with NUL
	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# key and value are separated by the first newline
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $section_re || $key =~ $section_re);
	}
	close $fh;

	return %config;
}
2635
# Convert a config value to a boolean (true or false value).
# No value (undef), a number > 0, 'true' and 'yes' (case-insensitive) are
# true; all remaining values are treated as false (never as an error).
sub config_to_bool {
	my ($val) = @_;

	# section.key (key present without a value)
	return 1 unless defined $val;

	# strip leading and trailing whitespace
	for ($val) {
		s/^\s+//;
		s/\s+$//;
	}

	# section.key = 1
	return $val if ($val =~ /^\d+$/ && $val);
	# section.key = true
	return $val =~ /^(?:true|yes)$/i;
}
2651
# Convert a config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (case-insensitive) will
# cause the value to be multiplied by 1024, 1048576, or 1073741824.
# Values that do not look like "<digits><suffix>" are returned as they are
# (after stripping surrounding whitespace); an undefined value (key without
# a value) is returned as undef.
sub config_to_int {
	my $val = shift;

	# nothing to convert; avoids "uninitialized value" warnings below
	return $val unless defined $val;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
		# the pattern admits only these three suffixes
		my %multiplier = (
			'k' =>       1024,
			'm' =>    1048576,
			'g' => 1073741824,
		);
		return $num * $multiplier{lc($unit)};
	}
	return $val;
}
2671
# Convert a config value to an array reference, if needed:
# a reference is returned as is, a defined plain value is wrapped in a
# one-element array, and undef becomes an empty array.
sub config_to_multi {
	my ($val) = @_;

	return $val if ref($val);
	return []   unless defined($val);
	return [ $val ];
}
2678
# Return the value of the gitweb.$key configuration variable of the current
# repository ($git_dir), or nothing if $git_dir is not set, the key is
# empty or malformed, or the variable does not exist.
# $key may be given with or without the 'gitweb.' prefix.  $type may be
# 'bool' or 'int' (optionally prefixed with '--'); any other type is
# ignored.  With 'bool' the result is the string 'true' or 'false'.
# The parsed 'gitweb' section is cached in %config and re-read whenever
# $config_file does not match "$git_dir/config".
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	my @parts = ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/);
	$key = @parts
		? join(".", lc($parts[0]), $parts[1], lc($parts[2]))
		: lc($key);
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);

	# type sanity check
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# get config (refresh the cache if it belongs to another repository)
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $full_key = "gitweb.$key";
	return unless exists $config{$full_key};

	# ensure given type
	return $config{$full_key} unless defined $type;
	# backward compatibility: 'git config --bool' returns true/false
	return config_to_bool($config{$full_key}) ? 'true' : 'false'
		if ($type eq 'bool');
	# the only remaining possibility is 'int'
	return config_to_int($config{$full_key});
}
2724
# Get the hash of the given path at the given ref, using "git ls-tree".
# $base is the tree-ish, $path the path inside it (trailing slashes are
# ignored) and $type an optional object type ('blob', 'tree', ...) the
# entry must have.
# Returns undef when $path is empty, when there is no such entry, when
# the entry has a different type, when git fails, or when the output line
# cannot be parsed.  Calls die_error() if the command cannot be started.
sub git_get_hash_by_path {
	my $base = shift;
	my $path = shift || return undef;
	my $type = shift;

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# Capture into lexicals and bail out if the line does not parse:
	# after a failed match $2/$3 would still hold values from an earlier,
	# unrelated match.
	my ($obj_type, $obj_hash) =
		($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/)
		or return undef;

	if (defined $type && $type ne $obj_type) {
		# type doesn't match
		return undef;
	}
	return $obj_hash;
}
2751
# Get the path of the entry with the given hash at the given tree-ish
# (ref); used to get the 'from' filename for combined diff (merge commit)
# for renames.
# Walks "git ls-tree -r -t -z $base" and returns the path of the first
# entry whose object id is $hash.  Returns nothing when $base or $hash is
# empty, and undef when git cannot be started or no entry matches.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# 'git ls-tree -z' terminates each entry with NUL
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
		# \Q...\E: $hash is data, not a pattern
		if ($line =~ m/(?:[0-9]+) (?:.+) \Q$hash\E\t(.+)$/) {
			# save the capture before doing anything else
			my $path = $1;
			close $fd;
			return $path;
		}
	}
	close $fd;
	return undef;
}
2775
2776 ## ......................................................................
2777 ## git utility functions, directly accessing git repository
2778
# Get the value of a config variable either from the file named as the
# variable itself in the repository ($GIT_DIR/$name file), or, when that
# file cannot be opened, from the gitweb.$name configuration variable in
# the repository config file.
# Only the first line of the file is used.  Sets the global $git_dir to the
# repository of $path (relative to $projectroot).
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/$name") {
		return git_get_project_config($name);
	}
	my $conf = <$fd>;
	close $fd;

	chomp $conf if (defined $conf);
	return $conf;
}
2795
# Get the description of the project at $path, from its 'description' file
# or the gitweb.description config variable.
sub git_get_project_description {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'description');
}
2800
# Get the category of the project at $path, from its 'category' file or
# the gitweb.category config variable.
sub git_get_project_category {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'category');
}
2805
2806
# Return a hash reference mapping content tags ('ctags') of the given
# project to their weights.  Sets the global $git_dir to the project.
#
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise (including an empty file) add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
# The first format that is available is used; they are not merged.
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			# only the first line is looked at; undef for an empty file
			my $val = <$ct>;
			chomp $val if defined $val;
			close $ct;

			# tag name is the file name without directories
			(my $ctag = $tagfile) =~ s#.*/##;
			if (defined $val && $val =~ /^\d+$/) {
				$ctags->{$ctag} = $val;
			} else {
				$ctags->{$ctag} = 1;
			}
		}
		closedir $dh;

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2853
# Return a hash reference where keys are content tags ('ctags'), and values
# are the sum of weights of the given tag over every project in the list
# referenced by $projects (each project keeps its tags under 'ctags').
sub git_gather_all_ctags {
	my $projects = shift;
	my %total;

	for my $project (@$projects) {
		for my $tag (keys %{ $project->{'ctags'} }) {
			$total{$tag} += $project->{'ctags'}{$tag};
		}
	}

	return \%total;
}
2868
# Build the tag cloud data for the given content tags ($ctags maps tag
# name to weight).
# Returns an HTML::TagCloud object when that module can be loaded;
# otherwise a hash reference keyed by lowercased tag, each entry holding
# 'count' (summed weight) and 'ctag' (HTML link to the tag's project list).
# The tag equal to the 'ctag' input parameter is wrapped in
# <span class="match">.
sub git_populate_project_tagcloud {
	my $ctags = shift;

	# First, merge different-cased tags; tags vote on casing
	# (the spelling with the highest weight is the one displayed)
	my %ctags_lc;
	foreach my $name (keys %$ctags) {
		my $weight = $ctags->{$name};
		my $merged = ($ctags_lc{lc $name} ||= {});

		$merged->{count} += $weight;
		if (!$merged->{topcount} || $merged->{topcount} < $weight) {
			$merged->{topcount} = $weight;
			$merged->{topname}  = $name;
		}
	}

	my $matched = $input_params{'ctag'};
	# mark the currently selected tag
	my $highlight = sub {
		my ($ctag, $title) = @_;
		return (defined $matched && $matched eq $ctag)
			? qq(<span class="match">$title</span>)
			: $title;
	};

	if (eval { require HTML::TagCloud; 1; }) {
		my $cloud = HTML::TagCloud->new;
		foreach my $ctag (sort keys %ctags_lc) {
			# Pad the title with spaces so that the cloud looks
			# less crammed.
			my $title = esc_html($ctags_lc{$ctag}->{topname});
			$title =~ s/ /&nbsp;/g;
			$title =~ s/^/&nbsp;/g;
			$title =~ s/$/&nbsp;/g;
			$title = $highlight->($ctag, $title);
			$cloud->add($title, href(project=>undef, ctag=>$ctag),
			            $ctags_lc{$ctag}->{count});
		}
		return $cloud;
	}

	# fallback without HTML::TagCloud: plain hash of counts and links
	my $cloud = {};
	foreach my $ctag (keys %ctags_lc) {
		my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
		$title = $highlight->($ctag, $title);
		$cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
		$cloud->{$ctag}{ctag} =
			$cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
	}
	return $cloud;
}
2914
# Render the tag cloud produced by git_populate_project_tagcloud() as HTML,
# limited to $count tags.
# An HTML::TagCloud object renders itself; the plain hash fallback becomes
# a comma-separated list of links inside <div id="htmltagcloud">, centered
# when no project is selected.
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;

	return $cloud->html_and_css($count)
		if (ref $cloud eq 'HTML::TagCloud');

	# NOTE(review): the sort is ascending by count, so the first $count
	# entries are the lowest-weighted tags -- confirm this is intended.
	my @tags = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
	my @shown = splice(@tags, 0, $count);

	my $align = $project ? '' : ' align="center"';
	my $links = join(', ', map { $cloud->{$_}->{'ctag'} } @shown);

	return '<div id="htmltagcloud"' . $align . '>' . $links . '</div>';
}
2929
# Get the list of URLs of the project at $path: the lines of its
# 'cloneurl' file or, when that file cannot be opened, the values of the
# multi-valued gitweb.url config variable.
# Returns a list in list context and an array reference otherwise.
# Sets the global $git_dir to the project.
sub git_get_project_url_list {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open $fd, '<', "$git_dir/cloneurl") {
		# no cloneurl file: fall back to the repository config
		my $configured = config_to_multi(git_get_project_config('url'));
		return wantarray ? @$configured : $configured;
	}

	my @git_project_url_list;
	while (my $url = <$fd>) {
		chomp $url;
		push @git_project_url_list, $url;
	}
	close $fd;

	return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2943
# Return the list of exported projects as hash references with a 'path'
# key (relative to the projects root) and, when read from a projects list
# file that names one, an 'owner' key.
#
# If $projects_list is a directory it is scanned for repositories (as
# judged by check_export_ok()), at most $project_maxdepth levels deep; if
# it is a file, it is read as a list of url-encoded "<path> <owner>" lines.
# $filter, if given, limits the result to projects below that
# subdirectory.  With $paranoid set, the directory scan starts at the top
# and the filter is applied to every candidate instead of narrowing the
# starting directory.
sub git_get_projects_list {
	my $filter = shift || '';
	my $paranoid = shift;
	my @list;

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list;
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);
		# when filtering, search only given subdirectory
		if ($filter && !$paranoid) {
			$dir .= "/$filter";
			$dir =~ s!/+$!!;
		}

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => sub {
				# global variables
				our $project_maxdepth;
				our $projectroot;
				# skip project-list toplevel, if we get it.
				return if (m!^[/.]$!);
				# only directories can be git repositories
				return unless (-d $_);
				# don't traverse too deep (Find is super slow on os x)
				# $project_maxdepth excludes depth of $projectroot
				if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
					$File::Find::prune = 1;
					return;
				}

				my $path = substr($File::Find::name, $pfxlen + 1);
				# paranoidly only filter here
				# (leave the callback with 'return': 'next' here would
				# exit the subroutine through a loop control statement)
				if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
					return;
				}
				# we check related file in $projectroot
				if (check_export_ok("$projectroot/$path")) {
					push @list, { path => $path };
					# a repository is not searched for nested ones
					$File::Find::prune = 1;
				}
			},
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		open my $fd, '<', $projects_list or return;
	PROJECT:
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			# skip blank lines
			next PROJECT unless defined $path;
			$path = unescape($path);
			next PROJECT unless defined $path;
			# the owner field is optional
			$owner = unescape($owner) if defined $owner;
			# if $filter is provided, check if $path begins with $filter
			if ($filter && $path !~ m!^\Q$filter\E/!) {
				next PROJECT;
			}
			if (check_export_ok("$projectroot/$path")) {
				my $pr = {
					path => $path
				};
				if ($owner) {
					$pr->{'owner'} = to_utf8($owner);
				}
				push @list, $pr;
			}
		}
		close $fd;
	}
	return @list;
}
3027
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
#
# Takes a reference to a list of project hashes and returns the list of
# projects that are not forks.  A project 'foo/bar.git' is treated as a fork
# when another listed project 'foo.git' has a directory "$projectroot/foo".
# As a side effect every project that may have forks gets a 'forks' field:
# an array reference holding the forks found for it (possibly empty).
sub filter_forks_from_projects_list {
        my $projects = shift;

        # prefix tree keyed by path component; the '' key of a node is the
        # end marker and holds the project whose path ends at that node
        my %trie;

        # first pass: register every project that might contain forks
        foreach my $candidate (@$projects) {
                my $base = $candidate->{'path'};
                $base =~ s/\.git$//;             # forks of 'repo.git' live in 'repo/'
                next if ($base =~ m!/$!);        # non-bare repository, e.g. 'repo/.git'
                next if (!$base);                # the '.git' repository itself
                next if (!-d "$projectroot/$base"); # no directory that could hold forks
                $candidate->{'forks'} = [];      # zero or more forks will be collected here

                my @parts = split('/', $base);
                my $node = \%trie;
                # follow the part of the path that the trie already knows
                while (scalar @parts && exists($node->{$parts[0]})) {
                        $node = $node->{shift @parts};
                }
                # grow the trie with whatever components are left
                foreach my $part (@parts) {
                        $node->{$part} = {};
                        $node = $node->{$part};
                }
                # first project to reach this node owns the end marker
                $node->{''} = $candidate unless (exists $node->{''});
        }

        # second pass: a project is a fork when a proper prefix of its path
        # ends at an end marker; the shortest such prefix wins
        my @kept;
 PROJECT:
        foreach my $pr (@$projects) {
                my $node = \%trie;
                foreach my $part (split('/', $pr->{'path'})) {
                        if (exists $node->{''}) {
                                # prefix belongs to another project: record as its fork
                                push @{$node->{''}{'forks'}}, $pr;
                                next PROJECT;
                        }
                        unless (exists $node->{$part}) {
                                # path leaves the trie: no prefix, hence not a fork
                                push @kept, $pr;
                                next PROJECT;
                        }
                        $node = $node->{$part};
                }
                # all components consumed without hitting an end marker
                push @kept, $pr;
        }

        return @kept;
}
3087
# Returns the projects from @$projlist that match the given options:
#   tagfilter     => keep projects having this content tag (case-insensitive)
#   search_regexp => keep projects whose 'path' or 'descr_long' matches
# When neither option is set the list is returned unchanged.  Otherwise
# fill_project_list_info is called first to fill the fields being examined.
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my ($wanted_tag, $pattern) = @opts{'tagfilter', 'search_regexp'};

        return @$projlist
                if (!$wanted_tag && !$pattern);

        # request only the fields that the active filters look at
        my @fields;
        push @fields, 'ctags'         if ($wanted_tag);
        push @fields, 'path', 'descr' if ($pattern);
        fill_project_list_info($projlist, @fields);

        my @matched;
        foreach my $pr (@$projlist) {
                if ($wanted_tag) {
                        next if (ref($pr->{'ctags'}) ne 'HASH');
                        next if (!grep { lc($_) eq lc($wanted_tag) } keys %{$pr->{'ctags'}});
                }

                if ($pattern) {
                        next if ($pr->{'path'} !~ /$pattern/ &&
                                 $pr->{'descr_long'} !~ /$pattern/);
                }

                push @matched, $pr;
        }

        return @matched;
}
3123
# Cache of project path => owner, as read from $projects_list;
# undef until git_get_project_list_from_file() has run.
our $gitweb_project_owner = undef;

# Fills $gitweb_project_owner from the $projects_list file (once; later
# calls return immediately).  The file holds one url-encoded entry per line:
# 'git%2Fgit.git Linus+Torvalds'
# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
# A project listed without an owner is stored with an undefined owner.
# If $projects_list is not a plain file or cannot be opened, the cache is
# left empty.
sub git_get_project_list_from_file {

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        return unless (-f $projects_list);

        # do not try to read from a handle that failed to open
        open(my $fd, '<', $projects_list)
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($pr, $ow) = split ' ', $line;
                # blank line: no project path to use as a key
                next unless (defined $pr);
                $pr = unescape($pr);
                # owner is optional; decode it only when present
                $gitweb_project_owner->{$pr} =
                        defined $ow ? to_utf8(unescape($ow)) : undef;
        }
        close $fd;
        return;
}
3146
# Returns the owner of $project, or undef when no project is given.
# Sources are tried in order: the cached projects list file, the 'owner'
# project config value, and finally get_file_owner() on the repository
# directory.  Sets the global $git_dir to the project's directory.
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # load the owner cache on first use
        git_get_project_list_from_file()
                unless (defined $gitweb_project_owner);

        my $owner = exists $gitweb_project_owner->{$project}
                ? $gitweb_project_owner->{$project}
                : undef;
        $owner = git_get_project_config('owner')
                unless (defined $owner);
        $owner = get_file_owner("$git_dir")
                unless (defined $owner);

        return $owner;
}
3170
# Returns (age in seconds, age string) of the most recently committed-to
# branch under refs/heads of the repository at "$projectroot/$path".
# Returns (undef, undef) when no committer line with a timestamp was read,
# and an empty list when the git command could not be run or closed cleanly.
# Sets the global $git_dir.
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        my $newest = <$fd>;
        close $fd or return;

        # the committer line ends with "<epoch> <+/-hhmm>"
        return (undef, undef)
                unless (defined $newest &&
                        $newest =~ / (\d+) [-+][01]\d\d\d$/);

        my $age = time - $1;
        return ($age, age_string($age));
}
3191
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and keep
# only the entries for the remote we want.
#
# Returns a hash (list context) or hash reference (scalar context) mapping
# remote name to { 'heads' => undef, <key> => <url>, ... }, where <key> is
# the word that 'git remote -v' prints in parentheses after the URL.
# When $wanted is given only that remote is included.  Returns nothing if
# the git command cannot be started or exits with an error.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # test open's result: "open my $fd" leaves a true handle in $fd even
        # when it fails, so checking $fd afterwards would never catch failure
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # strip "\t<url> (<key>)", leaving the remote name; skip lines
                # of any other shape instead of reusing stale capture values
                next unless ($remote =~ s!\t(.*?)\s+\((\w+)\)$!!);
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # 'heads' starts out undefined; fill_remote_heads() sets it
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3216
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
#
# Each remote's 'heads' field becomes an array reference of the head entries
# returned by git_get_heads_list() whose name starts with "<remote>/".
# That prefix is removed from the entry's 'name' in place.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q...\E: the remote name is literal text, not a pattern, so
                # characters such as '.' or '+' in it must not act as regex
                # metacharacters
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3229
# Returns a reference to a hash mapping object id to an array reference of
# ref names (without the leading 'refs/') as reported by
# 'git show-ref --dereference'.  The optional $type (e.g. "heads", "tags")
# restricts the result to refs under "refs/$type".  Returns nothing if the
# git command cannot be started or exits with an error.
sub git_get_references {
        my $type = shift || "";
        my %refs;
        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference",
                ($type ? ("--", "refs/$type") : ()) # use -- <pattern> if $type
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                # \Q...\E: $type is a literal path prefix, not a pattern
                if ($line =~ m!^([0-9a-fA-F]{40})\srefs/(\Q$type\E.*)$!) {
                        # autovivification creates the array on first use
                        push @{$refs{$1}}, $2;
                }
        }
        close $fd or return;
        return \%refs;
}
3252
# Returns the tag-based name that 'git name-rev --tags' reports for $hash
# (the part after 'tags/'), or undef when $hash is false, when the command
# produced no output, or when the output is not of the form
# '<hash> tags/<name>'.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # $name_rev is undef when the command printed nothing;
        # \Q...\E keeps $hash from being interpreted as a pattern
        if (defined $name_rev &&
            $name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
3268
3269 ## ----------------------------------------------------------------------
3270 ## parse to hash functions
3271
# Breaks an epoch timestamp down into a hash of date fields.
#   $epoch - seconds since the epoch
#   $tz    - timezone as '+hhmm' or '-hhmm' (default "-0000")
# Returns a hash with UTC fields ('hour', 'minute', 'mday', 'day', 'month',
# 'rfc2822', 'mday-time', 'iso-8601') and fields shifted by $tz
# ('hour_local', 'minute_local', 'iso-tz'); 'tz_local' holds $tz as given.
# A $tz that is not of the form [+-]hhmm is treated as a zero offset.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # offset in seconds; stays 0 when $tz cannot be parsed, so that no
        # undefined values enter the arithmetic below
        my $offset = 0;
        if (my ($tz_sign, $tz_hour, $tz_min) =
                ($tz =~ m/^([-+])(\d\d)(\d\d)$/)) {
                $offset = ($tz_sign eq '-' ? -1 : +1) *
                          ((($tz_hour*60) + $tz_min)*60);
        }
        my $local = $epoch + $offset;
        # shifting the epoch and using gmtime yields the wall-clock time in $tz
        ($sec, $min, $hour, $mday, $mon, $year) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3305
# Parses the tag object $tag_id as printed by 'git cat-file tag'.
# Returns a hash with 'id', 'object', 'type', 'name', the tagger fields
# ('author', 'author_epoch', 'author_tz', 'author_name', 'author_email')
# and 'comment' (array reference of the remaining lines).  Returns nothing
# if the command cannot be run, exits with an error, or prints no 'tag' line.
sub parse_tag {
        my $tag_id = shift;
        my (%tag, @comment);

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
        $tag{'id'} = $tag_id;
 HEADER:
        while (my $line = <$fd>) {
                chomp $line;
                # an empty line ends the header
                last HEADER if ($line eq "");

                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                        next HEADER;
                }
                if ($line =~ m/--BEGIN/) {
                        # this line is kept as the first line of the comment
                        push @comment, $line;
                        last HEADER;
                }
        }
        # everything after the header is the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless (defined $tag{'name'});
        return %tag;
}
3346
# Parses one commit record as printed by 'git rev-list --header'.
#   $commit_text - the record text; its last line is discarded
#   $withparents - when defined, parents are taken only from the first line
#                  (output of --parents); otherwise also from 'parent' lines
# Returns a hash with 'id', 'tree', 'parents', 'parent', the author and
# committer fields, 'title', 'title_short', 'comment' (array reference of
# message lines with the 4-space indent removed), 'age', 'age_string',
# 'age_string_date' and 'age_string_age'.  Returns nothing when the text is
# empty, does not start with a 40-digit hex id, or has no 'tree' line.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # header lines; the loop ends at the first empty line
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # remove added spaces: exactly one level of indent from every line
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        # the title is the first non-empty message line
        foreach my $line (@commit_lines) {
                next if ($line eq "");
                # work on a copy: the loop variable aliases the array element,
                # and the abbreviations below must not leak into 'comment'
                my $title = $line;
                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        if (length($title) > 50) {
                                $title =~ s/(http|rsync):\/\///;
                        }
                        if (length($title) > 50) {
                                $title =~ s/(master|www|rsync)\.//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/kernel.org:?//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/\/pub\/scm//;
                        }
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($mday, $mon, $year) = (gmtime($co{'committer_epoch'}))[3, 4, 5];
        # commits older than two weeks lead with the date, newer ones with the age
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3444
# Runs 'git rev-list --parents --header --max-count=1' for $commit_id and
# returns the hash produced by parse_commit_text() for its output.
# Calls die_error(500, ...) when the command cannot be started.
sub parse_commit {
        my ($commit_id) = @_;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--parents",
                   "--header",
                   "--max-count=1",
                   $commit_id,
                   "--");
        open(my $fd, "-|", @cmd)
                or die_error(500, "Open git-rev-list failed");
        my %co = parse_commit_text(<$fd>, 1);
        close $fd;

        return %co;
}
3463
# Runs 'git rev-list --header' starting at $commit_id and parses every
# record with parse_commit_text().
#   $maxcount - value for --max-count (default 1)
#   $skip     - value for --skip (default 0)
#   $filename - optional path to limit the history to
#   @args     - extra options placed right after --header
# Returns the list of commit hash references (list context) or a reference
# to that list (scalar context).  Calls die_error(500, ...) when the command
# cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount = 1 unless $maxcount;
        $skip     = 0 unless $skip;

        # rev-list --header terminates each record with NUL
        local $/ = "\0";

        my @cmd = (git_cmd(), "rev-list",
                   "--header",
                   @args,
                   "--max-count=$maxcount",
                   "--skip=$skip",
                   @extra_options,
                   $commit_id,
                   "--");
        push @cmd, $filename if ($filename);

        open(my $fd, "-|", @cmd)
                or die_error(500, "Open git-rev-list failed");
        my @cos;
        while (my $record = <$fd>) {
                my %co = parse_commit_text($record);
                push @cos, \%co;
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3491
# parse line of git-diff-tree "raw" output
#
# Recognizes three kinds of lines: an ordinary raw diff line, a combined
# diff line for a merge commit, and a bare 40-digit commit id.  Returns a
# hash (list context) or hash reference (scalar context) with the parsed
# fields; the hash is empty when the line matches none of the three.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                my $files = $7;
                @res{'from_mode', 'to_mode', 'from_id', 'to_id', 'status', 'similarity'} =
                        ($1, $2, $3, $4, $5, $6);
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        # source and destination names are separated by a tab
                        @res{'from_file', 'to_file'} =
                                map { unquote($_) } split("\t", $files);
                } else {
                        my $file = unquote($files);
                        $res{'file'}      = $file;
                        $res{'to_file'}   = $file;
                        $res{'from_file'} = $file;
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif ($line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/) {
                my ($colons, $modes, $ids, $status, $file) = ($1, $2, $3, $4, $5);
                # the last mode and the last id describe the result
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $status) ];
                $res{'to_file'}   = unquote($file);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3530
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
#
# A hash reference is assumed to be already parsed (or built by hand) and is
# returned as is; anything else is passed to parse_difftree_raw_line().
sub parsed_difftree_line {
        my $line_or_ref = shift;

        return $line_or_ref
                if (ref($line_or_ref) eq "HASH");

        return parse_difftree_raw_line($line_or_ref);
}
3543
# parse line of git-ls-tree output
#
# Options (passed as a hash after the line):
#   -l => the line has a size column ('git ls-tree -l'); adds 'size'
#   -z => the name is used as is; otherwise it is passed through unquote()
# Returns a hash (list context) or hash reference (scalar context) with
# 'mode', 'type', 'hash', 'name' and, with -l, 'size'.  The hash is empty
# when the line does not have the expected format.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;
        my $name;

        # capture variables are read only after a successful match, so that
        # a malformed line cannot pick up values left by an earlier match
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s) {
                        @res{'mode', 'type', 'hash', 'size'} = ($1, $2, $3, $4);
                        $name = $5;
                }
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s) {
                        @res{'mode', 'type', 'hash'} = ($1, $2, $3);
                        $name = $4;
                }
        }

        if (defined $name) {
                $res{'name'} = $opts{'-z'} ? $name : unquote($name);
        }

        return wantarray ? %res : \%res;
}
3579
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# Fills %$from and %$to with 'file' and 'href' for the pre-image and
# post-image of the parsed diff line $diffinfo.  For a combined diff
# ($diffinfo->{'nparents'} set) $from->{'file'} and $from->{'href'} are
# arrays with one entry per parent, using @parents as hash bases.  'href' is
# undefined or absent for a side on which the file does not exist.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if (!$diffinfo->{'nparents'}) {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        } else {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the result name when this parent has none
                        my $name = $diffinfo->{'from_file'}[$i];
                        $name = $diffinfo->{'to_file'}
                                unless (defined $name);
                        $from->{'file'}[$i] = $name;

                        if ($diffinfo->{'status'}[$i] eq "A") { # new (added) file
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) { # file is gone in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3625
3626 ## ......................................................................
3627 ## parse to array of hashes functions
3628
# Lists refs under refs/<class> for each of @classes (default: 'heads'),
# sorted by committer date, newest first.
#   $limit - when true, at most $limit+1 refs are requested
# Each entry is a hash reference with 'fullname', 'name' (without the
# refs/heads/ or refs/remotes/ prefix), 'id', 'title', 'epoch' and 'age'.
# Returns the list (list context) or a reference to it (scalar context);
# returns nothing when the git command cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;

        my @cmd = (git_cmd(), 'for-each-ref');
        push @cmd, '--count='.($limit+1) if ($limit);
        push @cmd, '--sort=-committerdate',
                   '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                   map { "refs/$_" } @classes;
        open(my $fd, '-|', @cmd)
                or return;

        my @headslist;
        while (my $line = <$fd>) {
                chomp $line;
                # NUL separates the ref description from the committer info
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $name, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);

                my %ref_item = (
                        'fullname' => $name,
                        'id'       => $hash,
                        'title'    => $title || '(no commit message)',
                        'epoch'    => $epoch,
                );
                ($ref_item{'name'} = $name) =~ s!^refs/(?:head|remote)s/!!;
                $ref_item{'age'} = $epoch ? age_string(time - $epoch) : "unknown";

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3667
# Lists refs under refs/tags, sorted by creator date, newest first.
#   $limit - when true, at most $limit+1 refs are requested
# Each entry is a hash reference with 'fullname', 'name' (without the
# refs/tags/ prefix), 'type', 'id', 'reftype' and 'refid'; tag objects also
# get 'subject', and tags and commits get 'epoch' and 'age'.
# Returns the list (list context) or a reference to it (scalar context);
# returns nothing when the git command cannot be started.
sub git_get_tags_list {
        my $limit = shift;
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                # limit of 2: without it split drops an empty trailing field,
                # leaving $creatorinfo undefined when the ref has no creator
                my ($refinfo, $creatorinfo) = split(/\0/, $line, 2);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my $epoch;
                if (defined $creatorinfo &&
                    $creatorinfo =~ /^(.*) ([0-9]+) (.*)$/) {
                        $epoch = $2;
                }
                $ref_item{'fullname'} = $name;
                $name =~ s!^refs/tags/!!;

                $ref_item{'type'} = $type;
                $ref_item{'id'} = $id;
                $ref_item{'name'} = $name;
                if ($type eq "tag") {
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # not a tag object: the ref points directly at the object
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        if ($epoch) {
                                $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                        } else {
                                $ref_item{'age'} = "unknown";
                        }
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3716
3717 ## ----------------------------------------------------------------------
3718 ## filesystem-related functions
3719
# Returns the name of the owner of $path: the GECOS field of the owning
# user's passwd entry, cut at the first ',' or ';' and passed through
# to_utf8().  Returns undef when $path cannot be stat'ed or the owning uid
# has no passwd entry.
sub get_file_owner {
        my $path = shift;

        # without this check a failed stat would hand undef to getpwuid,
        # which would then look up uid 0
        my @st = stat($path)
                or return undef;
        my $st_uid = $st[4];
        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3732
# Prints the contents of $filename, each line passed through to_utf8().
# The file is expected to exist; if it cannot be opened nothing is printed.
sub insert_file {
        my $filename = shift;

        # do not read from a handle that failed to open
        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3741
3742 ## ......................................................................
3743 ## mimetype related functions
3744
# Looks up the MIME type for $filename in the mime.types-style file $mimemap
# (lines of "<mimetype> <ext> <ext> ...", '#' starts a comment line).
# The extension is the text after the last '.' of $filename.
# Returns the MIME type, or undef when the map file is not readable, the
# filename has no extension, or the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        # lexical loop variable: leaves the caller's $_ alone
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/, $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        # take the capture from this match only; a filename without '.' must
        # not reuse a value left in $1 by an earlier match
        my ($ext) = ($filename =~ /\.([^.]*)$/);
        return undef unless defined $ext;
        return $mimemap{$ext};
}
3764
# Guesses the MIME type of $filename from its extension.  The map named by
# $mimetypes_file is consulted first (a path not starting with '/' is taken
# relative to the current project's directory), then '/etc/mime.types'.
# Returns undef when $filename contains no '.' or no map knows the extension.
sub mimetype_guess {
        my $filename = shift;
        return undef unless ($filename =~ /\./);

        my $mime;
        if ($mimetypes_file) {
                # a relative path is relative to the project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        unless ($mime) {
                $mime = mimetype_guess_file($filename, '/etc/mime.types');
        }
        return $mime;
}
3781
# Determines the MIME type of a blob.
#   $fd       - filehandle the blob can be read from (may be false)
#   $filename - name of the blob (may be false)
# A type guessed from the filename by mimetype_guess() wins.  Without a
# filehandle $default_blob_plain_mimetype is returned.  Otherwise content
# that passes the -T text test is 'text/plain', and anything else is typed
# by a few known image extensions or falls back to
# 'application/octet-stream'.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if ($guessed);
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain'               if (-T $fd);
        return 'application/octet-stream' if (! $filename);
        return 'image/png'                if ($filename =~ m/\.png$/i);
        return 'image/gif'                if ($filename =~ m/\.gif$/i);
        return 'image/jpeg'               if ($filename =~ m/\.jpe?g$/i);
        return 'application/octet-stream';
}
3808
# Return the Content-Type value for a blob: the given $type, or the type
# found by blob_mimetype() when $type is not given.  For 'text/plain' the
# charset from $default_text_plain_charset is appended if that is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return "$type; charset=$default_text_plain_charset";
}
3819
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Parameters:
#   $highlight - true if highlighting is wanted at all
#   $mimetype  - accepted but not used by this function
#   $file_name - name of the file; a trailing '.in' is ignored
# The base name is looked up in %highlight_basename first, then its
# extension (the text after the last '.') in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # Without this test a name with no '.' would be looked up under
        # whatever an earlier, unrelated match left in $1.
        $basename =~ /\.([^.]*)$/ or return undef;
        my $ext = $1 or return undef;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3836
# Run the syntax highlighter over the blob named by the global $hash.
# Returns $fd untouched unless highlighting is requested and a syntax is
# known; otherwise $fd is closed and reopened on the output of
# "git cat-file blob" piped through the highlighter, and that handle is
# returned.  Failure to start the pipeline is reported through die_error().
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;

        # no highlighting: hand the original FD back
        if (!$highlight || !defined $syntax) {
                return $fd;
        }

        close $fd;

        my $blob_cmd = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $highlight_cmd = quote_command($highlight_bin) .
                " --replace-tabs=8 --fragment --syntax $syntax";
        open $fd, "$blob_cmd | $highlight_cmd |"
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3850
3851 ## ======================================================================
3852 ## functions printing HTML: header, footer, error page
3853
# Compose the page title from the site name and, as far as they are
# defined, the project (or project filter), the action and the file name.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (!defined $project) {
                # no project selected; mention the filter if there is one
                $title .= " - projects in '" . esc_path($project_filter) . "'"
                        if defined $project_filter;
                return $title;
        }

        $title .= " - " . to_utf8($project);
        if (defined $action) {
                $title .= "/$action"; # $action is US-ASCII (7bit ASCII)
                if (defined $file_name) {
                        $title .= " - " . esc_path($file_name);
                        # in 'tree' view the name always ends with a slash
                        $title .= "/"
                                if ($action eq "tree" && $file_name !~ m|/$|);
                }
        }

        return $title;
}
3876
# Choose the content type for HTML pages.
# 'application/xhtml+xml' is sent only to a UA that names it explicitly in
# its Accept header; anything else gets plain old 'text/html'.  The explicit
# check is needed because MSIE sometimes globs '*/*', pretending to support
# xhtml+xml but choking when it gets what it asked for.
sub get_content_type_html {
        my $accept = $cgi->http('HTTP_ACCEPT');
        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;

        return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3890
# Print the <link rel="alternate"> elements that belong in the page head.
#
# With a project selected: for each of the RSS and Atom formats, a link to
# the feed described by get_feed_info() and a second link to the same feed
# with the '--no-merges' extra option.  Without a project: links to the
# plain text project index and to the OPML list of project feeds.
sub print_feed_meta {
        # prints one <link> element; every value has to be escaped already
        # for use inside a double-quoted attribute
        my $print_alternate = sub {
                my ($title, $href, $type) = @_;
                print "<link ".
                      "rel=\"alternate\" ".
                      "title=\"$title\" ".
                      "href=\"$href\" ".
                      "type=\"$type\" ".
                      "/>\n";
        };

        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my $mime = "application/$type+xml";
                        my $title = esc_attr("$project - $href_params{'-title'} - $format feed");

                        # The URL ends up in an attribute just like the title,
                        # so it gets the same escaping.
                        $href_params{'extra_options'} = undef;
                        $href_params{'action'} = $type;
                        $print_alternate->($title, esc_attr(href(%href_params)), $mime);

                        $href_params{'extra_options'} = '--no-merges';
                        $print_alternate->($title . ' (no merges)',
                                           esc_attr(href(%href_params)), $mime);
                }

        } else {
                $print_alternate->(esc_attr($site_name) . " projects list",
                                   esc_attr(href(project=>undef, action=>"project_index")),
                                   "text/plain; charset=utf-8");
                $print_alternate->(esc_attr($site_name) . " projects feeds",
                                   esc_attr(href(project=>undef, action=>"opml")),
                                   "text/x-opml");
        }
}
3936
# Print the <link> elements of the page head: stylesheets, feed links
# (only when $status is '200 OK') and the favicon (when defined).
sub print_header_links {
        my $status = shift;

        # A defined $stylesheet wins over the @stylesheets list; this keeps
        # backwards compatibility for those people who defined $stylesheet
        # in a config file.  Empty entries of the list are skipped.
        my @css_urls = defined $stylesheet
                ? ($stylesheet)
                : (grep { $_ } @stylesheets);
        foreach my $css_url (@css_urls) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($css_url).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
                if defined $favicon;
}
3956
# Print one breadcrumb link per directory component given as argument.
# Each link leads to the project list filtered by the path accumulated so
# far and is followed by " / ".  Empty components are skipped.
sub print_nav_breadcrumbs_path {
        my $dirprefix = undef;
        # Walk the argument list itself: testing each part for truth would
        # cut the trail short at a directory called "0".
        foreach my $part (@_) {
                next unless (defined $part && length $part);
                $dirprefix .= "/" if defined $dirprefix;
                $dirprefix .= $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => $dirprefix,
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
3968
# Print the breadcrumb trail of the page header: the home link, then either
# the project (its directories, its name linked to the summary, the action
# and the optional -action_extra text) or the directories of the project
# filter.
# Options:
#   -action_extra - text appended after the action; when it is given the
#                   action itself is rendered as a link
sub print_nav_breadcrumbs {
        my %opts = @_;

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                my @path_parts = split '/', $project;
                my $repo_name = pop @path_parts;
                my $extra = $opts{-action_extra};

                print_nav_breadcrumbs_path(@path_parts);

                my $trail = $cgi->a({-href => href(action=>"summary")}, esc_html($repo_name));
                if (defined $action) {
                        $trail .= " / " . (defined $extra
                                ? $cgi->a({-href => href(action=>$action)}, $action)
                                : $action);
                }
                $trail .= " / $extra" if defined $extra;
                print "$trail\n";
        } elsif (defined $project_filter) {
                print_nav_breadcrumbs_path(split '/', $project_filter);
        }
}
3994
# Print the search form of the page header.
# An undefined global $searchtext is set to the empty string.  The search
# starts at $hash_base if defined, else at $hash, else at "HEAD".  With the
# 'pathinfo' feature the project is appended to the form action; without it
# the project is sent in a hidden "p" field.
sub print_search_form {
        $searchtext = "" unless defined $searchtext;

        my $search_hash =
                defined $hash_base ? $hash_base :
                defined $hash      ? $hash      :
                                     "HEAD";

        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        $action .= "/".esc_url($project) if $use_pathinfo;

        # everything up to and including the " search:" label
        my $form_start = $cgi->startform(-method => "get", -action => $action);
        $form_start .= "<div class=\"search\">\n";
        $form_start .= $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n"
                unless $use_pathinfo;
        $form_start .= $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n";
        $form_start .= $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n";
        $form_start .= $cgi->popup_menu(-name => 'st', -default => 'commit',
                                        -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']);
        $form_start .= $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?"));
        $form_start .= " search:\n";

        # text field, regexp checkbox and the end of the form
        my $form_end = $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n";
        $form_end .= "<span title=\"Extended regular expression\">";
        $form_end .= $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                    -checked => $search_use_regexp);
        $form_end .= "</span>" . "</div>";
        $form_end .= $cgi->end_form() . "\n";

        print $form_start, $form_end;
}
4030
# Print the HTTP header and the top of the HTML page: XML prolog and
# doctype, <head> (title, optional <base>, stylesheet/feed/favicon links,
# optional site head string), the optional site header file, the page
# header with logo and breadcrumbs and, for a project with the 'search'
# feature enabled, the search form.
#
# Parameters:
#   $status  - HTTP status line; "200 OK" is used when it is false
#   $expires - passed to the HTTP header as -expires
#   %opts    - '-no_http_header' suppresses the HTTP header; all options
#              are handed on to print_nav_breadcrumbs()
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                           -status=> $status, -expires => $expires)
                unless ($opts{'-no_http_header'});
        # shown in the "generator" meta element only when running under mod_perl
        my $mod_perl_version = $ENV{'MOD_PERL'} ? " $ENV{'MOD_PERL'}" : '';
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        if ($ENV{'PATH_INFO'}) {
                print "<base href=\"".esc_url($base_url)."\" />\n";
        }
        print_header_links($status);

        # site-specific string inserted verbatim (after to_utf8) into <head>
        if (defined $site_html_head_string) {
                print to_utf8($site_html_head_string);
        }

        print "</head>\n" .
              "<body>\n";

        # site-specific header file, included only if it is a plain file
        if (defined $site_header && -f $site_header) {
                insert_file($site_header);
        }

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $cgi->img({-src => esc_url($logo),
                                         -width => 72, -height => 27,
                                         -alt => "git",
                                         -class => "logo"}));
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        # the search form needs a project to search in
        my $have_search = gitweb_check_feature('search');
        if (defined $project && $have_search) {
                print_search_form();
        }
}
4089
# Print the bottom of the HTML page: the page footer (project description
# and RSS/Atom links for a project, OPML/TXT links otherwise), the optional
# timing information, the optional site footer file, the JavaScript
# includes and the closing </body> and </html> tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (defined $project) {
                my $descr = git_get_project_description($project);
                if (defined $descr) {
                        print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n";
                }

                my %href_params = get_feed_info();
                # no feed information for this page: mark the links as generic
                if (!%href_params) {
                        $feed_class .= ' generic';
                }
                $href_params{'-title'} ||= 'log';

                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }

        } else {
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        }
        print "</div>\n"; # class="page_footer"

        # time taken and number of git commands run, measured from $t0
        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took '.
                      '<span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span>'.
                      ' and '.
                      '<span id="generating_cmd">'.
                      $number_of_git_cmds.
                      '</span> git commands '.
                      " to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        # site-specific footer file, included only if it is a plain file
        if (defined $site_footer && -f $site_footer) {
                insert_file($site_footer);
        }

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        if (defined $action &&
            $action eq 'blame_incremental') {
                # incremental blame: start fetching the blame data
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # every other page: an onload handler that runs the
                # enabled JavaScript features
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!;
                if (gitweb_check_feature('javascript-actions')) {
                        print qq!       fixLinks();\n!;
                }
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!. # in days
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                print qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4168
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# A missing status code means 500, a missing message "Internal Server Error".
# The message is HTML-escaped, the detailed description is printed as is.
# Further arguments are options: they are handed on to git_header_html(),
# and '-error_handler' makes the function return to its caller instead of
# jumping to DONE_GITWEB.  A status code outside the list above is still
# shown on the page, but the response is sent as "500 Internal Server Error".
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # git_header_html() falls back to "200 OK" when it is given no
        # status, so an unlisted code must not be passed on as undef.
        my $http_status = $http_responses{$status};
        $http_status = $http_responses{500} unless defined $http_status;
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4212
4213 ## ----------------------------------------------------------------------
4214 ## functions printing or outputting HTML: navigation
4215
# Print the navigation bar of a project page.
#
# Parameters:
#   $current   - name of the current view; it is shown as plain text
#   $suppress  - name of an entry to leave out (if true)
#   $head      - hash used for the commit and commitdiff links and, in
#                tree/log/shortlog/commit/commitdiff/search views, for the
#                shortlog and log links as well
#   $treehead  - hash of the tree link
#   $treebase  - hash base of the tree link
#   $extra     - HTML printed on a second line (pager or formats)
# Entries configured through the 'actions' feature are inserted after the
# entry named as their position; in their links %n, %f, %h, %b and %% are
# replaced by project name, project path, $treehead, $treebase and '%'.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        my @navs = grep { !$suppress || $_ ne $suppress }
                qw(summary shortlog log commit commitdiff tree);

        # href() parameters of every entry, keyed by entry name
        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;

        if (defined $head) {
                my @with_head = qw(commit commitdiff);
                push @with_head, qw(shortlog log)
                        if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x);
                $arg{$_}{'hash'} = $head foreach @with_head;
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        # the feature is a flat list of (label, link, position) triples
        while (@actions) {
                my ($label, $link, $pos) = splice(@actions, 0, 3);
                # put the new entry right behind the one it follows
                @navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
                # expand the placeholders
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @entries, $nav;
                } else {
                        push @entries, $cgi->a(
                                {-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))},
                                "$nav");
                }
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4265
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes): every view except the current one is a link, the remotes view
# is only offered if the 'remote_heads' feature is enabled, and the entries
# are joined with " | "
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                push @entries, ($view eq $current
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view));
        }
        return join " | ", @entries;
}
4278
# Return the "first / prev / next" pager for page number $page.
# "first" and "prev" are links unless $page is 0, "next" is a link only if
# $has_next_link is true.  $action is accepted but not used here.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my @items;
        if ($page > 0) {
                push @items,
                        $cgi->a({-href => href(-replay=>1, page=>undef)}, "first"),
                        $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                 -accesskey => "p", -title => "Alt-p"}, "prev");
        } else {
                push @items, "first", "prev";
        }

        push @items, ($has_next_link
                ? $cgi->a({-href => href(-replay=>1, page=>$page+1),
                           -accesskey => "n", -title => "Alt-n"}, "next")
                : "next");

        return join(" &sdot; ", @items);
}
4304
4305 ## ......................................................................
4306 ## functions printing or outputting HTML: div
4307
# Print a <div class="header"> holding one link.
# The link leads to view $action, with $hash and $hash_base added when they
# are true; its text is $title, or $action when $title is false.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        $args{'hash'} = $hash if $hash;
        $args{'hash_base'} = $hash_base if $hash_base;

        my $text = $title ? $title : $action;
        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $text) .
              "\n</div>\n";
}
4321
# Return the table row showing a repository URL: $name in the first cell,
# $url in the second.  Both values are inserted as given.
sub format_repo_url {
        my ($name, $url) = @_;
        return '<tr class="metadata_url">' .
               "<td>$name</td>" .
               "<td>$url</td>" .
               "</tr>\n";
}
4326
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed as *handle, \*handle,
# *handle{IO} or as a lexical filehandle, or a function reference. In the
# latter case all following parameters will be taken as argument to the
# content function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        # The class of the reference does not identify a handle: *handle{IO}
        # is blessed into IO::File on newer perls, and a bare *handle is not
        # a reference at all.  Look at the underlying type instead.
        require Scalar::Util;
        my $reftype = Scalar::Util::reftype($content) || '';
        my $is_handle = $reftype eq 'GLOB' || $reftype eq 'IO' ||
                        ref(\$content) eq 'GLOB';

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4364
# Format the date given as hash reference $date: its 'rfc2822' string
# followed by the local time and timezone in parentheses.  The RFC 2822
# part is wrapped in a span of the class configured by the
# 'javascript-timezone' feature (if any); a local time before 6 o'clock is
# marked with class "atnight".
sub format_timestamp_html {
        my $date = shift;

        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');

        my $strtime = $date->{'rfc2822'};
        $strtime = qq!<span class="$datetime_class">$strtime</span>!
                if $datetime_class;

        my ($hour, $minute, $tz) = @{$date}{qw(hour_local minute_local tz_local)};
        my $clock = sprintf('%02d:%02d', $hour, $minute);
        $clock = qq(<span class="atnight">$clock</span>)
                if ($hour < 6);

        return "$strtime ($clock $tz)";
}
4385
# Print author name, author date and avatar of commit $co in long form,
# inside one element of class "author_date".
# Options:
#   -tag - name of the enclosing element, 'div' if not given
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
        my $who = format_search_author($author, "author", esc_html($author));
        my $when = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">$who [$when]$avatar</$tag>\n";
}
4400
# Print the table rows with the full author and/or committer information,
# in the format expected for 'commit' view (& similar): one row with name,
# e-mail and avatar, and a second row with the timestamp.
# The first parameter is the commit hash reference, the remaining ones name
# the people to print ('author', 'committer'); with none given, both are
# printed.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') if !@people;

        for my $who (@people) {
                my $name = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $identity =
                        format_search_author($name, $who, esc_html($name)) . " " .
                        format_search_author($email, $who, esc_html("<" . $email . ">"));
                my $avatar = git_get_avatar($email, -size => 'double');
                my $timestamp = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>$identity</td>" .
                      "<td rowspan=\"2\">$avatar</td></tr>\n" .
                      "<tr><td></td><td>$timestamp</td></tr>\n";
        }
}
4428
# Print the path of the displayed object as a row of links.
#
# Parameters:
#   $name - path of the object within the tree (may be undef)
#   $type - 'blob' or 'tree' makes the last path component a link
#           (to the blob_plain respectively tree view); with any other
#           value it is printed as plain text
#   $hb   - hash base used in all links
# The row starts with a link to the tree root labelled "[<project>]",
# followed by one 'tree' link per leading directory.
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # check the length, not the truth value: after a
                        # leading directory called "0" the separator would
                        # otherwise be left out
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # NOTE(review): the two links below use the global $file_name,
                # not the $name parameter -- confirm that callers always pass
                # the same value.
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$file_name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$file_name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4466
# Print the lines of a commit message as HTML, one "<br/>"-terminated line
# per message line.
#
# Parameters:
#   $log  - reference to the array of message lines; the title (on
#           request) and leading empty lines are removed from this array
#   %opts - '-remove_title'     drop the first line
#           '-remove_signoff'   leave out signoff-like lines
#                               (Signed-off-by, Acked-by, Cc)
#           '-final_empty_line' end the output with a single empty line
# Signoff lines are wrapped in <span class="signoff">.  Runs of empty lines
# are reduced to one, and empty lines following a printed signoff line are
# not printed at all.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $after_signoff = 0; # a signoff was printed, no other text since
        my $empty = 0;         # the last line printed was an empty one
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                                # must stay set until the next non-empty
                                # line, or the test below never sees it
                                $after_signoff = 1;
                                $empty = 0;
                        }
                        # a removed signoff line leaves the state alone, so
                        # the empty lines around it still count as one run
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $after_signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                        $after_signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4515
# Read the blob $hash with "git cat-file blob" and return its whole
# contents, which for a symlink entry is the link target.
# Returns nothing when the command cannot be started or when closing
# the pipe reports a failure.
sub git_get_link_target {
        my ($hash) = @_;

        open(my $fd, "-|", git_cmd(), "cat-file", "blob", $hash)
                or return;

        # slurp everything the command prints in one read
        my $link_target = do {
                local $/ = undef;
                <$fd>;
        };

        return unless close($fd);

        return $link_target;
}
4533
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
#   $link_target - contents of the symlink
#   $basedir     - directory containing the link, relative to the top tree;
#                  empty or undefined for the top tree itself (a trailing
#                  '/' is harmless, empty path components are dropped)
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir)
        my $path;
        if (defined $basedir && $basedir ne '') {
                # compare against '' explicitly: a directory named "0" is
                # false in boolean context but is a perfectly valid basedir
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and ''; do not test plain truthiness here,
                # it would also discard a path component named "0"
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        if (@path_parts) {
                                pop @path_parts;
                        } else {
                                # link leads outside repository (outside top dir)
                                return;
                        }
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
4573
# print tree entry (row of git_tree), but without encompassing <tr> element
#
#   $t          - hashref describing the entry; the keys used here are
#                 'mode', 'type', 'hash', 'name' and (optionally) 'size'
#   $basedir    - prefix prepended to the entry name to build file_name
#   $hash_base  - if defined, passed on as hash_base of the generated links
#   $have_blame - true if a "blame" link should be offered for blobs
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = ();
        $base_key{'hash_base'} = $hash_base if defined $hash_base;

        my $type = $t->{'type'};
        my $path = "$basedir$t->{'name'}";

        # URL of the given action applied to this very entry
        my $entry_href = sub {
                my ($act) = @_;
                return href(action=>$act, hash=>$t->{'hash'},
                            file_name=>$path, %base_key);
        };

        # The format of a table row is: mode list link.  Where mode is
        # the mode of the entry, list is the name of the entry, an href,
        # and link is the action links of the entry.

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if (exists $t->{'size'});

        # action links of the entry, joined with " | " at the very end
        my @links;

        if ($type eq "blob") {
                print "<td class=\"list\">" .
                        $cgi->a({-href => $entry_href->("blob"),
                                 -class => "list"}, esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        # symbolic link: show where it points to as well
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                print " -> " . (defined $norm_target
                                        ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                 file_name=>$norm_target),
                                                   -title => $norm_target}, esc_path($link_target))
                                        : esc_path($link_target));
                        }
                }
                print "</td>\n";

                push @links, $cgi->a({-href => $entry_href->("blob")}, "blob");
                if ($have_blame) {
                        push @links, $cgi->a({-href => $entry_href->("blame")}, "blame");
                }
                if (defined $hash_base) {
                        push @links,
                                $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                       hash=>$t->{'hash'}, file_name=>$path)},
                                        "history");
                }
                push @links,
                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                               file_name=>$path)},
                                "raw");

        } elsif ($type eq "tree") {
                print "<td class=\"list\">" .
                        $cgi->a({-href => $entry_href->("tree")},
                                esc_path($t->{'name'})) .
                        "</td>\n";

                push @links, $cgi->a({-href => $entry_href->("tree")}, "tree");
                if (defined $hash_base) {
                        push @links,
                                $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                       file_name=>$path)},
                                        "history");
                }

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";

                if (defined $hash_base) {
                        push @links,
                                $cgi->a({-href => href(action=>"history",
                                                       hash_base=>$hash_base,
                                                       file_name=>$path)},
                                        "history");
                }
        }

        print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";
}
4666
4667 ## ......................................................................
4668 ## functions printing large fragments of HTML
4669
# get pre-image filenames for merge (combined) diff
#
# Sets $diff->{'from_file'} to an array with one slot per parent; a slot is
# filled (using git_get_path_by_hash) only for parents against which the
# file is renamed ('R') or copied ('C'), the other slots stay undefined.
# Returns $diff itself.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $from_file = $diff->{'from_file'} = [ ];
        # extend the array to its final size (one slot per parent)
        $from_file->[$diff->{'nparents'} - 1] = undef;

        foreach my $i (0 .. $diff->{'nparents'} - 1) {
                my $status = $diff->{'status'}[$i];
                next unless ($status eq 'R' || $status eq 'C');

                $from_file->[$i] =
                        git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
        }

        return $diff;
}
4686
# is current raw difftree line of file deletion
#
#   $diffinfo - hashref of parsed raw diff format; only 'to_id' is used
#
# A deletion is marked by an all-zero post-image object id.  Both the
# 40 digit (SHA-1) and the 64 digit (SHA-256) null id are recognized.
sub is_deleted {
        my $diffinfo = shift;
        my $to_id = $diffinfo->{'to_id'};

        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4693
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
# True only if both arguments are defined and name the same 'to_file'.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        # nothing to compare unless both sides are present
        return !1 unless defined $diffinfo;
        return !1 unless defined $patchinfo;

        return $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4704
4705
# Print the list of files changed by a commit as an HTML table
# (<table class="diff_tree">), one row per difftree line.
#
#   $difftree - reference to an array of difftree lines; each one is
#               handed to parsed_difftree_line()
#   $hash     - id of the commit being shown; used as hash_base for links
#               to the post-image (result) side of a change
#   @parents  - ids of the parent commits; with more than one parent the
#               table gets the "combined" class, and the first parent is
#               used as hash_base for links to the pre-image side of
#               ordinary (non-combined) diff lines
#
# Uses the file-level $cgi and $action; in 'commitdiff' view every row
# additionally gets a link to the anchor "patchN" of its patch.
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1; # toggles between "dark" and "light" rows
        my $patchno = 0;   # number of the patch the current row links to
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent, describing the change against it
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # mode '000000' marks a missing side; its variables stay undefined
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file exists only in the parent, so links use $parent as base
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # 'to_id' / 'to_file' name the post-image, which lives in
                        # $hash (the new name need not exist in $parent at all),
                        # so the base commit has to be $hash, as for the other
                        # post-image links of this row
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
5013
# Print context lines and then rem/add lines in a side-by-side manner.
#
#   $ctx, $rem, $add - references to arrays of already formatted lines
#
# Context lines are shown in both the "old" and the "new" column; the
# removed/added lines that follow form a "rem", "add" or "chg" block
# depending on which of the two lists is non-empty.
sub print_sidebyside_diff_lines {
        my ($ctx, $rem, $add) = @_;
        my @html;

        # context block goes before add/rem block
        if (@$ctx) {
                push @html,
                        '<div class="chunk_block ctx">',
                                '<div class="old">', @$ctx, '</div>',
                                '<div class="new">', @$ctx, '</div>',
                        '</div>';
        }

        if (@$add && @$rem) {
                # lines changed: old and new side next to each other
                push @html,
                        '<div class="chunk_block chg">',
                                '<div class="old">', @$rem, '</div>',
                                '<div class="new">', @$add, '</div>',
                        '</div>';
        } elsif (@$add) {
                # pure addition
                push @html,
                        '<div class="chunk_block add">',
                                '<div class="new">', @$add, '</div>',
                        '</div>';
        } else {
                # pure removal (nothing was added)
                push @html,
                        '<div class="chunk_block rem">',
                                '<div class="old">', @$rem, '</div>',
                        '</div>';
        }

        print join('', @html);
}
5059
# Print context lines and then rem/add lines in inline manner.
#
#   $ctx, $rem, $add - references to arrays of already formatted lines;
#                      they are printed as they are, in this order
sub print_inline_diff_lines {
        my ($ctx, $rem, $add) = @_;

        print map { @{$_} } ($ctx, $rem, $add);
}
5066
# Format removed and added line, mark changed part and HTML-format them.
# Implementation is based on contrib/diff-highlight
#
#   $rem, $add   - the removed and the added line
#   $num_parents - number of leading +/- columns to leave out of the
#                  common prefix computation
#
# Returns the two lines as formatted by format_diff_line().
sub format_rem_add_lines_pair {
        my ($rem, $add, $num_parents) = @_;

        # Tabs have to be expanded before the lines are split into
        # characters; otherwise the offsets computed below would be invalid.
        chomp $rem;
        chomp $add;
        $rem = untabify($rem);
        $add = untabify($add);

        my @rem_chars = split(//, $rem);
        my @add_chars = split(//, $add);
        my $limit = (@rem_chars < @add_chars) ? scalar(@rem_chars)
                                              : scalar(@add_chars);

        # Length of the common prefix, not counting the leading +/-
        # characters (one for each parent).
        my $prefix_len = $num_parents;
        my $prefix_has_nonspace;
        while ($prefix_len < $limit &&
               $rem_chars[$prefix_len] eq $add_chars[$prefix_len]) {
                $prefix_has_nonspace = 1 if ($rem_chars[$prefix_len] !~ /\s/);
                $prefix_len++;
        }

        # Length of the common suffix; it may not overlap the prefix.
        my $suffix_len = 0;
        my $suffix_has_nonspace;
        while ($prefix_len + $suffix_len < $limit &&
               $rem_chars[-1 - $suffix_len] eq $add_chars[-1 - $suffix_len]) {
                $suffix_has_nonspace = 1 if ($rem_chars[-1 - $suffix_len] !~ /\s/);
                $suffix_len++;
        }

        # Mark lines that are different from each other, but have some common
        # part that isn't whitespace.  If lines are completely different, don't
        # mark them because that would make output unreadable, especially if
        # diff consists of multiple lines.
        my ($esc_rem, $esc_add);
        if ($prefix_has_nonspace || $suffix_has_nonspace) {
                $esc_rem = esc_html_hl_regions($rem, 'marked',
                        [$prefix_len, @rem_chars - $suffix_len], -nbsp=>1);
                $esc_add = esc_html_hl_regions($add, 'marked',
                        [$prefix_len, @add_chars - $suffix_len], -nbsp=>1);
        } else {
                $esc_rem = esc_html($rem, -nbsp=>1);
                $esc_add = esc_html($add, -nbsp=>1);
        }

        return format_diff_line(\$esc_rem, 'rem'),
               format_diff_line(\$esc_add, 'add');
}
5118
# HTML-format the context, removed and added lines of one group.
# Takes array references $ctx, $rem, $add and the number of parents;
# returns three references to new arrays of formatted lines, in the
# order (context, removed, added).
sub format_ctx_rem_add_lines {
        my ($ctx, $rem, $add, $num_parents) = @_;
        my $is_combined = ($num_parents > 1);

        # Changed parts can be highlighted only when every removed line
        # has exactly one corresponding added line.
        my $can_highlight = (@$add > 0 && @$add == @$rem) ? 1 : 0;

        # In a combined diff, highlight only if each rem/add pair is a
        # diff against the same version, e.g.
        #
        #    - a
        #   -  b
        #    + c
        #   +  d
        #
        # Otherwise the highlighting would be confusing.
        if ($can_highlight && $is_combined) {
                foreach my $i (0 .. $#$add) {
                        my $prefix_rem = substr($rem->[$i], 0, $num_parents);
                        my $prefix_add = substr($add->[$i], 0, $num_parents);

                        # compare marker columns with '-' mapped to '+'
                        $prefix_rem =~ tr/-/+/;

                        if ($prefix_rem ne $prefix_add) {
                                $can_highlight = 0;
                                last;
                        }
                }
        }

        my (@new_rem, @new_add);
        if ($can_highlight) {
                foreach my $i (0 .. $#$add) {
                        my ($line_rem, $line_add) = format_rem_add_lines_pair(
                                $rem->[$i], $add->[$i], $num_parents);
                        push @new_rem, $line_rem;
                        push @new_add, $line_add;
                }
        } else {
                foreach my $line (@$rem) {
                        push @new_rem, format_diff_line($line, 'rem');
                }
                foreach my $line (@$add) {
                        push @new_add, format_diff_line($line, 'add');
                }
        }

        my @new_ctx;
        foreach my $line (@$ctx) {
                push @new_ctx, format_diff_line($line, 'ctx');
        }

        return (\@new_ctx, \@new_rem, \@new_add);
}
5170
# Format one group of context/removed/added lines and print it in the
# requested style.  The side-by-side layout is used only when
# $diff_style is 'sidebyside' and the diff is not a combined one (at
# most one parent); everything else, including unknown styles, is
# printed inline.
sub print_diff_lines {
        my ($ctx, $rem, $add, $diff_style, $num_parents) = @_;
        my $is_combined = $num_parents > 1;

        my ($fmt_ctx, $fmt_rem, $fmt_add) =
                format_ctx_rem_add_lines($ctx, $rem, $add, $num_parents);

        if ($diff_style ne 'sidebyside' || $is_combined) {
                # default 'inline' style and unknown styles
                print_inline_diff_lines($fmt_ctx, $fmt_rem, $fmt_add);
        } else {
                print_sidebyside_diff_lines($fmt_ctx, $fmt_rem, $fmt_add);
        }
}
5186
# Print one diff chunk.  @chunk is a list of [ $class, $line ] pairs;
# chunk header lines are printed immediately, while 'ctx', 'rem' and
# 'add' lines are collected and printed in groups via print_diff_lines().
# $from and $to are passed through to format_diff_line() for the chunk
# header.
sub print_diff_chunk {
        my ($diff_style, $num_parents, $from, $to, @chunk) = @_;

        return unless @chunk;

        # An 'incomplete' line (missing final newline) takes the class of
        # the line right before it, so it ends up among the removed, added
        # or context lines it belongs to.
        foreach my $idx (1 .. $#chunk) {
                $chunk[$idx][0] = $chunk[$idx - 1][0]
                        if ($chunk[$idx][0] eq 'incomplete');
        }

        # accumulators for the group being collected
        my (@ctx, @rem, @add);
        # class of the previously accumulated line
        my $prev_class = '';

        # the trailing empty pair is a sentinel that forces a final flush
        foreach my $entry (@chunk, ["", ""]) {
                my ($class, $line) = @$entry;

                # chunk headers are printed directly
                if ($class && $class eq 'chunk_header') {
                        print format_diff_line($line, $class, $from, $to);
                        next;
                }

                # Flush the accumulators at the end of the chunk, when a
                # context line follows some add/rem lines, or when both rem
                # and add lines are present and a new block starts
                # (otherwise add/rem lines could be reordered).
                if (!$class ||
                    ($class eq 'ctx' && (@rem || @add)) ||
                    (@rem && @add && $class ne $prev_class)) {
                        print_diff_lines(\@ctx, \@rem, \@add,
                                         $diff_style, $num_parents);
                        @ctx = ();
                        @rem = ();
                        @add = ();
                }

                # sentinel reached: nothing more to accumulate
                last unless $line;

                if ($class eq 'rem') {
                        push @rem, $line;
                } elsif ($class eq 'add') {
                        push @add, $line;
                } elsif ($class eq 'ctx') {
                        push @ctx, $line;
                }

                $prev_class = $class;
        }
}
5244
# Read a patchset from filehandle $fd and print it as HTML, wrapped in
# <div class="patchset">.
#
# Parameters:
#   $fd           - filehandle the patch text is read from, line by line
#   $diff_style   - passed on to print_diff_chunk()
#   $difftree     - reference to an array of raw difftree lines; each one
#                   is handed to parsed_difftree_line()
#   $hash         - accepted but not referenced in this sub
#   @hash_parents - parent hashes; more than one means a combined diff
#
# Every patch is printed inside <div class="patch" id="patchN">, where N
# is the 1-based index of the matching entry in @$difftree.  When no patch
# was printed at all, a "Trivial merge" / "No differences found" notice is
# printed instead.
sub git_patchset_body {
        my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;
        my ($hash_parent) = $hash_parents[0];

        my $is_combined = (@hash_parents > 1);
        # index into @$difftree of the raw line for the current patch
        my $patch_idx = 0;
        # number of patches printed so far
        my $patch_number = 0;
        my $patch_line;
        my $diffinfo;
        my $to_name;
        my (%from, %to);
        my @chunk; # for side-by-side diff

        print "<div class=\"patchset\">\n";

        # skip to first patch
        while ($patch_line = <$fd>) {
                chomp $patch_line;

                last if ($patch_line =~ m/^diff /);
        }

 PATCH:
        # Each iteration starts with $patch_line holding a "diff ..." header
        # line; the loop ends when input is exhausted ($patch_line is false).
        while ($patch_line) {

                # parse "git diff" header line
                if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
                        # $1 is from_name, which we do not use
                        $to_name = unquote($2);
                        $to_name =~ s!^b/!!;
                } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
                        # $1 is 'cc' or 'combined', which we do not use
                        $to_name = unquote($2);
                } else {
                        $to_name = undef;
                }

                # check if current patch belong to current raw line
                # and parse raw git-diff line if needed
                if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
                        # this is continuation of a split patch
                        print "<div class=\"patch cont\">\n";
                } else {
                        # advance raw git-diff output if needed
                        $patch_idx++ if defined $diffinfo;

                        # read and prepare patch information
                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                        # compact combined diff output can have some patches skipped
                        # find which patch (using pathname of result) we are at now;
                        if ($is_combined) {
                                # NOTE(review): $to_name is undef when the header
                                # line matched neither pattern above; 'ne' would
                                # then warn -- confirm this cannot happen here.
                                while ($to_name ne $diffinfo->{'to_file'}) {
                                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                                              format_diff_cc_simplified($diffinfo, @hash_parents) .
                                              "</div>\n";  # class="patch"

                                        $patch_idx++;
                                        $patch_number++;

                                        last if $patch_idx > $#$difftree;
                                        $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
                                }
                        }

                        # modifies %from, %to hashes
                        parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

                        # this is first patch for raw difftree line with $patch_idx index
                        # we index @$difftree array from 0, but number patches from 1
                        print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
                }

                # git diff header
                #assert($patch_line =~ m/^diff /) if DEBUG;
                #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
                $patch_number++;
                # print "git diff" header
                print format_git_diff_header_line($patch_line, $diffinfo,
                                                  \%from, \%to);

                # print extended diff header
                print "<div class=\"diff extended_header\">\n";
        EXTENDED_HEADER:
                # consume lines up to the "--- " from-file line or the next
                # "diff " header, whichever comes first
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

                        print format_extended_diff_header_line($patch_line, $diffinfo,
                                                               \%from, \%to);
                }
                print "</div>\n"; # class="diff extended_header"

                # from-file/to-file diff header
                if (! $patch_line) {
                        # input ended inside the extended header; 'last' skips
                        # the continue block, so the patch div is closed here
                        print "</div>\n"; # class="patch"
                        last PATCH;
                }
                # patch without from-file/to-file header and without body;
                # the continue block closes the patch div
                next PATCH if ($patch_line =~ m/^diff /);
                #assert($patch_line =~ m/^---/) if DEBUG;

                my $last_patch_line = $patch_line;
                # NOTE(review): if input ends right after the '---' line,
                # <$fd> yields undef and chomp would warn -- confirm that a
                # '+++' line always follows.
                $patch_line = <$fd>;
                chomp $patch_line;
                #assert($patch_line =~ m/^\+\+\+/) if DEBUG;

                print format_diff_from_to_header($last_patch_line, $patch_line,
                                                 $diffinfo, \%from, \%to,
                                                 @hash_parents);

                # the patch itself
        LINE:
                while ($patch_line = <$fd>) {
                        chomp $patch_line;

                        next PATCH if ($patch_line =~ m/^diff /);

                        my $class = diff_line_class($patch_line, \%from, \%to);

                        # a new chunk header flushes the previously collected chunk
                        if ($class eq 'chunk_header') {
                                print_diff_chunk($diff_style, scalar @hash_parents, \%from, \%to, @chunk);
                                @chunk = ();
                        }

                        push @chunk, [ $class, $patch_line ];
                }

        } continue {
                # runs after every iteration (including 'next PATCH'), but not
                # after 'last PATCH': flush the pending chunk, close the patch
                if (@chunk) {
                        print_diff_chunk($diff_style, scalar @hash_parents, \%from, \%to, @chunk);
                        @chunk = ();
                }
                print "</div>\n"; # class="patch"
        }

        # for compact combined (--cc) format, with chunk and patch simplification
        # the patchset might be empty, but there might be unprocessed raw lines
        # (the loop initializer steps past the last handled raw line, but only
        # when at least one patch has been counted)
        for (++$patch_idx if $patch_number > 0;
             $patch_idx < @$difftree;
             ++$patch_idx) {
                # read and prepare patch information
                $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

                # generate anchor for "patch" links in difftree / whatchanged part
                print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
                      format_diff_cc_simplified($diffinfo, @hash_parents) .
                      "</div>\n";  # class="patch"

                $patch_number++;
        }

        if ($patch_number == 0) {
                if (@hash_parents > 1) {
                        print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
                } else {
                        print "<div class=\"diff nodifferences\">No differences found</div>\n";
                }
        }

        print "</div>\n"; # class="patchset"
}
5407
5408 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5409
# Print the project search form (<div class="projsearch">): a text field
# pre-filled with $searchtext, a 're' checkbox reflecting
# $search_use_regexp, a submit button and a "List all projects" link.
# When the global $project_filter is set, it is carried in a hidden 'pf'
# field and mentioned in the field title and in the link text.
sub git_project_search_form {
        my ($searchtext, $search_use_regexp) = @_;

        my $limit = $project_filter ? " in '$project_filter/'" : '';

        my $form = "<div class=\"projsearch\">\n";
        $form .= $cgi->startform(-method => 'get', -action => $my_uri);
        $form .= $cgi->hidden(-name => 'a', -value => 'project_list');
        $form .= "\n";
        if (defined $project_filter) {
                $form .= $cgi->hidden(-name => 'pf', -value => $project_filter);
                $form .= "\n";
        }
        $form .= $cgi->textfield(-name => 's', -value => $searchtext,
                                 -title => "Search project by name and description$limit",
                                 -size => 60);
        $form .= "\n";
        $form .= "<span title=\"Extended regular expression\">";
        $form .= $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                                -checked => $search_use_regexp);
        $form .= "</span>\n";
        $form .= $cgi->submit(-name => 'btnS', -value => 'Search');
        $form .= $cgi->end_form();
        $form .= "\n";
        $form .= $cgi->a({-href => href(project => undef, searchtext => undef,
                                        project_filter => $project_filter)},
                         esc_html("List all projects$limit"));
        $form .= "<br />\n";
        $form .= "</div>\n";

        print $form;
}
5437
# Tell whether %$project_info still lacks any of the given @keys.
# Returns 1 if at least one key does not exist in the hash (even an
# undefined value counts as present); otherwise returns nothing
# (empty list / undef).
sub project_info_needs_filling {
        my ($project_info, @keys) = @_;

        # same as: List::MoreUtils::any { !exists $project_info->{$_} } @keys
        my @missing = grep { !exists $project_info->{$_} } @keys;
        return 1 if @missing;

        return;
}
5451
# Fill in project info (age, description, owner, ctags, category) for
# every project in @$projlist and return the list of projects that were
# kept.  With @wanted_keys given, only those fields are considered.
#
# A project is dropped from the returned list only while 'age' /
# 'age_string' are being filled and git_get_last_activity() returns
# nothing for it; the other fields never cause a project to be dropped.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   ensures that 'descr_long' and 'ctags' fields are filled
# * @project_list = fill_project_list_info(\@project_list)
#   ensures that all fields are filled (and invalid projects removed)
#
# NOTE: modifies the entries of $projlist, but does not remove entries
# from it
sub fill_project_list_info {
        my ($projlist, @wanted_keys) = @_;
        my @projects;

        # $filter_set narrows a list of field names down to the wanted
        # ones; without @wanted_keys every field is wanted
        my %is_wanted = map { $_ => 1 } @wanted_keys;
        my $filter_set = @wanted_keys
                ? sub { return grep { $is_wanted{$_} } @_; }
                : sub { return @_; };

        my $show_ctags = gitweb_check_feature('ctags');
 PROJECT:
        foreach my $pr (@$projlist) {
                if (project_info_needs_filling($pr, $filter_set->('age', 'age_string'))) {
                        my (@activity) = git_get_last_activity($pr->{'path'});
                        # no activity info: leave this project out of the result
                        next PROJECT unless @activity;
                        @{$pr}{'age', 'age_string'} = @activity;
                }

                if (project_info_needs_filling($pr, $filter_set->('descr', 'descr_long'))) {
                        my $descr = git_get_project_description($pr->{'path'}) || "";
                        $descr = to_utf8($descr);
                        $pr->{'descr_long'} = $descr;
                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }

                if (project_info_needs_filling($pr, $filter_set->('owner'))) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }

                if ($show_ctags &&
                    project_info_needs_filling($pr, $filter_set->('ctags'))) {
                        $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
                }

                if ($projects_list_group_categories &&
                    project_info_needs_filling($pr, $filter_set->('category'))) {
                        my $cat = git_get_project_category($pr->{'path'}) ||
                                  $project_list_default_category;
                        $pr->{'category'} = to_utf8($cat);
                }

                push @projects, $pr;
        }

        return @projects;
}
5512
# Return the projects of @$projlist sorted according to $order, which is
# one of 'project', 'descr', 'owner' (string comparison) or 'age'
# (numeric comparison).  Any other $order returns the list unsorted.
sub sort_projects_list {
        my ($projlist, $order) = @_;

        # sort order name => project field to compare and how to compare it
        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );

        my $spec = $order_info{$order};
        return @$projlist unless defined $spec;

        my $field = $spec->{'key'};
        my @sorted;
        if ($spec->{'type'} ne 'str') {
                @sorted = sort { $a->{$field} <=> $b->{$field} } @$projlist;
        } else {
                @sorted = sort { $a->{$field} cmp $b->{$field} } @$projlist;
        }

        return @sorted;
}
5533
# Group the projects at indices $from..$to (inclusive) of @$projlist by
# their 'category' field.  $from defaults to 0; $to defaults to, and is
# capped at, the last index.  Returns a hash mapping each category to a
# reference to the array of its projects (in input order): the hash
# itself in list context, a reference to it in scalar context.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my %by_category;
        foreach my $idx ($from .. $to) {
                my $project = $projlist->[$idx];
                push @{ $by_category{ $project->{'category'} } }, $project;
        }

        return %by_category if wantarray;
        return \%by_category;
}
5550
# Print the 'sort by' <th> element built by format_sort_th(); takes the
# same arguments: ($name, $order, $header).
sub print_sort_th {
        my ($name, $order, $header) = @_;

        print format_sort_th($name, $order, $header);
}
5556
# Build a table header cell for the sort column $name.  $header is the
# visible text and defaults to ucfirst($name).  When $order already
# equals $name the cell is plain text; otherwise the text is a link that
# replays the current request with order set to $name.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # already sorted by this column: no link needed
        return "<th>$header</th>\n" if ($order eq $name);

        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
5573
# Print one table row per project for the entries $from..$to (inclusive)
# of @$projlist.  $from defaults to 0; $to defaults to, and is capped
# at, the last index.  With $check_forks set, each row starts with an
# extra cell holding a "+" marker for projects that have a 'forks' entry.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];

                # rows alternate between the "dark" and "light" classes
                my $row_class = $dark_row ? "dark" : "light";
                print "<tr class=\"$row_class\">\n";
                $dark_row = !$dark_row;

                # forks marker cell
                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                my $nforks = scalar @{$pr->{'forks'}};
                                my $forks_title = "$nforks forks";
                                if ($nforks > 0) {
                                        print $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
                                                       -title => $forks_title}, "+");
                                } else {
                                        print $cgi->span({-title => $forks_title}, "+");
                                }
                        }
                        print "</td>\n";
                }

                # project name, with search matches highlighted
                print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                        -class => "list"},
                                       esc_html_match_hl($pr->{'path'}, $search_regexp)) .
                      "</td>\n";

                # description: shortened text, full text as tooltip
                print "<td>" . $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                        -class => "list",
                                        -title => $pr->{'descr_long'}},
                                        $search_regexp
                                        ? esc_html_match_hl_chopped($pr->{'descr_long'},
                                                                    $pr->{'descr'}, $search_regexp)
                                        : esc_html($pr->{'descr'})) .
                      "</td>\n";

                # owner
                print "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";

                # age of last change
                my $age_text = defined $pr->{'age_string'}
                        ? $pr->{'age_string'}
                        : "No commits";
                my $row_tail = "<td class=\"" . age_class($pr->{'age'}) . "\">" .
                               $age_text . "</td>\n";

                # action links, plus a "forks" link when the project has forks
                my @links;
                foreach my $action (qw(summary shortlog log tree)) {
                        push @links, scalar $cgi->a(
                                {-href => href(project=>$pr->{'path'}, action=>$action)},
                                $action);
                }
                if ($pr->{'forks'}) {
                        push @links, scalar $cgi->a(
                                {-href => href(project=>$pr->{'path'}, action=>"forks")},
                                "forks");
                }
                $row_tail .= "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
                             "</tr>\n";

                print $row_tail;
        }
}
5629
# Print the projects table (<table class="project_list">) for @$projlist.
#
# Parameters:
#   $projlist  - reference to the array of project entries
#   $order     - sort order; defaults to $default_projects_order
#   $from, $to - inclusive window of projects to show, applied after
#                filtering and sorting; $from defaults to 0, $to defaults
#                to (and is capped at) the last index
#   $extra     - if defined, printed in an additional last table row
#   $no_header - if true, the row of sort headers is omitted
#
# Forks are filtered out, and the forks column is shown, only when the
# 'forks' feature is enabled and neither a tag filter nor a search is
# active.  If the window is empty, a "No such projects found" notice is
# printed instead of the table.
sub git_project_list_body {
        # actually uses global variable $project
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
        $check_forks = undef
                if ($tagfilter || $search_regexp);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        # search_projects_list pre-fills required info
        @projects = search_projects_list(\@projects,
                                         'search_regexp' => $search_regexp,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $search_regexp);
        # fill the rest
        @projects = fill_project_list_info(\@projects);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds exactly the window, re-indexed from 0,
                # so group all of it; passing $from/$to again would apply the
                # window a second time and drop projects whenever $from > 0
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects in the "" category are listed without a
                        # category heading row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5717
# Print the 'log' view body: for each commit in the window a header div,
# the commit / commitdiff / tree links, the authorship line and the full
# commit message.
#
# Parameters:
#   $commitlist - reference to an array of commit info hash references
#   $from, $to  - inclusive window of commits to print; $from defaults to
#                 0, $to defaults to (and is capped at) the last index
#   $refs       - passed to format_ref_marker() to decorate commit titles
#   $extra      - if true, printed afterwards inside <div class="page_nav">
sub git_log_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # start at $from (the loop used to start at 0 and ignore $from,
        # unlike git_shortlog_body and git_history_body)
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                # skip entries without commit info
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5756
# Print the 'shortlog' table: one row per commit in the inclusive window
# $from..$to of @$commitlist, with date, author, subject and the
# commit / commitdiff / tree (and snapshot) links.  $from defaults to 0;
# $to defaults to, and is capped at, the last index.  If $extra is
# defined it is printed in an additional last row.
sub git_shortlog_body {
        # uses global variable $project
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        print "<table class=\"shortlog\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between the "dark" and "light" classes
                my $row_class = $dark_row ? "dark" : "light";
                print "<tr class=\"$row_class\">\n";
                $dark_row = !$dark_row;

                # git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $links = "</td>\n" .
                            "<td class=\"link\">";
                $links .= $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
                $links .= " | ";
                $links .= $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                $links .= " | ";
                $links .= $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
                print $links;

                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links
                        if (defined $snapshot_links);

                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5800
# Print the "history" table for a single path: one row per commit in
# $commitlist->[$from..$to] with age, author, subject and links to the
# object at that commit ($ftype action), its commitdiff and -- for blobs
# whose content differs from $file_hash -- a "diff to current" blobdiff.
#
# $from defaults to 0; $to defaults to, and is clamped at, the last index.
# Empty commit entries are skipped.  When $extra is defined it is printed as
# a final row.  Reads the global $hash_base for the blobdiff link.
sub git_history_body {
        # Warning: assumes constant type (blob or tree) during history
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        my $last_index = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last_index if (!defined $to || $last_index < $to);

        print "<table class=\"history\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                # rows alternate between the "dark" and "light" CSS classes
                my $row_class = $dark_row ? "dark" : "light";
                print "<tr class=\"$row_class\">\n";
                $dark_row = !$dark_row;

                my $age_cell = "<td title=\"$co{'age_string_age'}\">" .
                               "<i>$co{'age_string_date'}</i></td>\n";
                # shortlog:   format_author_html('td', \%co, 10)
                print $age_cell . format_author_html('td', \%co, 15, 3) . "<td>";
                # originally git_history used chop_str($co{'title'}, 50)
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $object_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit,
                                                         file_name=>$file_name)}, $ftype);
                my $diff_link   = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)},
                                          "commitdiff");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $object_link . " | " . $diff_link;

                if ($ftype eq 'blob') {
                        my $blob_current = $file_hash;
                        my $blob_parent  = git_get_hash_by_path($commit, $file_name);
                        my $content_differs = defined $blob_current
                                           && defined $blob_parent
                                           && $blob_current ne $blob_parent;
                        if ($content_differs) {
                                my $blobdiff_href = href(action=>"blobdiff",
                                                         hash=>$blob_current, hash_parent=>$blob_parent,
                                                         hash_base=>$hash_base, hash_parent_base=>$commit,
                                                         file_name=>$file_name);
                                print " | " .
                                        $cgi->a({-href => $blobdiff_href}, "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5860
# Print the "tags" table for entries $from..$to of @$taglist: age, tag name
# (linked to the tagged object), shortened subject, a "tag" self link for
# tag objects and action links that depend on the type of the tagged object.
#
# $from defaults to 0; $to defaults to, and is clamped at, the last index.
# When $extra is defined it is printed as a final row spanning five columns.
sub git_tags_body {
        # uses global variable $project
        my ($taglist, $from, $to, $extra) = @_;

        my $last_index = $#{$taglist};
        $from = 0 unless defined $from;
        $to = $last_index unless (defined $to && $to <= $last_index);

        print "<table class=\"tags\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %tag = %{$taglist->[$idx]};
                my $comment = $tag{'subject'};
                my $comment_short;
                $comment_short = chop_str($comment, 30, 5) if defined $comment;

                # rows alternate between the "dark" and "light" CSS classes
                my $row_class = $dark_row ? "dark" : "light";
                print "<tr class=\"$row_class\">\n";
                $dark_row = !$dark_row;

                # the age cell is left empty when no age is known
                my $age_cell = "<td></td>\n";
                $age_cell = "<td><i>$tag{'age'}</i></td>\n" if defined $tag{'age'};
                print $age_cell;

                my $name_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                                         -class => "list name"}, esc_html($tag{'name'}));
                print "<td>" .
                      $name_link .
                      "</td>\n" .
                      "<td>";
                if (defined $comment) {
                        print format_subject_html($comment, $comment_short,
                                                  href(action=>"tag", hash=>$tag{'id'}));
                }
                print "</td>\n" .
                      "<td class=\"selflink\">";
                # only real tag objects get a link to the "tag" view
                if ($tag{'type'} ne "tag") {
                        print "&nbsp;";
                } else {
                        print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                }

                my $object_link = $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})},
                                          $tag{'reftype'});
                print "</td>\n" .
                      "<td class=\"link\">" . " | " .
                      $object_link;
                if ($tag{'reftype'} eq "commit") {
                        my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})},
                                                    "shortlog");
                        my $log_link      = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})},
                                                    "log");
                        print " | " . $shortlog_link .
                              " | " . $log_link;
                } elsif ($tag{'reftype'} eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5923
# Print the "heads" table for entries $from..$to of @$headlist: age, branch
# name and shortlog / log / tree links.  The name cell of the entry whose id
# equals $head_at (when $head_at is defined) gets the "current_head" class.
#
# $from defaults to 0; $to defaults to, and is clamped at, the last index.
# When $extra is defined it is printed as a final row spanning three columns.
sub git_heads_body {
        # uses global variable $project
        my ($headlist, $head_at, $from, $to, $extra) = @_;

        my $last_index = $#{$headlist};
        $from = 0 unless defined $from;
        $to = $last_index unless (defined $to && $to <= $last_index);

        print "<table class=\"heads\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %ref = %{$headlist->[$idx]};
                my $curr = defined $head_at && $ref{'id'} eq $head_at;

                # rows alternate between the "dark" and "light" CSS classes
                my $row_class = $dark_row ? "dark" : "light";
                print "<tr class=\"$row_class\">\n";
                $dark_row = !$dark_row;

                my $name_cell_open = $curr ? "<td class=\"current_head\">" : "<td>";
                my $name_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                                         -class => "list name"},esc_html($ref{'name'}));
                my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})},
                                            "shortlog");
                my $log_link      = $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})},
                                            "log");
                my $tree_link     = $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'},
                                                           hash_base=>$ref{'fullname'})}, "tree");

                print "<td><i>$ref{'age'}</i></td>\n" .
                      $name_cell_open .
                      $name_link .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", $shortlog_link, $log_link, $tree_link) .
                      "</td>\n" .
                      "</tr>";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5961
# Display a single remote block
#
# Prints a small table with the remote's URL(s) followed by the list of its
# heads (via git_heads_body).
#
#   $remote - remote name, used for the "..." link to the 'remotes' action
#   $rdata  - hash ref with the keys 'heads' (array ref), 'fetch' and 'push'
#             (URLs; either may be undefined)
#   $limit  - if defined and smaller than the number of heads, a "..." link
#             is passed to git_heads_body as the extra row
#   $head   - passed to git_heads_body as the id of the current head
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # Guard the comparison: a remote may have a fetch URL but no
                # push URL, and comparing against undef would emit an
                # "uninitialized value" warning.
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        # $dots stays undefined (no extra row) unless the head list is truncated
        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5995
# Display a list of remote names with the respective fetch and push URLs
#
#   $remotedata - hash ref keyed by remote name; each value is a hash ref
#                 whose 'fetch' and 'push' entries (if defined) are used as
#                 link targets
#   $limit      - if true and smaller than the number of remotes, only the
#                 first $limit names (in sorted order) are listed, followed
#                 by a "..." row linking to the 'remotes' action
sub git_remotes_list {
        my ($remotedata, $limit) = @_;
        print "<table class=\"heads\">\n";
        my $alternate = 1;
        my @remotes = sort keys %$remotedata;

        my $limited = $limit && $limit < @remotes;

        # truncate the list to its first $limit entries
        $#remotes = $limit - 1 if $limited;

        # Iterate with foreach rather than "while (my $remote = shift ...)":
        # the latter would stop early at a remote whose name is false in
        # boolean context (e.g. a remote called "0").
        foreach my $remote (@remotes) {
                my $rdata = $remotedata->{$remote};
                my $fetch = $rdata->{'fetch'};
                my $push = $rdata->{'push'};
                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;
                print "<td>" .
                      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
                               -class=> "list name"},esc_html($remote)) .
                      "</td>";
                # a missing URL is shown as plain text instead of a link
                print "<td class=\"link\">" .
                      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
                      " | " .
                      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
                      "</td>";

                print "</tr>\n";
        }

        if ($limited) {
                print "<tr>\n" .
                      "<td colspan=\"3\">" .
                      $cgi->a({-href => href(action=>"remotes")}, "...") .
                      "</td>\n" . "</tr>\n";
        }

        print "</table>";
}
6039
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
#   $remotedata - hash ref keyed by remote name
#   $limit      - if true and smaller than the number of remotes, only the
#                 list of names is shown (git_remotes_list); it is also
#                 passed on to git_remote_block for each remote
#   $head       - passed on to git_remote_block
sub git_remotes_body {
        my ($remotedata, $limit, $head) = @_;
        if ($limit and $limit < keys %$remotedata) {
                git_remotes_list($remotedata, $limit);
        } else {
                fill_remote_heads($remotedata);
                # Walk the remotes in sorted order, like git_remotes_list does,
                # so that the sections appear in a stable order instead of the
                # arbitrary hash order produced by each().
                foreach my $remote (sort keys %$remotedata) {
                        my $rdata = $remotedata->{$remote};
                        git_print_section({-class=>"remote", -id=>$remote},
                                ["remotes", $remote, $remote], sub {
                                        git_remote_block($remote, $rdata, $limit, $head);
                                });
                }
        }
}
6056
# Search commit messages, authors or committers (selected by the global
# $searchtype) for the global $searchtext and print one page of results.
#
# Takes the parsed commit (as a flat hash) the search starts from; its
# 'tree' and 'title' are used for the navigation bar and the header.  Up to
# 101 commits are requested per page so that the presence of a next page
# can be detected; at most 100 of them are shown.
sub git_search_message {
        my %co = @_;

        # git-log option that corresponds to each supported search type
        my %grep_option_for = (
                'commit'    => "--grep=",
                'author'    => "--author=",
                'committer' => "--committer=",
        );
        my $greptype = $grep_option_for{$searchtype};
        $greptype .= $searchtext;

        my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
        my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
                                       $greptype, '--regexp-ignore-case',
                                       $match_mode);

        # "first" and "prev" are links only when we are past the first page
        my $paging_nav = '';
        if ($page <= 0) {
                $paging_nav .= "first &sdot; prev";
        } else {
                my $first_link = $cgi->a({-href => href(-replay=>1, page=>undef)},
                                         "first");
                my $prev_link  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                          -accesskey => "p", -title => "Alt-p"}, "prev");
                $paging_nav .= $first_link . " &sdot; " . $prev_link;
        }

        # a 101st commit means that there is at least one more page
        my $next_link = '';
        if ($#commitlist < 100) {
                $paging_nav .= " &sdot; next";
        } else {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
                $paging_nav .= " &sdot; $next_link";
        }

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);
        if ($page == 0 && !@commitlist) {
                print "<p>No match.</p>\n";
        } else {
                git_search_grep_body(\@commitlist, 0, 99, $next_link);
        }

        git_footer_html();
}
6106
# Pickaxe search: run "git log -S<searchtext>" and print a table with one
# row per matching commit, listing under the commit subject the files whose
# raw diff lines were reported for that commit.
#
# Takes the parsed commit (as a flat hash) used for the navigation bar and
# header; %co is then reused to hold the commit currently being printed.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        my @pickaxe_opts = ("-S$searchtext");
        push @pickaxe_opts, '--pickaxe-regex' if $search_use_regexp;
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', @pickaxe_opts
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $dark_row = 1;
        undef %co;
        my @files;

        # Close the file-list cell of the commit held in %co and print its
        # links cell; does nothing while no commit has been seen yet.
        my $finish_commit_row = sub {
                return unless %co;
                my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                                          "commit");
                my $tree_link   = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                                         hash_base=>$co{'id'})},
                                          "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $commit_link .
                      " | " .
                      $tree_link .
                      "</td>\n" .
                      "</tr>\n";
        };

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # finish previous commit
                        $finish_commit_row->();

                        # rows alternate between the "dark" and "light" CSS classes
                        my $row_class = $dark_row ? "dark" : "light";
                        print "<tr class=\"$row_class\">\n";
                        $dark_row = !$dark_row;

                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        my $subject_link =
                                $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                        -class => "list subject"},
                                        chop_and_escape_str($co{'title'}, 50) . "<br/>");
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $subject_link;
                } elsif (defined $set{'to_id'}) {
                        # an all-zero destination id is skipped (no blob to link to)
                        next if ($set{'to_id'} =~ m/^0{40}$/);

                        my $blob_href = href(action=>"blob", hash_base=>$co{'id'},
                                             hash=>$set{'to_id'}, file_name=>$set{'to_file'});
                        print $cgi->a({-href => $blob_href,
                                      -class => "list"},
                                      "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
                              "<br/>\n";
                }
        }
        close $fd;

        # finish last commit
        $finish_commit_row->();

        print "</table>\n";

        git_footer_html();
}
6189
# Grep search: run "git grep" for the global $searchtext in the tree of the
# given commit and print a table with one row per matching file, listing
# the matching lines (with the match highlighted) or a "Binary file" note.
#
# Takes the parsed commit as a flat hash; its 'tree', 'id' and 'title' are
# used.  Output is trimmed after roughly 1000 lines of git-grep output.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        my $lastfile = '';
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                last if ($matches++ > 1000);
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        # with -z the file name, line number and text are NUL-separated
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                }
                # Names are reported as "<tree>:<path>" when grepping a tree;
                # strip the prefix for binary matches as well, so that the
                # link and the displayed name refer to the plain path.
                $file =~ s/^\Q$co{'tree'}\E://;

                if ($file ne $lastfile) {
                        # close the previous file's row; compare against ''
                        # so that a file named "0" is handled correctly
                        print "</td></tr>\n" if $lastfile ne '';
                        # toggle the flag so that rows really alternate
                        # (a post-incremented counter would always be true)
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # highlight the match within the line
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if ($lastfile ne '') {
                print "</td></tr>\n";
                if ($matches > 1000) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
6267
# Print the "commit_search" table for entries $from..$to of @$commitlist:
# age, author, subject, the comment lines that match the global
# $search_regexp (match highlighted, context shortened) and commit /
# commitdiff / tree links.
#
# $from defaults to 0; $to defaults to, and is clamped at, the last index.
# Empty commit entries are skipped.  When $extra is defined it is printed as
# a final row.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;

        my $last_index = $#{$commitlist};
        $from = 0 unless defined $from;
        $to = $last_index unless (defined $to && $to <= $last_index);

        print "<table class=\"commit_search\">\n";
        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                my $commit = $co{'id'};

                # rows alternate between the "dark" and "light" CSS classes
                my $row_class = $dark_row ? "dark" : "light";
                print "<tr class=\"$row_class\">\n";
                $dark_row = !$dark_row;

                my $subject_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                 -class => "list subject"},
                                chop_and_escape_str($co{'title'}, 50) . "<br/>");
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $subject_link;

                my $comment = $co{'comment'};
                foreach my $line (@$comment) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        # shorten the match, then share what is left of an
                        # 80 character budget between both sides of the
                        # context, capped at 30 characters per side
                        $match = chop_str($match, 70, 5, 'center');
                        my $contextlen = int((80 - length($match))/2);
                        $contextlen = 30 if ($contextlen > 30);
                        $lead  = chop_str($lead,  $contextlen, 10, 'left');
                        $trail = chop_str($trail, $contextlen, 10, 'right');

                        $lead  = esc_html($lead);
                        $match = esc_html($match);
                        $trail = esc_html($trail);

                        print "$lead<span class=\"match\">$match</span>$trail<br />";
                }

                my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit");
                my $diff_link   = $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff");
                my $tree_link   = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", $commit_link, $diff_link, $tree_link);
                print "</td>\n" .
                      "</tr>\n";
        }
        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
6327
6328 ## ======================================================================
6329 ## ======================================================================
6330 ## actions
6331
# 'project_list' action: print the page listing the available projects,
# preceded by the optional $home_text include and the project search form.
#
# The 'order' input parameter, if given, must be exactly one of none,
# project, descr, owner or age; anything else is rejected with a 400 error.
# A 404 error is raised when no projects are found.
sub git_project_list {
        my $order = $input_params{'order'};
        # The pattern is anchored so that values which merely contain one of
        # the known keywords (e.g. "garbage-age") are rejected as well.
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project_filter, $strict_export);
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }

        git_project_search_form($searchtext, $search_use_regexp);
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6354
# 'forks' action: print the list of forks of the current project, i.e. the
# projects found by git_get_projects_list() for the project path with its
# ".git" suffix removed.
#
# The 'order' input parameter, if given, must be exactly one of none,
# project, descr, owner or age; anything else is rejected with a 400 error.
# A 404 error is raised when no forks are found.
sub git_forks {
        my $order = $input_params{'order'};
        # The pattern is anchored so that values which merely contain one of
        # the known keywords (e.g. "garbage-age") are rejected as well.
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my $filter = $project;
        $filter =~ s/\.git$//;
        my @list = git_get_projects_list($filter);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        git_print_header_div('summary', "$project forks");
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6374
# 'project_index' action: print a plain-text index of the projects, one
# "<path> <owner>" line per project, with both fields percent-encoded.
# A 404 error is raised when no projects are found.
sub git_project_index {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        foreach my $pr (@projects) {
                # look the owner up only if the project entry does not have one yet
                unless (exists $pr->{'owner'}) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}");
                }

                my ($path, $owner) = ($pr->{'path'}, $pr->{'owner'});
                # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
                foreach my $field ($path, $owner) {
                        $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                }
                foreach my $field ($path, $owner) {
                        $field =~ s/ /\+/g;
                }

                print "$path $owner\n";
        }
}
6401
# 'summary' action: print the project overview page -- a metadata table
# (description, owner, last change, URLs, optional content tags), the
# optional README.html, and shortened shortlog / tags / heads / remotes /
# forks sections, each followed by a "..." link when more entries exist.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";
        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata;
        %remotedata = git_get_remotes_list() if $remote_heads;
        my @forklist;
        my $check_forks = gitweb_check_feature('forks');

        if ($check_forks) {
                # find forks of a project
                my $filter = $project;
                $filter =~ s/\.git$//;
                @forklist = git_get_projects_list($filter);
                # filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        # Returns a "..." link to the given action when a list whose last
        # index is $last_index holds more than the 16 entries shown, and
        # undef otherwise.  The explicit undef keeps the argument position
        # filled when this is called inside an argument list.
        my $more_link = sub {
                my ($last_index, $action) = @_;
                return undef if $last_index <= 15;
                return $cgi->a({-href => href(action=>$action)}, "...");
        };

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        print "<table class=\"projects_list\">\n" .
              "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n" .
              "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my $url_tag = "URL";
        my @url_list = git_get_project_url_list($project);
        if (!@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        foreach my $git_url (@url_list) {
                next unless $git_url;
                print format_repo_url($url_tag, $git_url);
                # only the first URL row is labelled
                $url_tag = "";
        }

        # Tag cloud
        my $show_ctags = gitweb_check_feature('ctags');
        if ($show_ctags) {
                my $ctags = git_get_project_ctags($project);
                if (%$ctags) {
                        # without ability to add tags, don't show if there are none
                        my $cloud = git_populate_project_tagcloud($ctags);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme) {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file($readme);
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $more_link->($#commitlist, "shortlog"));
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $more_link->($#taglist, "tags"));
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $more_link->($#headlist, "heads"));
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $more_link->($#forklist, "forks"),
                                      'no_header');
        }

        git_footer_html();
}
6517
# Display one tag object: links to the object it tags, the authorship rows
# when parse_tag() supplied an 'author', and the tag message.
# The tag to show is taken from the global $hash.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both cells link to the tagged object; its type doubles as the action
        my $object_cell =
                $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                        $tag{'object'});
        my $type_cell =
                $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
                        $tag{'type'});

        print qq!<div class="title_text">\n! .
              qq!<table class="object_header">\n! .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $object_cell . "</td>\n" .
              qq!<td class="link">! . $type_cell . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n";

        # tag message, one escaped line per <br/>
        print qq!<div class="page_body">!;
        my $message = $tag{'comment'};
        for my $text (@$message) {
                chomp $text;
                print esc_html($text, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";

        git_footer_html();
}
6552
# Common implementation behind the blame views.
#
# The optional first argument selects the output format:
#   'porcelain'   (default) HTML page built from `git blame -p` output
#   'incremental' HTML page listing only the file contents, read from
#                 `git cat-file blob`; the commit column is emitted empty
#                 (presumably filled in by client-side JavaScript)
#   'data'        text/plain stream of `git blame --incremental` output,
#                 followed by an "END" line
# A 'porcelain' request becomes 'incremental' when the 'javascript' input
# parameter is set.
#
# Works on the globals $project, $hash, $hash_base and $file_name; may set
# $hash, $hash_base and $action.  Problems are reported through die_error().
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $input_params{'javascript'}) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # exact comparison (not a pattern match); also guards against
                # git_get_type() returning undef
                if (!defined $ftype || $ftype ne "blob") {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # end-of-data marker, optionally followed by timing info
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        # row classes alternate between consecutive groups of blamed lines
        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        # not a header line: skip it instead of using an
                        # undefined value as a key of %metainfo
                        next LINE unless defined $full_rev;
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        # read the commit information lines up to and
                        # including the tab-prefixed content line
                        my $data;
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        # output ended before the content line was seen
                        $data = '' unless defined $data;
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # only the first line of a group carries <lines in group>
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        if ($group_size) {
                                # one commit cell spans the whole group
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to blame of the parent commit
                        # when there is one, otherwise of this commit
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6784
# Blame view in git_blame_common()'s default format.
sub git_blame {
        return git_blame_common();
}
6788
# Blame view in git_blame_common()'s 'incremental' format.
sub git_blame_incremental {
        return git_blame_common('incremental');
}
6792
# Blame output in git_blame_common()'s 'data' format.
sub git_blame_data {
        return git_blame_common('data');
}
6796
# Page listing the tags returned by git_get_tags_list() for $project.
sub git_tags {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
        git_print_header_div('summary', $project);

        # the body is left out entirely when there are no tags
        my @tagslist = git_get_tags_list();
        git_tags_body(\@tagslist)
                if @tagslist;

        git_footer_html();
}
6809
# Page listing the heads returned by git_get_heads_list() for $project.
sub git_heads {
        my $head = git_get_head_hash($project);

        git_header_html();
        git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
        git_print_header_div('summary', $project);

        # the body is left out entirely when there are no heads
        my @headslist = git_get_heads_list();
        git_heads_body(\@headslist, $head)
                if @headslist;

        git_footer_html();
}
6822
# Serves two views: a single remote, when the 'hash' input parameter names
# one, and otherwise the list of all remotes of $project.
# Requires the 'remote_heads' feature.
sub git_remotes {
        unless (gitweb_check_feature('remote_heads')) {
                die_error(403, "Remote heads view is disabled");
        }

        my $head = git_get_head_hash($project);
        my $remote = $input_params{'hash'};

        my $remotedata = git_get_remotes_list($remote);
        if (!defined $remotedata) {
                die_error(500, "Unable to get remote information");
        }

        if (!%$remotedata) {
                my $reason = defined $remote
                        ? "Remote $remote not found"
                        : "No remotes found";
                die_error(404, $reason);
        }

        git_header_html(undef, undef, -action_extra => $remote);
        git_print_page_nav('', '',  $head, undef, $head,
                format_ref_views($remote ? '' : 'remotes'));

        fill_remote_heads($remotedata);
        if (!defined $remote) {
                # list of all the remotes
                git_print_header_div('summary', "$project remotes");
                git_remotes_body($remotedata, undef, $head);
        } else {
                # single remote
                git_print_header_div('remotes', "$remote remote for $project");
                git_remote_block($remote, $remotedata->{$remote}, undef, $head);
        }

        git_footer_html();
}
6855
# Send a blob verbatim ("raw" view) together with its HTTP headers.
#
# The optional argument is a content type; it is handed to
# blob_contenttype() along with the file handle and $file_name.
#
# The blob is taken from the global $hash or, when that is not defined,
# looked up from $file_name in $hash_base (falling back to the project
# head).  A request with neither is answered with a 400 error.
sub git_blob_plain {
        my $type = shift;
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Open git-cat-file blob '$hash' failed");

        # content-type (can include charset)
        $type = blob_contenttype($fd, $file_name, $type);

        # "save as" filename, even when no $file_name is given
        my $save_as = "$hash";
        if (defined $file_name) {
                $save_as = $file_name;
        } elsif ($type =~ m/^text\//) {
                $save_as .= '.txt';
        }
        # The name comes from the repository and ends up inside a quoted
        # string of an HTTP header: neutralize control characters (including
        # line breaks) and backslash-escape '"' and '\'.
        $save_as =~ s/[\x00-\x1f\x7f]/?/g;
        $save_as =~ s/(["\\])/\\$1/g;

        # With XSS prevention on, blobs of all types except a few known safe
        # ones are served with "Content-Disposition: attachment" to make sure
        # they don't run in our security domain.  For certain image types,
        # blob view writes an <img> tag referring to blob_plain view, and we
        # want to be sure not to break that by serving the image as an
        # attachment (though Firefox 3 doesn't seem to care).
        my $sandbox = $prevent_xss &&
                $type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

        # serve text/* as text/plain; the same goes for textual */*+xml
        # (the subtype before "+xml" may be longer than one letter)
        if ($prevent_xss &&
            ($type =~ m!^text/[a-z]+\b(.*)$! ||
             ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
                # keep whatever followed the media type, e.g. the charset
                my $rest = $1;
                $rest = defined $rest ? $rest : '';
                $type = "text/plain$rest";
        }

        print $cgi->header(
                -type => $type,
                -expires => $expires,
                -content_disposition =>
                        ($sandbox ? 'attachment' : 'inline')
                        . '; filename="' . $save_as . '"');
        # copy the blob unmodified: read it in one go, write it as raw bytes
        local $/ = undef;
        binmode STDOUT, ':raw';
        print <$fd>;
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
6917
# HTML view of a blob: images are embedded through an <img> tag pointing
# at the blob_plain view, text is listed line by line with line-number
# anchors (run through the highlighter when a syntax was guessed), and
# anything else that tests as binary is handed over to git_blob_plain().
#
# The blob is taken from the global $hash or, when that is not defined,
# looked up from $file_name in $hash_base (falling back to the project
# head).  A request with neither is answered with a 400 error.
sub git_blob {
        my $expires;

        if (!defined $hash) {
                if (defined $file_name) {
                        my $base = $hash_base || git_get_head_hash($project);
                        $hash = git_get_hash_by_path($base, $file_name, "blob")
                                or die_error(404, "Cannot find file");
                } else {
                        die_error(400, "No file name defined");
                }
        } elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                # blobs defined by non-textual hash id's can be cached
                $expires = "+1d";
        }

        my $have_blame = gitweb_check_feature('blame');
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or die_error(500, "Couldn't cat $file_name, $hash");
        my $mimetype = blob_mimetype($fd, $file_name);
        # use 'blob_plain' (aka 'raw') view for files that cannot be displayed
        if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
                close $fd;
                return git_blob_plain($mimetype);
        }
        # we can have blame only for text/* mimetype
        $have_blame &&= ($mimetype =~ m!^text/!);

        # when a syntax is recognized, read from the highlighter instead
        my $highlight = gitweb_check_feature('highlight');
        my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
        $fd = run_highlighter($fd, $highlight, $syntax)
                if $syntax;

        git_header_html(undef, $expires);
        my $formats_nav = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                if (defined $file_name) {
                        if ($have_blame) {
                                $formats_nav .=
                                        $cgi->a({-href => href(action=>"blame", -replay=>1)},
                                                "blame") .
                                        " | ";
                        }
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw") .
                                " | " .
                                $cgi->a({-href => href(action=>"blob",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD");
                } else {
                        $formats_nav .=
                                $cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
                                        "raw");
                }
                git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        } else {
                # no usable base commit: empty navigation, hash as the title
                print "<div class=\"page_nav\">\n" .
                      "<br/><br/></div>\n" .
                      "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        git_print_page_path($file_name, "blob", $hash_base);
        print "<div class=\"page_body\">\n";
        if ($mimetype =~ m!^image/!) {
                print qq!<img type="!.esc_attr($mimetype).qq!"!;
                if ($file_name) {
                        print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
                }
                # the URL is escaped like every other attribute value here
                print qq! src="! .
                      esc_attr(href(action=>"blob_plain", hash=>$hash,
                                    hash_base=>$hash_base, file_name=>$file_name)) .
                      qq!" />\n!;
        } else {
                # every line links to its own anchor on this same page; the
                # page URL is the same for all lines, so build it only once
                my $page_url = esc_attr(href(-replay => 1));
                my $nr;
                while (my $line = <$fd>) {
                        chomp $line;
                        $nr++;
                        $line = untabify($line);
                        printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
                               $nr, $page_url, $nr, $nr,
                               $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
                }
        }
        close $fd
                or print "Reading blob failed.\n";
        print "</div>";
        git_footer_html();
}
7010
# HTML view of a tree (directory listing), one table row per entry of
# `git ls-tree -z`, preceded by a '..' row when a parent directory can be
# linked to.
#
# Works on the globals $hash, $hash_base and $file_name: $hash_base
# defaults to "HEAD"; when $hash is not defined it is looked up from
# $file_name in $hash_base, or is $hash_base itself when there is no
# $file_name.  $hash_base is undefined again when it does not parse as a
# commit.
sub git_tree {
        if (!defined $hash_base) {
                $hash_base = "HEAD";
        }
        if (!defined $hash) {
                if (defined $file_name) {
                        $hash = git_get_hash_by_path($hash_base, $file_name, "tree");
                } else {
                        $hash = $hash_base;
                }
        }
        die_error(404, "No such tree") unless defined($hash);

        my $show_sizes = gitweb_check_feature('show-sizes');
        my $have_blame = gitweb_check_feature('blame');

        my @entries = ();
        {
                # entries are NUL-terminated because of the -z option
                local $/ = "\0";
                open my $fd, "-|", git_cmd(), "ls-tree", '-z',
                        ($show_sizes ? '-l' : ()), @extra_options, $hash
                        or die_error(500, "Open git-ls-tree failed");
                @entries = map { chomp; $_ } <$fd>;
                close $fd
                        or die_error(404, "Reading tree failed");
        }

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $hash_base);
        git_header_html();
        my $basedir = '';
        if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                my @views_nav = ();
                if (defined $file_name) {
                        push @views_nav,
                                $cgi->a({-href => href(action=>"history", -replay=>1)},
                                        "history"),
                                $cgi->a({-href => href(action=>"tree",
                                                       hash_base=>"HEAD", file_name=>$file_name)},
                                        "HEAD"),
                }
                my $snapshot_links = format_snapshot_links($hash);
                if (defined $snapshot_links) {
                        # FIXME: Should be available when we have no hash base as well.
                        push @views_nav, $snapshot_links;
                }
                git_print_page_nav('tree','', $hash_base, undef, undef,
                                   join(' | ', @views_nav));
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
        } else {
                # no usable base commit: empty navigation, hash as the title
                undef $hash_base;
                print "<div class=\"page_nav\">\n";
                print "<br/><br/></div>\n";
                print "<div class=\"title\">".esc_html($hash)."</div>\n";
        }
        if (defined $file_name) {
                # directory prefix for the entries, with a trailing slash
                $basedir = $file_name;
                if ($basedir ne '' && substr($basedir, -1) ne '/') {
                        $basedir .= '/';
                }
                git_print_page_path($file_name, 'tree', $hash_base);
        }
        print "<div class=\"page_body\">\n";
        print "<table class=\"tree\">\n";
        # rows alternate between the "dark" and "light" classes, dark first
        my $alternate = 1;
        # '..' (top directory) link if possible
        if (defined $hash_base &&
            defined $file_name && $file_name =~ m![^/]+$!) {
                print "<tr class=\"" . ($alternate ? 'dark' : 'light') . "\">\n";
                $alternate ^= 1;

                # strip the last path component; nothing left means that the
                # parent is the top tree, which is linked without file name.
                # Compare against '' explicitly: a parent directory named "0"
                # is a valid name even though it is false as a boolean.
                my $up = $file_name;
                $up =~ s!/?[^/]+$!!;
                undef $up if $up eq '';
                # based on git_print_tree_entry
                print '<td class="mode">' . mode_str('040000') . "</td>\n";
                print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
                print '<td class="list">';
                print $cgi->a({-href => href(action=>"tree",
                                             hash_base=>$hash_base,
                                             file_name=>$up)},
                              "..");
                print "</td>\n";
                print "<td class=\"link\"></td>\n";

                print "</tr>\n";
        }
        foreach my $line (@entries) {
                my %t = parse_ls_tree_line($line, -z => 1, -l => $show_sizes);

                print "<tr class=\"" . ($alternate ? 'dark' : 'light') . "\">\n";
                $alternate ^= 1;

                git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

                print "</tr>\n";
        }
        print "</table>\n" .
              "</div>";
        git_footer_html();
}
7120
# Build the "<project>-<version>" name used for a snapshot of $hash in
# $project.
#
# The project part is the last path component of the project with a
# trailing ".git" removed; the version part is derived from $hash (see
# the comments below).  In list context the name is returned twice, in
# scalar context once.
sub snapshot_name {
        my ($project, $hash) = @_;

        # path/to/project.git  -> project
        # path/to/project/.git -> project
        my $base = to_utf8($project);
        $base =~ s,([^/])/*\.git$,$1,;
        $base = basename($base);
        # sanitize name
        $base =~ s/[[:cntrl:]]/?/g;

        my $version = $hash;
        if ($hash =~ /^[0-9a-fA-F]+$/) {
                # shorten SHA-1 hash
                my $full_hash = git_get_full_hash($project, $hash);
                $version = git_get_short_hash($project, $hash)
                        if ($full_hash =~ /^$hash/ && length($hash) > 7);
        } elsif ($hash =~ m!^refs/tags/(.*)$!) {
                # tags don't need shortened SHA-1 hash
                $version = $1;
        } else {
                # branches and other need shortened SHA-1 hash
                $version = $1
                        if ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!);
                $version .= '-' . git_get_short_hash($project, $hash);
        }
        # in case of hierarchical branch names
        $version =~ s!/!.!g;

        # name = project-version_string
        my $snapshot = "$base-$version";

        return $snapshot unless wantarray;
        return ($snapshot, $snapshot);
}
7157
# Answer a conditional request: when the If-Modified-Since request header
# can be parsed and $latest_epoch is not later than it, print a
# "304 Not Modified" header and jump to DONE_GITWEB.  In every other case
# nothing is printed.
#
# The header is parsed with HTTP::Date when that module can be loaded,
# else with Time::ParseDate; with neither available it is ignored.
sub exit_if_unmodified_since {
        my ($latest_epoch) = @_;
        our $cgi;

        my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
        return unless defined $if_modified;

        my $since;
        if (eval { require HTTP::Date; 1; }) {
                $since = HTTP::Date::str2time($if_modified);
        } elsif (eval { require Time::ParseDate; 1; }) {
                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
        }
        return unless (defined $since && $latest_epoch <= $since);

        my %latest_date = parse_date($latest_epoch);
        print $cgi->header(
                -last_modified => $latest_date{'rfc2822'},
                -status => '304 Not Modified');
        goto DONE_GITWEB;
}
7179
# Action handler: send a "git archive" snapshot of $hash to the client.
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  The request is rejected
# with die_error() when snapshots are switched off, when the format is
# malformed, unknown, disabled or not offered, or when $hash does not
# resolve to a tree-ish object.  When $hash parses as a commit its committer
# date is used for If-Modified-Since handling and the Last-Modified header.
sub git_snapshot {
        my $format = $input_params{'snapshot_format'};
        if (!@snapshot_fmts) {
                die_error(403, "Snapshots not allowed");
        }
        # default to first supported snapshot format
        $format ||= $snapshot_fmts[0];
        if ($format !~ m/^[a-z0-9]+$/) {
                die_error(400, "Invalid snapshot format parameter");
        } elsif (!exists($known_snapshot_formats{$format})) {
                die_error(400, "Unknown snapshot format");
        } elsif ($known_snapshot_formats{$format}{'disabled'}) {
                die_error(403, "Snapshot format not allowed");
        } elsif (!grep($_ eq $format, @snapshot_fmts)) {
                die_error(403, "Unsupported snapshot format");
        }

        # peel tags ("^{}") so that a tag pointing at a commit is accepted
        my $type = git_get_type("$hash^{}");
        if (!$type) {
                die_error(404, 'Object does not exist');
        }  elsif ($type eq 'blob') {
                die_error(400, 'Object is not a tree-ish');
        }

        my ($name, $prefix) = snapshot_name($project, $hash);
        my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";

        # %co stays empty when $hash is not a commit (e.g. a bare tree)
        my %co = parse_commit($hash);
        exit_if_unmodified_since($co{'committer_epoch'}) if %co;

        my $cmd = quote_command(
                git_cmd(), 'archive',
                "--format=$known_snapshot_formats{$format}{'format'}",
                "--prefix=$prefix/", $hash);
        if (exists $known_snapshot_formats{$format}{'compressor'}) {
                $cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
        }

        # backslash-escape characters that would end the quoted filename
        $filename =~ s/(["\\])/\\$1/g;
        my %latest_date;
        if (%co) {
                %latest_date = parse_date($co{'committer_epoch'}, $co{'committer_tz'});
        }

        # start the archiver before any header is sent, so that a failure
        # to launch it is still reported as a clean error response
        open my $fd, "-|", $cmd
                or die_error(500, "Execute git-archive failed");

        print $cgi->header(
                -type => $known_snapshot_formats{$format}{'type'},
                -content_disposition => 'inline; filename="' . $filename . '"',
                %co ? (-last_modified => $latest_date{'rfc2822'}) : (),
                -status => '200 OK');

        binmode STDOUT, ':raw';
        # copy the archive in fixed-size chunks instead of loading all of
        # it into memory at once
        my $chunk;
        while (read($fd, $chunk, 65536)) {
                print $chunk;
        }
        binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
        close $fd;
}
7237
# Shared implementation of the paginated commit-list views.
#
#   $fmt_name   - view name, passed to the paging and page navigation helpers
#   $body_subr  - code reference that renders the list of commits
#   $base       - revision to start from; defaults to the project's HEAD
#   $parent     - optional lower bound, turning the range into "$parent..$base"
#   $file_name  - optional path limiting the log to one file or directory
#   $file_hash  - optional object id of that path; looked up when missing
#
# Up to 101 commits are requested per page; the 101st only signals that a
# following page exists.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        $base = $head unless defined $base;
        $page = 0 unless defined $page;
        my $refs = git_get_references();

        my $revision_range = defined $parent ? "$parent..$base" : $base;
        my @path_limit = defined $file_name ? ($file_name, "--full-history") : ();
        my @commitlist =
                parse_commits($revision_range, 101, (100 * $page), @path_limit);

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                foreach my $commit (@commitlist) {
                        $file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        $ftype = git_get_type($file_hash) if defined $file_hash;
        die_error(500, "Unknown type of object")
                if defined $file_name && !defined $ftype;

        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }

        # a 101st entry means there is at least one more page
        my $has_next_page = $#commitlist >= 100;
        my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
        my $next_link = '';
        if ($has_next_page) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        # offer the "patches" link only for whole-project logs that fit
        # within the configured patch limit (negative limit = unlimited)
        my $patch_max = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name
            && ($patch_max < 0 || @commitlist <= $patch_max)) {
                $paging_nav .= " &sdot; " .
                        $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                "patches");
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
                git_print_page_path($file_name, $ftype, $hash_base);
        } else {
                git_print_header_div('summary', $project);
        }

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
7311
# Action handler for the "log" view: commit log of $hash, optionally
# limited from below by $hash_parent, rendered by git_log_body.
sub git_log {
        return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
7316
# Action handler for the "commit" view: prints the commit header table
# (authorship, commit id, tree and parent links), the commit message and the
# list of files changed by the commit.
#
# $hash defaults to $hash_base and then to "HEAD".  Dies with a 404 page when
# the commit cannot be parsed or when reading git-diff-tree output fails.
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $parent  = $co{'parent'};
        my $parents = $co{'parents'}; # listref

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                my $parent_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$parent)},
                                esc_html(substr($parent, 0, 7)));
                $formats_nav = '(parent: ' . $parent_link . ')';
        } else {
                # merge commit
                my @parent_links = map {
                        $cgi->a({-href => href(action=>"commit", hash=>$_)},
                                esc_html(substr($_, 0, 7)));
                } @$parents;
                $formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # a parentless commit is compared against the empty tree
        $parent = "--root" unless defined $parent;

        # raw list of changed files; merges use the combined ("-c") format
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                (@$parents <= 1 ? $parent : '-c'),
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires;
        $expires = "+1d" if $hash =~ m/^[0-9a-fA-F]{40}$/;

        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title = esc_html($co{'title'}) . $ref;
        if (defined $co{'parent'}) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        # header table: authorship, commit id, tree, parents
        print "<div class=\"title_text\">\n<table class=\"object_header\">\n";
        git_print_authorship_rows(\%co);
        print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

        my $tree_url = href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
        print '<tr><td>tree</td><td class="sha1">' .
              $cgi->a({-href => $tree_url, class => "list"}, $co{'tree'}) .
              '</td><td class="link">' .
              $cgi->a({-href => $tree_url}, "tree");
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links if defined $snapshot_links;
        print "</td></tr>\n";

        foreach my $par (@$parents) {
                my $commit_url = href(action=>"commit", hash=>$par);
                my $diff_url =
                        href(action=>"commitdiff", hash=>$hash, hash_parent=>$par);
                print '<tr><td>parent</td><td class="sha1">' .
                      $cgi->a({-href => $commit_url, class => "list"}, $par) .
                      '</td><td class="link">' .
                      $cgi->a({-href => $commit_url}, "commit") .
                      " | " .
                      $cgi->a({-href => $diff_url}, "diff") .
                      "</td></tr>\n";
        }
        print "</table></div>\n";

        # commit message
        print "<div class=\"page_body\">\n";
        git_print_log($co{'comment'});
        print "</div>\n";

        # files touched by the commit
        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
7430
# Action handler for the "object" view: work out the type of the requested
# object and redirect (302) to the view named after that type.
#
# The object is identified either by $hash / $hash_base alone, or by
# $hash_base together with $file_name.  Dies with a 404 page when the object
# or path does not exist and with a 400 page when neither form is given.
sub git_object {
        # object is defined by:
        # - hash or hash_base alone
        # - hash_base and file_name
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the object does not exist; skip chomp so
                # no "uninitialized" warning is raised before close() reports it
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                # drop trailing slashes from the path
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7477
# Action handler for the "blobdiff" views: show the difference between two
# versions of a single file.
#
#   $format (first argument) - 'html' (default) or 'plain'
#
# The blob pair is located through $hash_base / $hash_parent_base plus either
# $file_name or the blob id in $hash.  Requests lacking those parameters are
# rejected; legacy-style URIs that named only blob ids are no longer handled.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                # ($hash comes from the request, so it is quoted
                                # to be matched literally)
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # status is given as a bare number, like every other
                # die_error() call in this function
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                # backslash-escape characters that would end the quoted
                # filename, the same way git_snapshot does
                (my $patch_name = "$file_name") =~ s/(["\\])/\\$1/g;
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $patch_name . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # rewrite blob ids to file names in the patch header lines;
                # the header ends with the "+++" line
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through untouched
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7612
# Action handler for "blobdiff_plain": git_blobdiff in its 'plain' format.
sub git_blobdiff_plain {
        return git_blobdiff('plain');
}
7616
# Build the navigation fragment for switching between diff styles.
#
# The fragment is meant to be appended to navigation that already exists,
# so every entry is prefixed with " | " ("| foo | bar", not "foo | bar").
# The style named by $diff_style (default 'inline') is shown as plain text,
# every other style as a link.  Returns "" when $is_combined is true.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;
        $diff_style ||= 'inline';

        return "" if ($is_combined);

        # display order and link text of the available styles
        my @style_order = ('inline', 'sidebyside');
        my %label_for = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my $nav = '';
        foreach my $style (@style_order) {
                my $entry;
                if ($style eq $diff_style) {
                        $entry = $label_for{$style};
                } else {
                        $entry = $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                         $label_for{$style});
                }
                $nav .= " | " . $entry;
        }
        return $nav;
}
7637
# Action handler for the "commitdiff" family of views.
#
# Named parameters:
#   -format  - 'html' (default), 'plain' (diff-tree patch preceded by a few
#              mail-like header lines) or 'patch' (git-format-patch output)
#   -single  - with the 'patch' format and no usable $hash_parent, limit the
#              output to one patch
#
# $hash defaults to $hash_base and then to "HEAD"; $hash_parent optionally
# names the commit to diff against.  For merges without an explicit
# $hash_parent the compact combined format ('--cc') is selected.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of them
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();

                # '-c' and '--cc' are diff-tree merge modes, not revisions, so
                # they must never become the base of a "<base>..<tip>" range
                my $range_base = $hash_parent;
                if (defined $range_base &&
                    ($range_base eq '-c' || $range_base eq '--cc')) {
                        undef $range_base;
                }

                if ($range_base) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$range_base..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                # the title is already in the header; print the log only
                # when the message has more than one line
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # NOTE(review): $refs is not used below -- confirm whether this
                # call is still needed
                my $refs = git_get_references("tags");
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # diff against all parents unless one commit was named explicitly
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # headers are already sent, so a failure can only be reported
                # as a trailing line of text
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7865
# Action handler: delegate to git_commitdiff(), asking for the 'plain'
# output format.
sub git_commitdiff_plain {
	return git_commitdiff('-format', 'plain');
}
7869
7870 # format-patch-style patches
# Action handler: delegate to git_commitdiff() with the 'patch' format and
# the -single flag set.
sub git_patch {
	my %commitdiff_opts = (
		-format => 'patch',
		-single => 1,
	);
	return git_commitdiff(%commitdiff_opts);
}
7874
# Action handler: delegate to git_commitdiff() with the 'patch' format
# (no -single flag, unlike git_patch).
sub git_patches {
	return git_commitdiff('-format', 'patch');
}
7878
# Action handler for 'history': run the generic log view with
# git_history_body as the body renderer, passing along the request
# globals $hash_base, $hash_parent_base, $file_name and $hash.
sub git_history {
	my @history_args = ($hash_base, $hash_parent_base, $file_name, $hash);

	return git_log_generic('history', \&git_history_body, @history_args);
}
7884
# Action handler for 'search': validate the request, then hand over to the
# routine that implements the requested search type.
#
# Works on the request globals: $searchtype (falls back to 'commit'),
# $searchtext (required), $hash (falls back to the project's head hash),
# $page (falls back to 0) and $project.
#
# Reports 403 when a required feature is disabled, 400 when the search text
# is missing or the search type is unknown, and 404 when parse_commit()
# yields nothing for $hash.
sub git_search {
	$searchtype ||= 'commit';

	# the search feature as a whole has to be enabled
	unless (gitweb_check_feature('search')) {
		die_error(403, "Search is disabled");
	}

	# Search types guarded by a feature of the same name:
	#  - pickaxe may take all resources of your box and run for several
	#    minutes with every query - so decide by yourself how public you
	#    make this feature
	#  - grep search might be potentially CPU-intensive, too
	my %disabled_message = (
		'pickaxe' => "Pickaxe search is disabled",
		'grep'    => "Grep search is disabled",
	);
	if (exists $disabled_message{$searchtype}) {
		unless (gitweb_check_feature($searchtype)) {
			die_error(403, $disabled_message{$searchtype});
		}
	}

	die_error(400, "Text field is empty")
		unless defined $searchtext;

	$hash = git_get_head_hash($project)
		unless defined $hash;

	my %co = parse_commit($hash);
	die_error(404, "Unknown commit object")
		unless %co;

	$page = 0
		unless defined $page;

	# search type => routine doing the actual search
	my %search_sub = (
		'commit'    => \&git_search_message,
		'author'    => \&git_search_message,
		'committer' => \&git_search_message,
		'pickaxe'   => \&git_search_changes,
		'grep'      => \&git_search_files,
	);
	if (my $search = $search_sub{$searchtype}) {
		$search->(%co);
	} else {
		die_error(400, "Unknown search type");
	}
}
7929
# Print the search help page: page header and navigation, a definition
# list describing each search type, then the page footer.  The 'grep' and
# 'pickaxe' entries are printed only when the feature of the same name is
# enabled.
sub git_search_help {
	git_header_html();
	git_print_page_nav('', '', $hash, $hash, $hash);

	# general explanation, plus the always-available 'commit' search
	print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

	if (gitweb_check_feature('grep')) {
		print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
	}

	print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

	if (gitweb_check_feature('pickaxe')) {
		print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
	}

	print "</dl>\n";
	git_footer_html();
}
7973
# Action handler for 'shortlog': run the generic log view with
# git_shortlog_body as the body renderer, passing along the request
# globals $hash and $hash_parent.
sub git_shortlog {
	my @shortlog_args = ($hash, $hash_parent);

	return git_log_generic('shortlog', \&git_shortlog_body, @shortlog_args);
}
7978
7979 ## ......................................................................
7980 ## feeds (RSS, Atom; OPML)
7981
# Print a web feed (RSS 2.0 or Atom) for the current project.
#
# Parameters:
#   $format - 'rss' or 'atom' (defaults to 'atom'); any other value is
#             answered with a 400 error.
#
# Works on the request globals $project, $action, $hash and $file_name:
# commits are read starting from $hash (or 'HEAD'), limited to $file_name
# when it is defined.  For HEAD requests only the HTTP header is sent.
#
# Each feed entry carries the commit message and a list of the files the
# commit touched, with links to the blobdiff, (if the 'blame' feature is
# enabled) blame, and history views.
sub git_feed {
	my $format = shift || 'atom';
	my $have_blame = gitweb_check_feature('blame');

	# Atom: http://www.atomenabled.org/developers/syndication/
	# RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
	if ($format ne 'rss' && $format ne 'atom') {
		die_error(400, "Unknown web feed format");
	}

	# log/feed of current (HEAD) branch, log of given branch, history of file/directory
	my $head = $hash || 'HEAD';
	my @commitlist = parse_commits($head, 150, 0, $file_name);

	my %latest_commit;
	my %latest_date;
	my $content_type = "application/$format+xml";
	if (defined $cgi->http('HTTP_ACCEPT') &&
		 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
		# browser (feed reader) prefers text/xml
		$content_type = 'text/xml';
	}
	if (defined($commitlist[0])) {
		%latest_commit = %{$commitlist[0]};
		my $latest_epoch = $latest_commit{'committer_epoch'};
		# NOTE(review): presumably answers conditional requests and does
		# not return when the client copy is current - confirm in
		# exit_if_unmodified_since()
		exit_if_unmodified_since($latest_epoch);
		# the key is 'committer_tz', matching 'committer_epoch' above (it
		# used to be misspelled 'comitter_tz', which never exists in the
		# commit hash and so always passed undef as the timezone)
		%latest_date = parse_date($latest_epoch, $latest_commit{'committer_tz'});
	}
	print $cgi->header(
		-type => $content_type,
		-charset => 'utf-8',
		%latest_date ? (-last_modified => $latest_date{'rfc2822'}) : (),
		-status => '200 OK');

	# Optimization: skip generating the body if client asks only
	# for Last-Modified date.
	return if ($cgi->request_method() eq 'HEAD');

	# header variables
	my $title = "$site_name - $project/$action";
	my $feed_type = 'log';
	if (defined $hash) {
		$title .= " - '$hash'";
		$feed_type = 'branch log';
		if (defined $file_name) {
			$title .= " :: $file_name";
			$feed_type = 'history';
		}
	} elsif (defined $file_name) {
		$title .= " - $file_name";
		$feed_type = 'history';
	}
	$title .= " $feed_type";
	# the title is assembled from the site name and request parameters and
	# is printed as XML element content below, so it has to be escaped
	# just like the description and the owner
	$title = esc_html($title);
	my $descr = git_get_project_description($project);
	if (defined $descr) {
		$descr = esc_html($descr);
	} else {
		$descr = "$project " .
		         ($format eq 'rss' ? 'RSS' : 'Atom') .
		         " feed";
	}
	my $owner = git_get_project_owner($project);
	$owner = esc_html($owner);

	#header
	# HTML page this feed is an alternate representation of
	my $alt_url;
	if (defined $file_name) {
		$alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
	} elsif (defined $hash) {
		$alt_url = href(-full=>1, action=>"log", hash=>$hash);
	} else {
		$alt_url = href(-full=>1, action=>"summary");
	}
	print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
	if ($format eq 'rss') {
		print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
		print "<title>$title</title>\n" .
		      "<link>$alt_url</link>\n" .
		      "<description>$descr</description>\n" .
		      "<language>en</language>\n" .
		      # project owner is responsible for 'editorial' content
		      "<managingEditor>$owner</managingEditor>\n";
		if (defined $logo || defined $favicon) {
			# prefer the logo to the favicon, since RSS
			# doesn't allow both
			my $img = esc_url($logo || $favicon);
			print "<image>\n" .
			      "<url>$img</url>\n" .
			      "<title>$title</title>\n" .
			      "<link>$alt_url</link>\n" .
			      "</image>\n";
		}
		if (%latest_date) {
			print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
			print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
		}
		print "<generator>gitweb v.$version/$git_version</generator>\n";
	} elsif ($format eq 'atom') {
		print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
		print "<title>$title</title>\n" .
		      "<subtitle>$descr</subtitle>\n" .
		      '<link rel="alternate" type="text/html" href="' .
		      $alt_url . '" />' . "\n" .
		      '<link rel="self" type="' . $content_type . '" href="' .
		      $cgi->self_url() . '" />' . "\n" .
		      "<id>" . href(-full=>1) . "</id>\n" .
		      # use project owner for feed author
		      "<author><name>$owner</name></author>\n";
		if (defined $favicon) {
			print "<icon>" . esc_url($favicon) . "</icon>\n";
		}
		if (defined $logo) {
			# not twice as wide as tall: 72 x 27 pixels
			print "<logo>" . esc_url($logo) . "</logo>\n";
		}
		if (! %latest_date) {
			# dummy date to keep the feed valid until commits trickle in:
			print "<updated>1970-01-01T00:00:00Z</updated>\n";
		} else {
			print "<updated>$latest_date{'iso-8601'}</updated>\n";
		}
		print "<generator version='$version/$git_version'>gitweb</generator>\n";
	}

	# contents
	for (my $i = 0; $i <= $#commitlist; $i++) {
		my %co = %{$commitlist[$i]};
		my $commit = $co{'id'};
		# we read 150, we always show 20 and the ones more recent than 48 hours
		if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
			last;
		}
		my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

		# get list of changed files
		# (a commit whose diff-tree cannot be started or fails is left
		# out of the feed)
		open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			$co{'parent'} || "--root",
			$co{'id'}, "--", (defined $file_name ? $file_name : ())
			or next;
		my @difftree = map { chomp; $_ } <$fd>;
		close $fd
			or next;

		# print element (entry, item)
		my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
		if ($format eq 'rss') {
			print "<item>\n" .
			      "<title>" . esc_html($co{'title'}) . "</title>\n" .
			      "<author>" . esc_html($co{'author'}) . "</author>\n" .
			      "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
			      "<guid isPermaLink=\"true\">$co_url</guid>\n" .
			      "<link>$co_url</link>\n" .
			      "<description>" . esc_html($co{'title'}) . "</description>\n" .
			      "<content:encoded>" .
			      "<![CDATA[\n";
		} elsif ($format eq 'atom') {
			print "<entry>\n" .
			      "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
			      "<updated>$cd{'iso-8601'}</updated>\n" .
			      "<author>\n" .
			      "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
			if ($co{'author_email'}) {
				print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
			}
			print "</author>\n" .
			      # use committer for contributor
			      "<contributor>\n" .
			      "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
			if ($co{'committer_email'}) {
				print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
			}
			print "</contributor>\n" .
			      "<published>$cd{'iso-8601'}</published>\n" .
			      "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
			      "<id>$co_url</id>\n" .
			      "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
			      "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
		}
		# body of the entry: commit message, then the changed files
		my $comment = $co{'comment'};
		print "<pre>\n";
		foreach my $line (@$comment) {
			$line = esc_html($line);
			print "$line\n";
		}
		print "</pre><ul>\n";
		foreach my $difftree_line (@difftree) {
			my %difftree = parse_difftree_raw_line($difftree_line);
			next if !$difftree{'from_id'};

			my $file = $difftree{'file'} || $difftree{'to_file'};

			print "<li>" .
			      "[" .
			      $cgi->a({-href => href(-full=>1, action=>"blobdiff",
			                             hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
			                             hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
			                             file_name=>$file, file_parent=>$difftree{'from_file'}),
			              -title => "diff"}, 'D');
			if ($have_blame) {
				print $cgi->a({-href => href(-full=>1, action=>"blame",
				                             file_name=>$file, hash_base=>$commit),
				              -title => "blame"}, 'B');
			}
			# if this is not a feed of a file history
			if (!defined $file_name || $file_name ne $file) {
				print $cgi->a({-href => href(-full=>1, action=>"history",
				                             file_name=>$file, hash=>$commit),
				              -title => "history"}, 'H');
			}
			$file = esc_path($file);
			print "] ".
			      "$file</li>\n";
		}
		if ($format eq 'rss') {
			print "</ul>]]>\n" .
			      "</content:encoded>\n" .
			      "</item>\n";
		} elsif ($format eq 'atom') {
			print "</ul>\n</div>\n" .
			      "</content>\n" .
			      "</entry>\n";
		}
	}

	# end of feed
	if ($format eq 'rss') {
		print "</channel>\n</rss>\n";
	} elsif ($format eq 'atom') {
		print "</feed>\n";
	}
}
8218
# Action handler: print the feed in RSS format (see git_feed).
sub git_rss {
	my $feed_format = 'rss';
	return git_feed($feed_format);
}
8222
# Action handler: print the feed in Atom format (see git_feed).
sub git_atom {
	my $feed_format = 'atom';
	return git_feed($feed_format);
}
8226
# Print an OPML document with one <outline> per project, each pointing at
# the project's RSS feed and summary page.
#
# The projects come from git_get_projects_list($project_filter,
# $strict_export); an empty list is answered with a 404 error.  Projects
# without a head hash, or whose head commit parse_commit() yields nothing
# for, are left out.
#
# Note: assigns the global $git_dir for every project it inspects.
sub git_opml {
	my @projects = git_get_projects_list($project_filter, $strict_export);
	die_error(404, "No projects found")
		unless @projects;

	print $cgi->header(
		-type => 'text/xml',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="opml.xml"');

	my $title = esc_html($site_name);
	# mention the subdirectory only when the listing was filtered by one
	my $filter = defined $project_filter
		? " within subdirectory " . esc_html($project_filter)
		: "";
	print <<OPML_HEAD;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export$filter</title>
</head>
<body>
<outline text="git RSS feeds">
OPML_HEAD

	foreach my $pr (@projects) {
		my $project_path = $pr->{'path'};

		my $head = git_get_head_hash($project_path);
		next unless defined $head;

		# set before parse_commit() is called for this project
		$git_dir = "$projectroot/$project_path";
		my %co = parse_commit($head);
		next unless %co;

		my $path = esc_html(chop_str($project_path, 25, 5));
		my $rss  = href('project' => $project_path, 'action' => 'rss', -full => 1);
		my $html = href('project' => $project_path, 'action' => 'summary', -full => 1);
		print qq{<outline type="rss" text="$path" title="$path" xmlUrl="$rss" htmlUrl="$html"/>\n};
	}

	print <<OPML_TAIL;
</outline>
</body>
</opml>
OPML_TAIL
}