Merge branch 'pj/completion-remote-set-url-branches'
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8';
22
23 our $t0 = [ gettimeofday() ];
24 our $number_of_git_cmds = 0;
25
26 BEGIN {
27         CGI->compile() if $ENV{'MOD_PERL'};
28 }
29
30 our $version = "++GIT_VERSION++";
31
our ($my_url, $my_uri, $base_url, $path_info, $home_link);

# Compute the URLs gitweb uses to refer to itself and store them in the
# package globals $my_url, $my_uri, $base_url, $path_info and $home_link.
# Reads the request from the global $cgi object and from %ENV.
sub evaluate_uri {
        our $cgi;

        our $my_url = $cgi->url();
        our $my_uri = $cgi->url(-absolute => 1);

        # Base URL for relative URLs in gitweb ($logo, $favicon, ...);
        # it is needed and used only for URLs with nonempty PATH_INFO.
        our $base_url = $my_url;

        # When the script serves as DirectoryIndex, the URL does not name the
        # script file and $cgi->url() fails to strip PATH_INFO, so it is
        # stripped here.  $path_info is global because it is used later on.
        #
        # In that setup $my_url is not the full script URL.  That is what we
        # want for generated links (they keep implying the script name when
        # the handled URL did not spell it out), but it makes $my_url unusable
        # as base URL.  Hence, whenever PATH_INFO had to be stripped from both
        # URLs, the base URL is built from the server base and SCRIPT_NAME.
        our $path_info = decode_utf8($ENV{"PATH_INFO"});
        if ($path_info) {
                my $trailing_path_info = qr/\Q$path_info\E$/;
                # short-circuit: $my_uri is only touched if $my_url matched
                my $stripped_both =
                        $my_url =~ s/$trailing_path_info// &&
                        $my_uri =~ s/$trailing_path_info//;
                if ($stripped_both && defined $ENV{'SCRIPT_NAME'}) {
                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                }
        }

        # target of the home link on top of all pages
        our $home_link = $my_uri || "/";
}
67
68 # core git executable to use
69 # this can just be "git" if your webserver has a sensible PATH
70 our $GIT = "++GIT_BINDIR++/git";
71
72 # absolute fs-path which will be prepended to the project path
73 #our $projectroot = "/pub/scm";
74 our $projectroot = "++GITWEB_PROJECTROOT++";
75
76 # fs traversing limit for getting project list
77 # the number is relative to the projectroot
78 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
79
80 # string of the home link on top of all pages
81 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
82
83 # name of your site or organization to appear in page titles
84 # replace this with something more descriptive for clearer bookmarks
85 our $site_name = "++GITWEB_SITENAME++"
86                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
87
88 # html snippet to include in the <head> section of each page
89 our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
90 # filename of html text to include at top of each page
91 our $site_header = "++GITWEB_SITE_HEADER++";
92 # html text to include at home page
93 our $home_text = "++GITWEB_HOMETEXT++";
94 # filename of html text to include at bottom of each page
95 our $site_footer = "++GITWEB_SITE_FOOTER++";
96
97 # URI of stylesheets
98 our @stylesheets = ("++GITWEB_CSS++");
99 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
100 our $stylesheet = undef;
101 # URI of GIT logo (72x27 size)
102 our $logo = "++GITWEB_LOGO++";
103 # URI of GIT favicon, assumed to be image/png type
104 our $favicon = "++GITWEB_FAVICON++";
105 # URI of gitweb.js (JavaScript code for gitweb)
106 our $javascript = "++GITWEB_JS++";
107
108 # URI and label (title) of GIT logo link
109 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
110 #our $logo_label = "git documentation";
111 our $logo_url = "http://git-scm.com/";
112 our $logo_label = "git homepage";
113
114 # source of projects list
115 our $projects_list = "++GITWEB_LIST++";
116
117 # the width (in characters) of the projects list "Description" column
118 our $projects_list_description_width = 25;
119
120 # group projects by category on the projects list
121 # (enabled if this variable evaluates to true)
122 our $projects_list_group_categories = 0;
123
124 # default category if none specified
125 # (leave the empty string for no category)
126 our $project_list_default_category = "";
127
128 # default order of projects list
129 # valid values are none, project, descr, owner, and age
130 our $default_projects_order = "project";
131
132 # show repository only if this file exists
133 # (only effective if this variable evaluates to true)
134 our $export_ok = "++GITWEB_EXPORT_OK++";
135
136 # show repository only if this subroutine returns true
137 # when given the path to the project, for example:
138 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
139 our $export_auth_hook = undef;
140
141 # only allow viewing of repositories also shown on the overview page
142 our $strict_export = "++GITWEB_STRICT_EXPORT++";
143
144 # list of git base URLs used for URL to where fetch project from,
145 # i.e. full URL is "$git_base_url/$project"
146 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
147
148 # default blob_plain mimetype and default charset for text/plain blob
149 our $default_blob_plain_mimetype = 'text/plain';
150 our $default_text_plain_charset  = undef;
151
152 # file to use for guessing MIME types before trying /etc/mime.types
153 # (relative to the current git repository)
154 our $mimetypes_file = undef;
155
156 # assume this charset if line contains non-UTF-8 characters;
157 # it should be a valid encoding (see Encode::Supported(3pm) for list),
158 # for which encoding all byte sequences are valid, for example
159 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
160 # could be even 'utf-8' for the old behavior)
161 our $fallback_encoding = 'latin1';
162
163 # rename detection options for git-diff and git-diff-tree
164 # - default is '-M', with the cost proportional to
165 #   (number of removed files) * (number of new files).
166 # - more costly is '-C' (which implies '-M'), with the cost proportional to
167 #   (number of changed files + number of removed files) * (number of new files)
168 # - even more costly is '-C', '--find-copies-harder' with cost
169 #   (number of files in the original tree) * (number of new files)
170 # - one might want to include '-B' option, e.g. '-B', '-M'
171 our @diff_opts = ('-M'); # taken from git_commit
172
173 # Disables features that would allow repository owners to inject script into
174 # the gitweb domain.
175 our $prevent_xss = 0;
176
177 # Path to the highlight executable to use (must be the one from
178 # http://www.andre-simon.de due to assumptions about parameters and output).
179 # Useful if highlight is not installed on your webserver's PATH.
180 # [Default: highlight]
181 our $highlight_bin = "++HIGHLIGHT_BIN++";
182
183 # information about snapshot formats that gitweb is capable of serving
184 our %known_snapshot_formats = (
185         # name => {
186         #       'display' => display name,
187         #       'type' => mime type,
188         #       'suffix' => filename suffix,
189         #       'format' => --format for git-archive,
190         #       'compressor' => [compressor command and arguments]
191         #                       (array reference, optional)
192         #       'disabled' => boolean (optional)}
193         #
194         'tgz' => {
195                 'display' => 'tar.gz',
196                 'type' => 'application/x-gzip',
197                 'suffix' => '.tar.gz',
198                 'format' => 'tar',
199                 'compressor' => ['gzip', '-n']},
200
201         'tbz2' => {
202                 'display' => 'tar.bz2',
203                 'type' => 'application/x-bzip2',
204                 'suffix' => '.tar.bz2',
205                 'format' => 'tar',
206                 'compressor' => ['bzip2']},
207
208         'txz' => {
209                 'display' => 'tar.xz',
210                 'type' => 'application/x-xz',
211                 'suffix' => '.tar.xz',
212                 'format' => 'tar',
213                 'compressor' => ['xz'],
214                 'disabled' => 1},
215
216         'zip' => {
217                 'display' => 'zip',
218                 'type' => 'application/x-zip',
219                 'suffix' => '.zip',
220                 'format' => 'zip'},
221 );
222
223 # Aliases so we understand old gitweb.snapshot values in repository
224 # configuration.
225 our %known_snapshot_format_aliases = (
226         'gzip'  => 'tgz',
227         'bzip2' => 'tbz2',
228         'xz'    => 'txz',
229
230         # backward compatibility: legacy gitweb config support
231         'x-gzip' => undef, 'gz' => undef,
232         'x-bzip2' => undef, 'bz2' => undef,
233         'x-zip' => undef, '' => undef,
234 );
235
236 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
237 # are changed, it may be appropriate to change these values too via
238 # $GITWEB_CONFIG.
239 our %avatar_size = (
240         'default' => 16,
241         'double'  => 32
242 );
243
244 # Used to set the maximum load that we will still respond to gitweb queries.
245 # If the server load exceeds this value then return a "503 server busy" error.
246 # If gitweb cannot determine the server load, it is taken to be 0.
247 # Leave it undefined (or set to 'undef') to turn off load checking.
248 our $maxload = 300;
249
250 # configuration for 'highlight' (http://www.andre-simon.de/)
251 # match by basename
252 our %highlight_basename = (
253         #'Program' => 'py',
254         #'Library' => 'py',
255         'SConstruct' => 'py', # SCons equivalent of Makefile
256         'Makefile' => 'make',
257 );
# match by extension
#
# Maps a file extension to the name of the 'highlight' syntax definition.
# Every map() is wrapped in its own parentheses: map takes a LIST, so an
# unparenthesized map would also consume all entries that follow it, and
# the leading identity map would then map every extension to itself
# (e.g. 'h' => 'h' instead of 'h' => 'c').
our %highlight_ext = (
        # main extensions, defining name of syntax;
        # see files in /usr/share/highlight/langDefs/ directory
        (map { $_ => $_ }
                qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make)),
        # alternate extensions, see /etc/highlight/filetypes.conf
        'h' => 'c',
        (map { $_ => 'sh'  } qw(bash zsh ksh)),
        (map { $_ => 'cpp' } qw(cxx c++ cc)),
        (map { $_ => 'php' } qw(php3 php4 php5 phps)),
        (map { $_ => 'pl'  } qw(perl pm)), # perhaps also 'cgi'
        (map { $_ => 'make'} qw(mak mk)),
        (map { $_ => 'xml' } qw(xhtml html htm)),
);
273
274 # You define site-wide feature defaults here; override them with
275 # $GITWEB_CONFIG as necessary.
276 our %feature = (
277         # feature => {
278         #       'sub' => feature-sub (subroutine),
279         #       'override' => allow-override (boolean),
280         #       'default' => [ default options...] (array reference)}
281         #
282         # if feature is overridable (it means that allow-override has true value),
283         # then feature-sub will be called with default options as parameters;
284         # return value of feature-sub indicates if to enable specified feature
285         #
286         # if there is no 'sub' key (no feature-sub), then feature cannot be
287         # overridden
288         #
289         # use gitweb_get_feature(<feature>) to retrieve the <feature> value
290         # (an array) or gitweb_check_feature(<feature>) to check if <feature>
291         # is enabled
292
293         # Enable the 'blame' blob view, showing the last commit that modified
294         # each line in the file. This can be very CPU-intensive.
295
296         # To enable system wide have in $GITWEB_CONFIG
297         # $feature{'blame'}{'default'} = [1];
298         # To have project specific config enable override in $GITWEB_CONFIG
299         # $feature{'blame'}{'override'} = 1;
300         # and in project config gitweb.blame = 0|1;
301         'blame' => {
302                 'sub' => sub { feature_bool('blame', @_) },
303                 'override' => 0,
304                 'default' => [0]},
305
306         # Enable the 'snapshot' link, providing a compressed archive of any
307         # tree. This can potentially generate high traffic if you have large
308         # project.
309
310         # Value is a list of formats defined in %known_snapshot_formats that
311         # you wish to offer.
312         # To disable system wide have in $GITWEB_CONFIG
313         # $feature{'snapshot'}{'default'} = [];
314         # To have project specific config enable override in $GITWEB_CONFIG
315         # $feature{'snapshot'}{'override'} = 1;
316         # and in project config, a comma-separated list of formats or "none"
317         # to disable.  Example: gitweb.snapshot = tbz2,zip;
318         'snapshot' => {
319                 'sub' => \&feature_snapshot,
320                 'override' => 0,
321                 'default' => ['tgz']},
322
323         # Enable text search, which will list the commits which match author,
324         # committer or commit text to a given string.  Enabled by default.
325         # Project specific override is not supported.
326         #
327         # Note that this controls all search features, which means that if
328         # it is disabled, then 'grep' and 'pickaxe' search would also be
329         # disabled.
330         'search' => {
331                 'override' => 0,
332                 'default' => [1]},
333
334         # Enable grep search, which will list the files in currently selected
335         # tree containing the given string. Enabled by default. This can be
336         # potentially CPU-intensive, of course.
337         # Note that you need to have 'search' feature enabled too.
338
339         # To enable system wide have in $GITWEB_CONFIG
340         # $feature{'grep'}{'default'} = [1];
341         # To have project specific config enable override in $GITWEB_CONFIG
342         # $feature{'grep'}{'override'} = 1;
343         # and in project config gitweb.grep = 0|1;
344         'grep' => {
345                 'sub' => sub { feature_bool('grep', @_) },
346                 'override' => 0,
347                 'default' => [1]},
348
349         # Enable the pickaxe search, which will list the commits that modified
350         # a given string in a file. This can be practical and quite faster
351         # alternative to 'blame', but still potentially CPU-intensive.
352         # Note that you need to have 'search' feature enabled too.
353
354         # To enable system wide have in $GITWEB_CONFIG
355         # $feature{'pickaxe'}{'default'} = [1];
356         # To have project specific config enable override in $GITWEB_CONFIG
357         # $feature{'pickaxe'}{'override'} = 1;
358         # and in project config gitweb.pickaxe = 0|1;
359         'pickaxe' => {
360                 'sub' => sub { feature_bool('pickaxe', @_) },
361                 'override' => 0,
362                 'default' => [1]},
363
364         # Enable showing size of blobs in a 'tree' view, in a separate
365         # column, similar to what 'ls -l' does.  This costs a bit of I/O.
366
367         # To disable system wide have in $GITWEB_CONFIG
368         # $feature{'show-sizes'}{'default'} = [0];
369         # To have project specific config enable override in $GITWEB_CONFIG
370         # $feature{'show-sizes'}{'override'} = 1;
371         # and in project config gitweb.showsizes = 0|1;
372         'show-sizes' => {
373                 'sub' => sub { feature_bool('showsizes', @_) },
374                 'override' => 0,
375                 'default' => [1]},
376
377         # Make gitweb use an alternative format of the URLs which can be
378         # more readable and natural-looking: project name is embedded
379         # directly in the path and the query string contains other
380         # auxiliary information. All gitweb installations recognize
381         # URL in either format; this configures in which formats gitweb
382         # generates links.
383
384         # To enable system wide have in $GITWEB_CONFIG
385         # $feature{'pathinfo'}{'default'} = [1];
386         # Project specific override is not supported.
387
388         # Note that you will need to change the default location of CSS,
389         # favicon, logo and possibly other files to an absolute URL. Also,
390         # if gitweb.cgi serves as your indexfile, you will need to force
391         # $my_uri to contain the script name in your $GITWEB_CONFIG.
392         'pathinfo' => {
393                 'override' => 0,
394                 'default' => [0]},
395
396         # Make gitweb consider projects in project root subdirectories
397         # to be forks of existing projects. Given project $projname.git,
398         # projects matching $projname/*.git will not be shown in the main
399         # projects list, instead a '+' mark will be added to $projname
400         # there and a 'forks' view will be enabled for the project, listing
401         # all the forks. If project list is taken from a file, forks have
402         # to be listed after the main project.
403
404         # To enable system wide have in $GITWEB_CONFIG
405         # $feature{'forks'}{'default'} = [1];
406         # Project specific override is not supported.
407         'forks' => {
408                 'override' => 0,
409                 'default' => [0]},
410
411         # Insert custom links to the action bar of all project pages.
412         # This enables you mainly to link to third-party scripts integrating
413         # into gitweb; e.g. git-browser for graphical history representation
414         # or custom web-based repository administration interface.
415
416         # The 'default' value consists of a list of triplets in the form
417         # (label, link, position) where position is the label after which
418         # to insert the link and link is a format string where %n expands
419         # to the project name, %f to the project path within the filesystem,
420         # %h to the current hash (h gitweb parameter) and %b to the current
421         # hash base (hb gitweb parameter); %% expands to %.
422
423         # To enable system wide have in $GITWEB_CONFIG e.g.
424         # $feature{'actions'}{'default'} = [('graphiclog',
425         #       '/git-browser/by-commit.html?r=%n', 'summary')];
426         # Project specific override is not supported.
427         'actions' => {
428                 'override' => 0,
429                 'default' => []},
430
431         # Allow gitweb to scan project content tags of the project repository,
432         # and display the popular Web 2.0-ish "tag cloud" near the projects
433         # list.  Note that this is something COMPLETELY different from the
434         # normal Git tags.
435
436         # gitweb by itself can show existing tags, but it does not handle
437         # tagging itself; you need to do it externally, outside gitweb.
438         # The format is described in git_get_project_ctags() subroutine.
439         # You may want to install the HTML::TagCloud Perl module to get
440         # a pretty tag cloud instead of just a list of tags.
441
442         # To enable system wide have in $GITWEB_CONFIG
443         # $feature{'ctags'}{'default'} = [1];
444         # Project specific override is not supported.
445
446         # In the future whether ctags editing is enabled might depend
447         # on the value, but using 1 should always mean no editing of ctags.
448         'ctags' => {
449                 'override' => 0,
450                 'default' => [0]},
451
452         # The maximum number of patches in a patchset generated in patch
453         # view. Set this to 0 or undef to disable patch view, or to a
454         # negative number to remove any limit.
455
456         # To disable system wide have in $GITWEB_CONFIG
457         # $feature{'patches'}{'default'} = [0];
458         # To have project specific config enable override in $GITWEB_CONFIG
459         # $feature{'patches'}{'override'} = 1;
460         # and in project config gitweb.patches = 0|n;
461         # where n is the maximum number of patches allowed in a patchset.
462         'patches' => {
463                 'sub' => \&feature_patches,
464                 'override' => 0,
465                 'default' => [16]},
466
467         # Avatar support. When this feature is enabled, views such as
468         # shortlog or commit will display an avatar associated with
469         # the email of the committer(s) and/or author(s).
470
471         # Currently available providers are gravatar and picon.
472         # If an unknown provider is specified, the feature is disabled.
473
474         # Gravatar depends on Digest::MD5.
475         # Picon currently relies on the indiana.edu database.
476
477         # To enable system wide have in $GITWEB_CONFIG
478         # $feature{'avatar'}{'default'} = ['<provider>'];
479         # where <provider> is either gravatar or picon.
480         # To have project specific config enable override in $GITWEB_CONFIG
481         # $feature{'avatar'}{'override'} = 1;
482         # and in project config gitweb.avatar = <provider>;
483         'avatar' => {
484                 'sub' => \&feature_avatar,
485                 'override' => 0,
486                 'default' => ['']},
487
488         # Enable displaying how much time and how many git commands
489         # it took to generate and display page.  Disabled by default.
490         # Project specific override is not supported.
491         'timed' => {
492                 'override' => 0,
493                 'default' => [0]},
494
495         # Enable turning some links into links to actions which require
496         # JavaScript to run (like 'blame_incremental').  Not enabled by
497         # default.  Project specific override is currently not supported.
498         'javascript-actions' => {
499                 'override' => 0,
500                 'default' => [0]},
501
502         # Enable and configure ability to change common timezone for dates
503         # in gitweb output via JavaScript.  Enabled by default.
504         # Project specific override is not supported.
505         'javascript-timezone' => {
506                 'override' => 0,
507                 'default' => [
508                         'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
509                                      # or undef to turn off this feature
510                         'gitweb_tz', # name of cookie where to store selected timezone
511                         'datetime',  # CSS class used to mark up dates for manipulation
512                 ]},
513
514         # Syntax highlighting support. This is based on Daniel Svensson's
515         # and Sham Chukoury's work in gitweb-xmms2.git.
516         # It requires the 'highlight' program present in $PATH,
517         # and therefore is disabled by default.
518
519         # To enable system wide have in $GITWEB_CONFIG
520         # $feature{'highlight'}{'default'} = [1];
521
522         'highlight' => {
523                 'sub' => sub { feature_bool('highlight', @_) },
524                 'override' => 0,
525                 'default' => [0]},
526
527         # Enable displaying of remote heads in the heads list
528
529         # To enable system wide have in $GITWEB_CONFIG
530         # $feature{'remote_heads'}{'default'} = [1];
531         # To have project specific config enable override in $GITWEB_CONFIG
532         # $feature{'remote_heads'}{'override'} = 1;
533         # and in project config gitweb.remote_heads = 0|1;
534         'remote_heads' => {
535                 'sub' => sub { feature_bool('remote_heads', @_) },
536                 'override' => 0,
537                 'default' => [0]},
538 );
539
# Return the list of option values for feature $name from %feature.
#
# Returns nothing if the feature is unknown.  The site-wide defaults are
# returned unless the feature is marked overridable and a project is
# selected ($git_dir is defined); in that case the feature-sub is called
# with the defaults and its result is returned.  An overridable feature
# without a feature-sub triggers a warning and yields the defaults.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $entry    = $feature{$name};
        my $sub      = $entry->{'sub'};
        my $override = $entry->{'override'};
        my @defaults = @{ $entry->{'default'} };

        # project specific override is possible only if we have project
        our $git_dir; # global variable, declared later
        return @defaults unless $override && defined $git_dir;

        unless (defined $sub) {
                warn "feature $name is not overridable";
                return @defaults;
        }
        return $sub->(@defaults);
}
558
# Convenience wrapper returning only the first value of a feature, which
# is handy for features that are simple on/off switches.  It lets you write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# in place of
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
        my @values = gitweb_get_feature(@_);
        # no values at all: empty list (undef in scalar context)
        return @values ? $values[0] : ();
}
573
574
# Feature-sub for on/off features: reads the per-project configuration
# variable for $key via git_get_project_config($key, '--bool') and turns
# it into a one-element list.
#
# Parameters: $key - configuration key (e.g. 'blame' for gitweb.blame);
#             the remaining arguments are the feature's default options.
# Returns:    (1) if the value is 'true', (0) if it is 'false', and the
#             first default option otherwise.
sub feature_bool {
        my $key = shift;
        my ($val) = git_get_project_config($key, '--bool');

        if (defined $val) {
                return (1) if $val eq 'true';
                return (0) if $val eq 'false';
        }

        # Unset or unrecognized value: keep the default instead of falling
        # off the end of the sub with an unspecified implicit return value.
        return ($_[0]);
}
587
# Feature-sub for 'snapshot': the per-project 'snapshot' configuration
# value, when set to a true value, replaces the default list of formats.
# The value 'none' selects no formats; anything else is split on commas
# and/or whitespace.
sub feature_snapshot {
        my @formats = @_;

        my ($configured) = git_get_project_config('snapshot');

        if ($configured) {
                if ($configured eq 'none') {
                        @formats = ();
                } else {
                        @formats = split /\s*[,\s]\s*/, $configured;
                }
        }

        return @formats;
}
599
# Feature-sub for 'patches': use the per-project 'patches' configuration
# value (requested with '--int') if git_get_project_config() returns
# anything, otherwise fall back to the first default option.
sub feature_patches {
        my @configured = (git_get_project_config('patches', '--int'));

        return @configured ? @configured : ($_[0]);
}
609
# Feature-sub for 'avatar': the per-project 'avatar' configuration value
# wins if git_get_project_config() returns anything; otherwise the default
# options are passed through unchanged.
sub feature_avatar {
        my @configured = (git_get_project_config('avatar'));

        if (@configured) {
                return @configured;
        }
        return @_;
}
615
# Check that $dir contains a usable HEAD.
#
# Testing the HEAD file with -e alone is fragile: in a repository that was
# initialized long ago (HEAD is a symlink) and was later pack-ref'ed and
# pruned, the symlink may dangle.  Such a HEAD is still accepted as long as
# the symlink points below refs/heads/.
sub check_head_link {
        my ($dir) = @_;
        my $head = "$dir/HEAD";

        return 1 if -e $head;
        return (-l $head && readlink($head) =~ m{^refs/heads/});
}
625
# Decide whether the repository in $dir may be shown.  All of these must
# hold: the HEAD check passes, the $export_ok marker file exists (only if
# $export_ok is set), and $export_auth_hook approves $dir (only if a hook
# is set).  The checks are evaluated in that order and stop at the first
# failure, whose false value is returned.
sub check_export_ok {
        my ($dir) = @_;

        my $head_ok = check_head_link($dir);
        return $head_ok unless $head_ok;

        my $marker_ok = (!$export_ok || -e "$dir/$export_ok");
        return $marker_ok unless $marker_ok;

        return (!$export_auth_hook || $export_auth_hook->($dir));
}
632
# Normalize a list of snapshot format names.
#
# Alternate names found in %known_snapshot_format_aliases are replaced by
# their canonical name (for backward compatibility); aliases that map to
# undef are dropped.  Formats that are not in %known_snapshot_formats, or
# that are marked 'disabled' there, are filtered out.
#
# Returns the filtered list of format names.
sub filter_snapshot_fmts {
        my @fmts = @_;

        @fmts = map {
                (defined $_ && exists $known_snapshot_format_aliases{$_}) ?
                       $known_snapshot_format_aliases{$_} : $_} @fmts;
        # The 'defined' test keeps undef (legacy aliases) from being used as
        # a hash key, which would raise "uninitialized value" warnings.
        @fmts = grep {
                defined $_ &&
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}} @fmts;

        return @fmts;
}
645
646 # If it is set to a code reference, that code is run once per request,
647 # which allows updating configuration that changes with each request,
648 # while running other code in config file only once.
649 #
650 # Otherwise, if it is false then gitweb would process config file only once;
651 # if it is true then gitweb config would be run for each request.
652 our $per_request_config = 1;
653
# Read and evaluate the gitweb config file named by the argument.
#
# Returns 1 if the file exists and was processed, and nothing (false) if
# the name is undefined or the file does not exist; this allows chaining
# calls so that the first existing file is used.  Dies with the error in
# $@ if evaluating the file fails, as that is unrecoverable.
sub read_config_file {
        my ($filename) = @_;

        return unless defined $filename && -e $filename;

        do $filename;
        # die if there are errors parsing config file
        die $@ if $@;
        return 1;
}
669
our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);

# Determine the config file names (environment variables take precedence
# over the built-in values) and read the config files.
sub evaluate_gitweb_config {
        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

        # Protect against duplicated file names, so that no config file is
        # read twice.  Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM
        # is used, so a duplicate between those two does not matter.
        # (the loop variable aliases the globals, so they are blanked in place)
        for my $config_name ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM) {
                $config_name = "" if ($config_name eq $GITWEB_CONFIG_COMMON);
        }

        # Common system-wide settings for convenience.
        # Those settings can be overridden by GITWEB_CONFIG or
        # GITWEB_CONFIG_SYSTEM.
        read_config_file($GITWEB_CONFIG_COMMON);

        # Use the first config file that exists: the per-instance
        # GITWEB_CONFIG if it exists, otherwise GITWEB_CONFIG_SYSTEM.
        return if read_config_file($GITWEB_CONFIG);
        read_config_file($GITWEB_CONFIG_SYSTEM);
}
691
# Get the load average of the system, to compare against $maxload.
# Currently this needs '/proc/loadavg'; if that file is absent or cannot
# be opened, 0 is returned, which means no load checking.
sub get_loadavg {
        my $loadavg_file = '/proc/loadavg';

        # additional checks for load average should go here for things that
        # don't export /proc/loadavg
        return 0 unless -e $loadavg_file;

        open my $fd, '<', $loadavg_file
                or return 0;
        my $line = <$fd>;
        close $fd;

        # The first three columns measure CPU and IO utilization over the
        # last one, five, and 15 minute periods.  The fourth column shows the
        # number of currently running processes and the total number of
        # processes in the m/n format.  The last column displays the last
        # process ID used.  Only the first column is used here.
        my $one_minute_load = (split(/\s+/, $line))[0];
        return $one_minute_load || 0;
}
713
# version of the core git binary
our $git_version;

# Run "$GIT --version" and store the reported version string in
# $git_version, or "unknown" if the output does not have the expected
# form.  The invocation is counted in $number_of_git_cmds.
sub evaluate_git_version {
        my ($reported) = qx("$GIT" --version) =~ m/git version (.*)$/;
        our $git_version = defined $reported ? $reported : "unknown";
        $number_of_git_cmds++;
}
720
# Refuse the request with a 503 error when load checking is enabled
# ($maxload is defined) and the current load average exceeds $maxload.
sub check_loadavg {
        die_error(503, "The load average on the server is too high")
                if (defined $maxload && get_loadavg() > $maxload);
}
726
727 # ======================================================================
728 # input validation and dispatch
729
# Input parameters may arrive from several sources (presently the CGI query
# and PATH_INFO).  All of them are gathered in %input_params during
# validation, so that later users (e.g. href()) do not need to care where
# a parameter came from.

our %input_params = ();

# %input_params is keyed by the long parameter name.  The table below maps
# each long name to its (short) CGI query key; it is kept in this direction,
# and not the reverse, because href() is its most frequent user and needs
# exactly the name -> CGI key conversion.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
	'project'           => 'p',
	'action'            => 'a',
	'file_name'         => 'f',
	'file_parent'       => 'fp',
	'hash'              => 'h',
	'hash_parent'       => 'hp',
	'hash_base'         => 'hb',
	'hash_parent_base'  => 'hpb',
	'page'              => 'pg',
	'order'             => 'o',
	'searchtext'        => 's',
	'searchtype'        => 'st',
	'snapshot_format'   => 'sf',
	'extra_options'     => 'opt',
	'search_use_regexp' => 'sr',
	'ctag'              => 'by_tag',
	'diff_style'        => 'ds',
	'project_filter'    => 'pf',
	# this must be last entry (for manipulation from JavaScript)
	'javascript'        => 'js',
);
# the same mapping as a hash, for lookup by long name
our %cgi_param_mapping = @cgi_param_mapping;
768
# Table of all known actions: maps the action name to the subroutine
# implementing it.  It is also what action names are validated against.
our %actions = (
	'blame'             => \&git_blame,
	'blame_incremental' => \&git_blame_incremental,
	'blame_data'        => \&git_blame_data,
	'blobdiff'          => \&git_blobdiff,
	'blobdiff_plain'    => \&git_blobdiff_plain,
	'blob'              => \&git_blob,
	'blob_plain'        => \&git_blob_plain,
	'commitdiff'        => \&git_commitdiff,
	'commitdiff_plain'  => \&git_commitdiff_plain,
	'commit'            => \&git_commit,
	'forks'             => \&git_forks,
	'heads'             => \&git_heads,
	'history'           => \&git_history,
	'log'               => \&git_log,
	'patch'             => \&git_patch,
	'patches'           => \&git_patches,
	'remotes'           => \&git_remotes,
	'rss'               => \&git_rss,
	'atom'              => \&git_atom,
	'search'            => \&git_search,
	'search_help'       => \&git_search_help,
	'shortlog'          => \&git_shortlog,
	'summary'           => \&git_summary,
	'tag'               => \&git_tag,
	'tags'              => \&git_tags,
	'tree'              => \&git_tree,
	'snapshot'          => \&git_snapshot,
	'object'            => \&git_object,
	# those below don't need $project
	'opml'              => \&git_opml,
	'project_list'      => \&git_project_list,
	'project_index'     => \&git_project_index,
);
804
# Extra options (the 'extra_options' parameter) that may be passed on,
# each with the list of actions that accept it.
our %allowed_options = (
	'--no-merges' => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
);
810
# fill %input_params with the CGI parameters. All values except for 'opt'
# should be single values, but opt can be an array. We should probably
# build an array of parameters that can be multi-valued, but since for the time
# being it's only this one, we just single it out
#
# Every value is decoded from UTF-8; a parameter that is not present in
# the query is stored as undef (or as an empty array reference for 'opt').
sub evaluate_query_params {
	our $cgi;

	while (my ($name, $symbol) = each %cgi_param_mapping) {
		if ($symbol eq 'opt') {
			# Newer CGI.pm warns whenever param() is called in list
			# context and offers multi_param() for fetching all the
			# values; fall back to param() where it is not available.
			my @values = $cgi->can('multi_param')
				? $cgi->multi_param($symbol)
				: $cgi->param($symbol);
			$input_params{$name} = [ map { decode_utf8($_) } @values ];
		} else {
			# exactly one value is wanted here, so ask for a scalar
			$input_params{$name} = decode_utf8(scalar $cgi->param($symbol));
		}
	}
}
826
# now read PATH_INFO and update the parameter list for missing parameters
#
# The global $path_info is consumed piece by piece: first the project,
# then an optional action, then what remains is parsed as
#   [$hash_parent_base[:$file_parent]..]$hash[:$file_name]
# Nothing is done if the project was already given, and only the project
# is filled in if an action was already given in the query string.
# Other parameters are set only when they do not have a (true) value yet.
sub evaluate_path_info {
	return if defined $input_params{'project'};
	return if !$path_info;
	$path_info =~ s,^/+,,;
	return if !$path_info;

	# find which part of PATH_INFO is project: strip trailing path
	# components until what is left passes check_head_link()
	my $project = $path_info;
	$project =~ s,/+$,,;
	while ($project && !check_head_link("$projectroot/$project")) {
		$project =~ s,/*[^/]*$,,;
	}
	return unless $project;
	$input_params{'project'} = $project;

	# do not change any parameters if an action is given using the query string
	return if $input_params{'action'};
	$path_info =~ s,^\Q$project\E/*,,;

	# next, check if we have an action
	my $action = $path_info;
	$action =~ s,/.*$,,;
	if (exists $actions{$action}) {
		# the action is quoted like the project above, so that it is
		# always matched literally
		$path_info =~ s,^\Q$action\E/*,,;
		$input_params{'action'} = $action;
	}

	# list of actions that want hash_base instead of hash, but can have no
	# pathname (f) parameter
	my @wants_base = (
		'tree',
		'history',
	);

	# we want to catch, among others
	# [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
	my ($parentrefname, $parentpathname, $refname, $pathname) =
		($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

	# first, analyze the 'current' part
	if (defined $pathname) {
		# we got "branch:filename" or "branch:dir/"
		# we could use git_get_type(branch:pathname), but:
		# - it needs $git_dir
		# - it does a git() call
		# - the convention of terminating directories with a slash
		#   makes it superfluous
		# - embedding the action in the PATH_INFO would make it even
		#   more superfluous
		$pathname =~ s,^/+,,;
		if (!$pathname || substr($pathname, -1) eq "/") {
			$input_params{'action'} ||= "tree";
			$pathname =~ s,/$,,;
		} else {
			# the default action depends on whether we had parent info
			# or not
			if ($parentrefname) {
				$input_params{'action'} ||= "blobdiff_plain";
			} else {
				$input_params{'action'} ||= "blob_plain";
			}
		}
		$input_params{'hash_base'} ||= $refname;
		$input_params{'file_name'} ||= $pathname;
	} elsif (defined $refname) {
		# we got "branch". In this case we have to choose if we have to
		# set hash or hash_base.
		#
		# Most of the actions without a pathname only want hash to be
		# set, except for the ones specified in @wants_base that want
		# hash_base instead. It should also be noted that hand-crafted
		# links having 'history' as an action and no pathname or hash
		# set will fail, but that happens regardless of PATH_INFO.
		if (defined $parentrefname) {
			# if there is parent let the default be 'shortlog' action
			# (for http://git.example.com/repo.git/A..B links); if there
			# is no parent, dispatch will detect type of object and set
			# action appropriately if required (if action is not set)
			$input_params{'action'} ||= "shortlog";
		}
		if ($input_params{'action'} &&
		    grep { $_ eq $input_params{'action'} } @wants_base) {
			$input_params{'hash_base'} ||= $refname;
		} else {
			$input_params{'hash'} ||= $refname;
		}
	}

	# next, handle the 'parent' part, if present
	if (defined $parentrefname) {
		# a missing pathspec defaults to the 'current' filename, allowing e.g.
		# someproject/blobdiff/oldrev..newrev:/filename
		if ($parentpathname) {
			$parentpathname =~ s,^/+,,;
			$parentpathname =~ s,/$,,;
			$input_params{'file_parent'} ||= $parentpathname;
		} else {
			$input_params{'file_parent'} ||= $input_params{'file_name'};
		}
		# we assume that hash_parent_base is wanted if a path was specified,
		# or if the action wants hash_base instead of hash; the action
		# can still be unset here (e.g. for "A.." with nothing after
		# the dots), which simply means it does not want hash_base
		if (defined $input_params{'file_parent'} ||
		    (defined $input_params{'action'} &&
		     grep { $_ eq $input_params{'action'} } @wants_base)) {
			$input_params{'hash_parent_base'} ||= $parentrefname;
		} else {
			$input_params{'hash_parent'} ||= $parentrefname;
		}
	}

	# for the snapshot action, we allow URLs in the form
	# $project/snapshot/$hash.ext
	# where .ext determines the snapshot and gets removed from the
	# passed $refname to provide the $hash.
	#
	# To be able to tell that $refname includes the format extension, we
	# require the following two conditions to be satisfied:
	# - the hash input parameter MUST have been set from the $refname part
	#   of the URL (i.e. they must be equal)
	# - the snapshot format MUST NOT have been defined already (e.g. from
	#   CGI parameter sf)
	# It's also useless to try any matching unless $refname has a dot,
	# so we check for that too
	if (defined $input_params{'action'} &&
	    $input_params{'action'} eq 'snapshot' &&
	    defined $refname && index($refname, '.') != -1 &&
	    defined $input_params{'hash'} &&
	    $refname eq $input_params{'hash'} &&
	    !defined $input_params{'snapshot_format'}) {
		# We loop over the known snapshot formats, checking for
		# extensions. Allowed extensions are both the defined suffix
		# (which includes the initial dot already) and the snapshot
		# format key itself, with a prepended dot
		#
		# The loop is left early on a match, so it goes over a list of
		# keys rather than using each(): an each() iterator abandoned
		# half-way would make the next request, when served by the
		# same process, start in the middle of the hash.
		foreach my $fmt (sort keys %known_snapshot_formats) {
			my $opt = $known_snapshot_formats{$fmt};
			my $hash = $refname;
			unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
				next;
			}
			my $sfx = $1;
			# a valid suffix was found, so set the snapshot format
			# and reset the hash parameter
			$input_params{'snapshot_format'} = $fmt;
			$input_params{'hash'} = $hash;
			# we also set the format suffix to the one requested
			# in the URL: this way a request for e.g. .tgz returns
			# a .tgz instead of a .tar.gz
			$known_snapshot_formats{$fmt}{'suffix'} = $sfx;
			last;
		}
	}
}
977
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp, $project_filter);
# Copy the collected %input_params into the globals declared above,
# validating each of them on the way.  The first invalid parameter ends
# the request via die_error(); a parameter that was not given at all is
# left undefined and not checked.
sub evaluate_and_validate_params {
	our $action = $input_params{'action'};
	if (defined $action && !validate_action($action)) {
		die_error(400, "Invalid action parameter");
	}

	# parameters which are pathnames
	our $project = $input_params{'project'};
	if (defined $project && !validate_project($project)) {
		# the rejected name is dropped before the error is reported
		undef $project;
		die_error(404, "No such project");
	}

	our $project_filter = $input_params{'project_filter'};
	if (defined $project_filter && !validate_pathname($project_filter)) {
		die_error(404, "Invalid project_filter parameter");
	}

	our $file_name = $input_params{'file_name'};
	if (defined $file_name && !validate_pathname($file_name)) {
		die_error(400, "Invalid file parameter");
	}

	our $file_parent = $input_params{'file_parent'};
	if (defined $file_parent && !validate_pathname($file_parent)) {
		die_error(400, "Invalid file parent parameter");
	}

	# parameters which are refnames
	our $hash = $input_params{'hash'};
	if (defined $hash && !validate_refname($hash)) {
		die_error(400, "Invalid hash parameter");
	}

	our $hash_parent = $input_params{'hash_parent'};
	if (defined $hash_parent && !validate_refname($hash_parent)) {
		die_error(400, "Invalid hash parent parameter");
	}

	our $hash_base = $input_params{'hash_base'};
	if (defined $hash_base && !validate_refname($hash_base)) {
		die_error(400, "Invalid hash base parameter");
	}

	our @extra_options = @{$input_params{'extra_options'}};
	# @extra_options is always defined, since it can only be (currently) set from
	# CGI, and $cgi->param() returns the empty array in array context if the param
	# is not set
	foreach my $opt (@extra_options) {
		if (not exists $allowed_options{$opt}) {
			die_error(400, "Invalid option parameter");
		}
		# the option must be allowed for the requested action; with no
		# action given it cannot be, so it is rejected as well
		if (not (defined $action &&
		         grep { $_ eq $action } @{$allowed_options{$opt}})) {
			die_error(400, "Invalid option parameter for this action");
		}
	}

	our $hash_parent_base = $input_params{'hash_parent_base'};
	if (defined $hash_parent_base && !validate_refname($hash_parent_base)) {
		die_error(400, "Invalid hash parent base parameter");
	}

	# other parameters
	our $page = $input_params{'page'};
	if (defined $page && $page =~ m/[^0-9]/) {
		die_error(400, "Invalid page parameter");
	}

	our $searchtype = $input_params{'searchtype'};
	if (defined $searchtype && $searchtype =~ m/[^a-z]/) {
		die_error(400, "Invalid searchtype parameter");
	}

	our $search_use_regexp = $input_params{'search_use_regexp'};

	our $searchtext = $input_params{'searchtext'};
	our $search_regexp;
	if (defined $searchtext) {
		if (length($searchtext) < 2) {
			die_error(403, "At least two characters are required for search parameter");
		}
		if ($search_use_regexp) {
			$search_regexp = $searchtext;
			# The pattern comes straight from the user: compile it once
			# here, so that a malformed one is reported as a bad request
			# instead of blowing up wherever it is first matched.
			if (!eval { qr/$search_regexp/; 1; }) {
				# drop the " at FILE line N." part of perl's message
				(my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
				die_error(400, "Invalid search regexp", esc_html($error));
			}
		} else {
			$search_regexp = quotemeta $searchtext;
		}
	}
}
1087
# path to the current git repository; it is only (re)computed when
# a project was requested
our $git_dir;
sub evaluate_git_dir {
	our $git_dir;

	if ($project) {
		$git_dir = "$projectroot/$project";
	}
}
1093
our (@snapshot_fmts, $git_avatar);
# Set up the globals derived from the 'snapshot' and 'avatar' features.
sub configure_gitweb_features {
	our (@snapshot_fmts, $git_avatar);

	# list of supported snapshot formats
	@snapshot_fmts = gitweb_get_feature('snapshot');
	@snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

	# The avatar feature must name a known provider whose dependencies
	# are satisfied: 'gravatar' needs Digest::MD5, 'picon' needs nothing.
	# In any other case $git_avatar is reset to the empty string.
	($git_avatar) = gitweb_get_feature('avatar');
	my $provider_usable =
		  $git_avatar eq 'gravatar' ? eval { require Digest::MD5; 1; }
		: $git_avatar eq 'picon'    ? 1
		:                             0;
	$git_avatar = '' unless $provider_usable;
}
1113
# custom error handler: 'die <message>' is Internal Server Error
#
# Installed below through set_message(); it receives the error message
# and hands it over to die_error() for display.
sub handle_errors_html {
	my $msg = shift; # it is already HTML escaped

	# to avoid infinite loop where error occurs in die_error,
	# change handler to default handler, disabling handle_errors_html
	set_message("Error occurred when inside die_error:\n$msg");

	# you cannot jump out of die_error when called as error handler;
	# the subroutine set via CGI::Carp::set_message is called _after_
	# HTTP headers are already written, so it cannot write them itself
	die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1128
# dispatch: pick a default action if none was requested, check that the
# action can be run, and then run its handler from %actions
sub dispatch {
	unless (defined $action) {
		# guess the action from the parameters that were given
		if (defined $hash) {
			$action = git_get_type($hash)
				or die_error(404, "Object does not exist");
		} elsif (defined $hash_base && defined $file_name) {
			$action = git_get_type("$hash_base:$file_name")
				or die_error(404, "File or directory does not exist");
		} else {
			$action = defined $project ? 'summary' : 'project_list';
		}
	}

	defined($actions{$action})
		or die_error(400, "Unknown action");

	# every action but the ones listed here works on a project
	unless ($action =~ m/^(?:opml|project_list|project_index)$/ ||
	        $project) {
		die_error(400, "Project needed");
	}

	$actions{$action}->();
}
1153
# Restart the per-request statistics: the start time $t0 (only if it is
# in use, i.e. defined) and the count of git commands run.
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	if (defined $t0) {
		$t0 = [ gettimeofday() ];
	}
	$number_of_git_cmds = 0;
}
1159
# true until the first request has been served (see run())
our $first_request = 1;

# Serve a single request: (re)read the configuration as needed, collect
# and validate the parameters, then dispatch to the requested action.
sub run_request {
	reset_timer();

	evaluate_uri();

	# configuration and git version are evaluated once, on first request
	if ($first_request) {
		evaluate_gitweb_config();
		evaluate_git_version();
	}

	# $per_request_config is either a subroutine to run on each request,
	# or a true value asking to re-read the configuration on each request
	# (the first request has just read it above)
	if (ref($per_request_config) eq 'CODE') {
		$per_request_config->();
	} elsif ($per_request_config && !$first_request) {
		evaluate_gitweb_config();
	}

	check_loadavg();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list = $projectroot unless $projects_list;

	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1190
# tells run() whether to stop after the request just served
our $is_last_request = sub { 1 };
# optional hooks called by run() around listening and dispatching
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
# class used to create the request object, and the request object itself
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: requests are created by CGI::Fast, and
# the process stops serving once the request counter exceeds the limit.
sub configure_as_fcgi {
	our ($CGI, $is_last_request);

	require CGI::Fast;
	$CGI = 'CGI::Fast';

	# let each child service 100 requests
	my $requests_seen = 0;
	$is_last_request = sub { return ++$requests_seen > 100; };
}
# Work out how the script is being run: a script name ending in '.fcgi'
# turns FastCGI mode on, and so does the --fastcgi command line option;
# --nproc=N additionally sets up FCGI::ProcManager (if it can be loaded).
sub evaluate_argv {
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return unless (@ARGV);

	# handler for --nproc: install the process manager hooks used by run()
	my $use_proc_manager = sub {
		my ($arg, $val) = @_;
		return unless eval { require FCGI::ProcManager; 1; };

		our ($pre_listen_hook, $pre_dispatch_hook, $post_dispatch_hook);
		my $proc_manager = FCGI::ProcManager->new({
			n_processes => $val,
		});
		$pre_listen_hook    = sub { $proc_manager->pm_manage()        };
		$pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
		$post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i'      => $use_proc_manager,
	);
}
1225
# Main loop: serve requests, one after another, for as long as new
# request objects can be created and $is_last_request does not say stop.
sub run {
	evaluate_argv();

	$first_request = 1;
	if ($pre_listen_hook) {
		$pre_listen_hook->();
	}

 REQUEST:
	while ($cgi = $CGI->new()) {
		if ($pre_dispatch_hook) {
			$pre_dispatch_hook->();
		}

		run_request();

		if ($post_dispatch_hook) {
			$post_dispatch_hook->();
		}
		$first_request = 0;

		$is_last_request->()
			and last REQUEST;
	}

 DONE_GITWEB:
	1;
}
1250
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI) there is a caller
# to return to; a pure CGI script, serving single request, simply exits.
return if defined caller;
exit;
1261
1262 ## ======================================================================
1263 ## action links
1264
# Build a gitweb URL from named parameters (the long names of
# @cgi_param_mapping, e.g. action => 'log', hash => $id).  The project
# defaults to the current one.  As many parameters as possible are put
# in the PATH_INFO part if path_info URLs are in use; the remaining ones
# go to the query string, in the order of @cgi_param_mapping.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	# implicit -replay, must be first of implicit params
	$params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		# take over every parameter of the current request that the
		# caller did not mention
		foreach my $name (keys %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_path_info($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot
		# (the action may well be missing, hence the defined check)
		my $is_snapshot = defined $params{'action'} &&
		                  $params{'action'} eq 'snapshot';

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_path_info($params{'action'})
				unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
			|| $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_path_info($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# a name containing '..' cannot go in the
						# path; it stays behind as a query parameter
						$href .= ":/".esc_path_info($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_path_info($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_path_info($params{'hash_base'});
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_path_info($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_path_info($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				# a multi-valued parameter repeats its key
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	# final transformation: trailing spaces must be escaped (URI-encoded)
	$href =~ s/(\s+)$/CGI::escape($1)/e;

	if ($params{-anchor}) {
		$href .= "#".esc_param($params{-anchor});
	}

	return $href;
}
1394
1395
1396 ## ======================================================================
1397 ## validation, quoting/unquoting and escaping
1398
# Return the given action name if it is one of the known %actions,
# undef otherwise (also for a missing or false name).
sub validate_action {
	my $candidate = shift;

	return undef unless $candidate && exists $actions{$candidate};
	return $candidate;
}
1404
# Return the given project name if it is acceptable, undef otherwise.
# To be acceptable the name has to be a valid pathname, be a directory
# below $projectroot, pass check_export_ok() and, if $strict_export
# is set, be in the list of projects.
sub validate_project {
	my $name = shift || return undef;

	return undef unless validate_pathname($name);

	my $project_dir = "$projectroot/$name";
	return undef unless -d $project_dir;
	return undef unless check_export_ok($project_dir);
	return undef if $strict_export && !project_in_list($name);

	return $name;
}
1416
# Return the given pathname if it is acceptable, undef otherwise
# (also for a missing or false pathname).
sub validate_pathname {
	my $path = shift || return undef;

	# no '.' or '..' as elements of path, i.e. no '.' nor '..'
	# at the beginning, at the end, and between slashes.
	# also this catches doubled slashes
	return undef if $path =~ m!(^|/)(|\.|\.\.)(/|$)!;

	# no null characters
	return undef if $path =~ m!\0!;

	return $path;
}
1432
# Return the given ref name (or object id) if it is acceptable,
# undef otherwise (also for a missing or false name).
sub validate_refname {
	my $refname = shift || return undef;

	# textual hashes are O.K.
	return $refname if $refname =~ m/^[0-9a-fA-F]{40}$/;

	# it must be correct pathname
	$refname = validate_pathname($refname)
		or return undef;

	# restrictions on ref name according to git-check-ref-format
	return undef if $refname =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

	return $refname;
}
1449
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Octets that cannot be decoded as utf8 are decoded using
# $fallback_encoding instead; undef is passed through.
sub to_utf8 {
	my ($str) = @_;
	defined $str or return undef;

	# nothing more to do if the string was decoded already, or if
	# it could be decoded as utf8 right here
	return $str if utf8::is_utf8($str) || utf8::decode($str);

	return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1463
# Escape a value for use in the query string of a URL.
# Unsafe characters are quoted, but the slash is kept, even when it's
# not correct, as quoted slashes look too horrible in bookmarks;
# spaces are turned into '+'.  undef is passed through.
sub esc_param {
	my ($str) = @_;
	defined $str or return undef;

	$str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$str =~ tr/ /+/;
	return $str;
}
1473
# Quote unsafe characters in a path_info fragment.  The rules differ
# slightly from esc_param(): path_info doesn't treat '+' as space
# (specially), so both are left alone, but '?' must be escaped.
# Returns undef for undefined input.
sub esc_path_info {
	my ($fragment) = @_;
	return undef unless defined $fragment;

	$fragment =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

	return $fragment;
}
1484
# Quote unsafe characters in a whole URL; characters that have a meaning
# in URL syntax (such as '?', '&', '=' and ';') therefore stay unquoted.
# Spaces are turned into '+'.  Returns undef for undefined input.
sub esc_url {
	my ($url) = @_;
	return undef unless defined $url;

	$url =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$url =~ tr/ /+/;

	return $url;
}
1493
# Quote unsafe characters in HTML attribute values.  For XHTML
# conformance escaping '"' to '&quot;' is not enough, so the full
# esc_html() treatment is applied; all arguments are passed through.
sub esc_attr {
	my @args = @_;

	return esc_html(@args);
}
1500
# Escape a string for output as HTML text: decode it with to_utf8(),
# HTML-escape it, and make control characters other than tab visible with
# quot_cec().  With the option -nbsp => 1 every space becomes '&nbsp;'.
# Returns undef for undefined input.
sub esc_html {
	my ($str, %opts) = @_;
	return undef unless defined $str;

	$str = $cgi->escapeHTML(to_utf8($str));
	$str =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	# tabs pass through unchanged, every other control character is quoted
	$str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;

	return $str;
}
1516
# Escape a filename for output as HTML text: decode it with to_utf8(),
# HTML-escape it, and make every control character (tab included) visible
# with quot_cec().  With the option -nbsp => 1 every space becomes
# '&nbsp;'.  Returns undef for undefined input.
sub esc_path {
	my ($path, %opts) = @_;
	return undef unless defined $path;

	$path = $cgi->escapeHTML(to_utf8($path));
	$path =~ s/ /&nbsp;/g if $opts{'-nbsp'};
	$path =~ s|([[:cntrl:]])|quot_cec($1)|eg;

	return $path;
}
1532
# Sanitize for use in XHTML + application/xhtml+xml (valid XML 1.0):
# decode the string with to_utf8() and make control characters visible
# with quot_cec(), except for tab, line feed and carriage return, which
# are kept as they are.  Returns undef for undefined input.
sub sanitize {
	my $str = shift;

	return undef unless defined $str;

	$str = to_utf8($str);
	# Do not test $1 with a regexp here: a successful match without
	# capture groups resets $1, so the character that was meant to be
	# kept would be replaced by undef.  index() leaves $1 alone.
	$str =~ s|([[:cntrl:]])|(index("\t\n\r", $1) != -1 ? $1 : quot_cec($1))|eg;
	return $str;
}
1543
# Make control characters "printable", using character escape codes (CEC).
# Characters with a well known escape sequence are shown as that sequence;
# anything else is shown as a backslash followed by its two-digit
# hexadecimal code.  The result is wrapped in <span class="cntrl">
# unless the option -nohtml is true.
sub quot_cec {
	my $cntrl = shift;
	my %opts = @_;
	my %es = ( # character escape codes, aka escape sequences
		"\t" => '\t',   # tab             (HT)
		"\n" => '\n',   # line feed       (LF)
		"\r" => '\r',   # carriage return (CR)
		"\f" => '\f',   # form feed       (FF)
		"\b" => '\b',   # backspace       (BS)
		"\a" => '\a',   # alarm (bell)    (BEL)
		"\e" => '\e',   # escape          (ESC)
		"\013" => '\v', # vertical tab    (VT)
		"\000" => '\0', # nul character   (NUL)
	);
	# zero-pad the hex code: '%2x' would pad with a space and turn
	# chr(1) into '\ 1'
	my $chr = ( (exists $es{$cntrl})
		    ? $es{$cntrl}
		    : sprintf('\%02x', ord($cntrl)) );
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1568
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR).  The picture is emitted as a
# decimal character reference, wrapped in <span class="cntrl"> unless
# the option -nohtml is true.
sub quot_upr {
	my $cntrl = shift;
	my %opts = @_;

	my $code = ord($cntrl);
	# the pictures for the C0 controls sit at U+2400 + code, but the
	# picture for DEL (0x7f) is U+2421, not U+247F
	my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

	my $chr = sprintf('&#%04d;', $picture);
	if ($opts{-nohtml}) {
		return $chr;
	} else {
		return "<span class=\"cntrl\">$chr</span>";
	}
}
1582
# Translate one escape sequence of a quoted filename, given without its
# leading backslash, into the character it stands for; helper of unquote()
sub unq {
	my ($seq) = @_;

	# octal char sequence
	return chr(oct($seq)) if ($seq =~ m/^[0-7]{1,3}$/);

	my %es = ( # character escape codes, aka escape sequences
		't' => "\t",   # tab            (HT, TAB)
		'n' => "\n",   # newline        (NL)
		'r' => "\r",   # return         (CR)
		'f' => "\f",   # form feed      (FF)
		'b' => "\b",   # backspace      (BS)
		'a' => "\a",   # alarm (bell)   (BEL)
		'e' => "\e",   # escape         (ESC)
		'v' => "\013", # vertical tab   (VT)
	);

	# C escape sequence if known, otherwise a quoted ordinary character
	return (exists $es{$seq}) ? $es{$seq} : $seq;
}

# git may return quoted and escaped filenames; strip the surrounding
# double quotes and undo the escaping.  Strings that are not enclosed in
# double quotes are returned as they are.
sub unquote {
	my ($str) = @_;

	if ($str =~ m/^"(.*)"$/) {
		# needs unquoting
		$str = $1;
		$str =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
	}

	return $str;
}
1618
# escape tabs (convert tabs to spaces): each tab is replaced by as many
# spaces as are needed to reach the next multiple of 8 columns
sub untabify {
	my ($line) = @_;

	# work left to right, so that the position of every tab already
	# reflects the expansion of the tabs before it
	for (my $pos = index($line, "\t"); $pos != -1; $pos = index($line, "\t")) {
		substr($line, $pos, 1, ' ' x (8 - ($pos % 8)));
	}

	return $line;
}
1632
# Count the entries returned by git_get_projects_list() whose 'path' is
# equal to $project; the result is 0 (false) when the project is not
# listed or when the list is empty.
sub project_in_list {
	my ($project) = @_;
	my @list = git_get_projects_list();

	return 0 unless @list;
	return scalar(grep { $_->{'path'} eq $project } @list);
}
1638
1639 ## ----------------------------------------------------------------------
1640 ## HTML aware string manipulation
1641
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# $add_len defaults to 10.  $where says which part of the string is
# replaced by the ellipsis: 'left', 'center' or 'right' (the default).
sub chop_str {
	my ($str, $len, $add_len, $where) = @_;
	$add_len ||= 10;
	$where   ||= 'right'; # 'left' | 'center' | 'right'

	# Make sure perl knows it is utf8 encoded so we don't
	# cut in the middle of a utf8 multibyte char.
	$str = to_utf8($str);

	# return early if chopping wouldn't make string shorter;
	# the filler is " ... " (length 5) in the middle, and
	# " ..." or "... " (length 4) at either end
	my $centered   = ($where eq 'center');
	my $filler_len = $centered ? 5 : 4;
	return $str if ($len + $filler_len >= length($str));

	# when chopping in the middle, distribute $len into left and right part
	$len = int($len/2) if $centered;

	# regexps: ending and beginning with word part up to $add_len
	my $endre = qr/.{$len}\w{0,$add_len}/;
	my $begre = qr/\w{0,$add_len}.{$len}/;

	if ($where eq 'left') {
		$str =~ m/^(.*?)($begre)$/;
		my ($lead, $body) = ($1, $2);
		# cut the lead only if it is longer than the dots we would add
		$lead = " ..." if (length($lead) > 4);
		return "$lead$body";

	} elsif ($centered) {
		$str =~ m/^($endre)(.*)$/;
		my ($left, $rest) = ($1, $2);
		$rest =~ m/^(.*?)($begre)$/;
		my ($mid, $right) = ($1, $2);
		$mid = " ... " if (length($mid) > 5);
		return "$left$mid$right";

	} else {
		$str =~ m/^($endre)(.*)$/;
		my ($body, $tail) = ($1, $2);
		$tail = "... " if (length($tail) > 4);
		return "$body$tail";
	}
}
1701
# Takes the same arguments as chop_str, and returns the chopped string
# HTML-escaped.  If the string did get chopped, the result is also wrapped
# in a <span> whose title attribute holds the full string.
sub chop_and_escape_str {
	my ($str) = @_;

	my $chopped = chop_str(@_);
	$str = to_utf8($str);

	# nothing was chopped, so there is nothing to show in a title
	return esc_html($chopped) if ($chopped eq $str);

	# control characters are shown as '?' in the title
	$str =~ s/[[:cntrl:]]/?/g;
	return $cgi->span({-title=>$str}, esc_html($chopped));
}
1717
1718 ## ----------------------------------------------------------------------
1719 ## functions returning short strings
1720
# CSS class for given age value (in seconds): "noage" when the age is
# undefined, "age0" below two hours, "age1" below two days, and "age2"
# for anything older
sub age_class {
	my ($age) = @_;

	return "noage" unless defined $age;
	return "age0"  if ($age < 60*60*2);
	return "age1"  if ($age < 60*60*24*2);
	return "age2";
}
1735
# Convert age in seconds to "nn units ago" string.  The largest unit for
# which the age is more than two units is used, so the number shown is
# never below 2; an age of two seconds or less gives "right now".
sub age_string {
	my $age = shift;
	my $age_str;

	if ($age > 60*60*24*365*2) {
		$age_str = int($age/60/60/24/365) . " years ago";
	} elsif ($age > 60*60*24*(365/12)*2) {
		$age_str = int($age/60/60/24/(365/12)) . " months ago";
	} elsif ($age > 60*60*24*7*2) {
		$age_str = int($age/60/60/24/7) . " weeks ago";
	} elsif ($age > 60*60*24*2) {
		$age_str = int($age/60/60/24) . " days ago";
	} elsif ($age > 60*60*2) {
		$age_str = int($age/60/60) . " hours ago";
	} elsif ($age > 60*2) {
		$age_str = int($age/60) . " min ago";
	} elsif ($age > 2) {
		$age_str = int($age) . " sec ago";
	} else {
		# plain assignment: appending to the still undefined string
		# used to leave a stray leading space in the result
		$age_str = "right now";
	}
	return $age_str;
}
1767
# file type bits that do not come from Fcntl
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference:
# true if the file type bits of $mode are those of a gitlink
sub S_ISGITLINK {
	my ($mode) = @_;
	my $type_bits = $mode & S_IFMT();

	return ($type_bits == S_IFGITLINK);
}
1779
# convert file mode in octal to symbolic file mode string,
# in the style of the first column of "ls -l" output
sub mode_str {
	my $mode = oct shift;

	return 'm---------' if S_ISGITLINK($mode);
	return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
	return 'lrwxrwxrwx' if S_ISLNK($mode);
	if (S_ISREG($mode)) {
		# git cares only about the executable bit
		return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
	}
	return '----------';
}
1801
# convert file mode in octal to file type string; an argument that is
# not made of octal digits only is returned as it is
sub file_type {
	my ($mode) = @_;

	return $mode if ($mode !~ m/^[0-7]+$/);
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT());
	return "symlink"   if S_ISLNK($mode);
	return "file"      if S_ISREG($mode);
	return "unknown";
}
1824
# convert file mode in octal to file type description string; like
# file_type(), but a regular file with the user executable bit set is
# described as "executable".  An argument that is not made of octal
# digits only is returned as it is.
sub file_type_long {
	my ($mode) = @_;

	return $mode if ($mode !~ m/^[0-7]+$/);
	$mode = oct $mode;

	return "submodule" if S_ISGITLINK($mode);
	return "directory" if S_ISDIR($mode & S_IFMT());
	return "symlink"   if S_ISLNK($mode);
	if (S_ISREG($mode)) {
		return ($mode & S_IXUSR) ? "executable" : "file";
	}
	return "unknown";
}
1851
1852
1853 ## ----------------------------------------------------------------------
1854 ## functions returning short HTML fragments, or transforming HTML fragments
1855 ## which don't belong to other sections
1856
# format line of commit message: escape it for HTML (spaces become
# '&nbsp;') and turn every word of 8 to 40 hex digits into a link to
# the "object" action for that hash
sub format_log_line_html {
	my ($line) = @_;

	my $hash_link = sub {
		my ($id) = @_;
		return $cgi->a({-href => href(action=>"object", hash=>$id),
		                -class => "text"}, $id);
	};

	$line = esc_html($line, -nbsp=>1);
	$line =~ s{\b([0-9a-fA-F]{8,40})\b}{$hash_link->($1)}eg;

	return $line;
}
1869
# format marker of refs pointing to given object
#
# $refs maps object ids to lists of ref names (without the "refs/"
# prefix, e.g. tags/v2.6.11 or heads/next); a trailing "^{}" marks a ref
# as indirect, and is stripped from the list entry itself.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
	my ($refs, $id) = @_;

	return "" unless defined $refs->{$id};

	my $markers = '';
	foreach my $ref (@{$refs->{$id}}) {
		# this code exploits the fact that non-lightweight tags are the
		# only indirect objects, and that they are the only objects for which
		# we want to use tag instead of shortlog as action
		my $indirect = ($ref =~ s/\^\{\}$//);

		# split e.g. tags/v2.6.11 into type "tag" and name "v2.6.11"
		my ($type, $name) = ($ref =~ m!^(.*?)s?/(.*)$!)
			? ($1, $2)
			: ("ref", $ref);

		my $class = $indirect ? "$type indirect" : $type;

		my $dest_action =
			$indirect
				? ($action eq "tag" ? "shortlog" : "tag") :
			$action =~ /^(history|(short)?log)$/
				? $action :
				  "shortlog";

		my $dest = ($ref =~ m!^refs/!) ? $ref : "refs/" . $ref;

		my $link = $cgi->a({
			-href => href(
				action=>$dest_action,
				hash=>$dest
			)}, $name);

		$markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
			$link . "</span>";
	}

	return $markers
		? ' <span class="refs">'. $markers . '</span>'
		: "";
}
1929
# format, perhaps shortened and with markers, title line: a link to
# $href showing the subject, followed by $extra.  If $short is shorter
# than $long, then $short is shown and $long goes into the title
# attribute of the link, with control characters replaced by '?'.
sub format_subject_html {
	my ($long, $short, $href, $extra) = @_;
	$extra = '' unless defined($extra);

	my %attr = (-href => $href, -class => "list subject");
	my $shown = $long;

	if (length($short) < length($long)) {
		$long =~ s/[[:cntrl:]]/?/g;
		$attr{-title} = to_utf8($long);
		$shown = $short;
	}

	return $cgi->a(\%attr, esc_html($shown)) . $extra;
}
1945
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines, which are free to use it as
# preferred. Since only one avatar engine is used for any given page,
# there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased first, and the whole url is kept in the cache.
sub picon_url {
	my $email = lc shift;

	$avatar_cache{$email} ||= do {
		my ($user, $domain) = split('@', $email);
		"http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
		"$domain/$user/" .
		"users+domains+unknown/up/single";
	};

	return $avatar_cache{$email};
}
1967
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
# The email is lowercased before it is hashed.
sub gravatar_url {
	my ($email, $size) = @_;
	$email = lc $email;

	unless ($avatar_cache{$email}) {
		$avatar_cache{$email} =
			"http://www.gravatar.com/avatar/" .
			Digest::MD5::md5_hex($email) . "?s=";
	}

	return $avatar_cache{$email} . $size;
}
1980
# Return an <img> element with the avatar for the given $email if the
# feature is enabled, and an empty string otherwise.
# Options: -size selects an entry of %avatar_size (falling back to
# 'default'); -pad_before and -pad_after add '&nbsp;' around the image.
sub git_get_avatar {
	my ($email, %opts) = @_;

	my $pre_white  = ($opts{-pad_before} ? "&nbsp;" : "");
	my $post_white = ($opts{-pad_after}  ? "&nbsp;" : "");
	$opts{-size} ||= 'default';
	my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

	# Other providers can be added by extending this chain, defining $url
	# as needed. If no variant puts something in $url, we assume avatars
	# are completely disabled/unavailable.
	my $url =
		($git_avatar eq 'gravatar') ? gravatar_url($email, $size) :
		($git_avatar eq 'picon')    ? picon_url($email) :
		                              "";
	return "" unless $url;

	return $pre_white .
	       qq(<img width="$size" class="avatar" src=") .
	       esc_url($url) .
	       qq(" alt="" />) .
	       $post_white;
}
2009
# Wrap $displaytext in a link that searches for commits by $author;
# $searchtype is the kind of search to run, 'author' or 'committer'.
# If the 'search' feature is off, $displaytext is returned as it is.
sub format_search_author {
	my ($author, $searchtype, $displaytext) = @_;
	my $have_search = gitweb_check_feature('search');

	return $displaytext unless $have_search;

	# verb for the title of the link
	my $performed =
		$searchtype eq 'author'    ? "authored"  :
		$searchtype eq 'committer' ? "committed" :
		                             "";

	return $cgi->a({-href => href(action=>"search", hash=>$hash,
			searchtext=>$author,
			searchtype=>$searchtype), class=>"list",
			title=>"Search for commits $performed by $author"},
			$displaytext);
}
2032
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str); the avatar of the author goes in
# front of the name, and both are passed to format_search_author()
sub format_author_html {
	my ($tag, $co, @chop_args) = @_;

	my $author = chop_and_escape_str($co->{'author_name'}, @chop_args);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_after => 1);
	my $linked = format_search_author($co->{'author_name'}, "author",
	                                  $avatar . $author);

	return "<$tag class=\"author\">" . $linked . "</$tag>";
}
2046
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
# The filenames of the line are replaced by escaped ones taken from $from
# and $to, each linked to the 'href' of its side when there is one.
sub format_git_diff_header_line {
	my ($line, $diffinfo, $from, $to) = @_;

	# escaped filename of one side with given prefix, as a link if the
	# side has a href (there is none for an added or deleted file)
	my $path_html = sub {
		my ($side, $prefix) = @_;
		my $text = $prefix . esc_path($side->{'file'});
		return $side->{'href'}
			? $cgi->a({-href => $side->{'href'}, -class => "path"}, $text)
			: $text;
	};

	if ($diffinfo->{'nparents'}) {
		# combined diff
		$line =~ s!^(diff (.*?) )"?.*$!$1!;
		$line .= $path_html->($to, '');
	} else {
		# "ordinary" diff
		$line =~ s!^(diff (.*?) )"?a/.*$!$1!;
		$line .= $path_html->($from, 'a/');
		$line .= ' ';
		$line .= $path_html->($to, 'b/');
	}

	return "<div class=\"diff header\">$line</div>\n";
}
2082
# format extended diff header line, before patch itself
# Filenames in "copy/rename from/to" lines and object names in "index"
# lines are replaced by links taken from $from and $to, and a line that
# ends with a single file mode gets the description of that mode
# appended.  Returns the line followed by "<br/>\n".
sub format_extended_diff_header_line {
	my $line = shift;
	my $diffinfo = shift;
	my ($from, $to) = @_;

	# abbreviated object name as link, or zeros if there is nothing
	# to link to
	my $hash_link = sub {
		my ($href, $id) = @_;
		return $href
			? $cgi->a({-href=>$href, -class=>"hash"}, substr($id,0,7))
			: '0' x 7;
	};

	# match <path>
	if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
		$line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
		                 esc_path($from->{'file'}));
	}
	if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
		$line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
		                 esc_path($to->{'file'}));
	}
	# match single <mode>
	if ($line =~ m/\s(\d{6})$/) {
		$line .= '<span class="info"> (' .
		         file_type_long($1) .
		         ')</span>';
	}
	# match <hash>
	if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
		# can match only for combined diff
		my @from_links =
			map { $hash_link->($from->{'href'}[$_], $diffinfo->{'from_id'}[$_]) }
			0 .. $diffinfo->{'nparents'} - 1;
		$line = 'index ' . join(',', @from_links) . '..' .
		        $hash_link->($to->{'href'}, $diffinfo->{'to_id'});

	} elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
		# can match only for ordinary diff; the dots of the separator
		# have to be escaped, or they would match any two characters
		my $from_link = $hash_link->($from->{'href'}, $diffinfo->{'from_id'});
		my $to_link   = $hash_link->($to->{'href'},   $diffinfo->{'to_id'});
		my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
		$line =~ s!$from_id\.\.$to_id!$from_link..$to_link!;
	}

	return $line . "<br/>\n";
}
2148
# format from-file/to-file diff header
# Returns one <div class="diff from_file"> per from-file line (a single
# one for an ordinary diff, one per parent for a combined diff), followed
# by one <div class="diff to_file">.
sub format_diff_from_to_header {
	my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
	my $result = '';

	#assert($from_line =~ m/^---/) if DEBUG;
	if (! $diffinfo->{'nparents'}) {
		# ordinary (single parent) diff
		my $line = $from_line;
		# no extra formatting for "^--- /dev/null"
		if ($line =~ m!^--- "?a/!) {
			my $file = esc_path($from->{'file'});
			$line = '--- a/' .
				($from->{'href'}
				 ? $cgi->a({-href=>$from->{'href'}, -class=>"path"}, $file)
				 : $file);
		}
		$result .= qq!<div class="diff from_file">$line</div>\n!;

	} else {
		# combined diff (merge commit)
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			my $line = '--- /dev/null';
			if ($from->{'href'}[$i]) {
				# number of the parent, linked to the diff against
				# that parent
				my $diff_link =
					$cgi->a({-href=>href(action=>"blobdiff",
					                     hash_parent=>$diffinfo->{'from_id'}[$i],
					                     hash_parent_base=>$parents[$i],
					                     file_parent=>$from->{'file'}[$i],
					                     hash=>$diffinfo->{'to_id'},
					                     hash_base=>$hash,
					                     file_name=>$to->{'file'}),
					         -class=>"path",
					         -title=>"diff" . ($i+1)},
					        $i+1);
				my $file_link =
					$cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
					        esc_path($from->{'file'}[$i]));
				$line = '--- ' . $diff_link . '/' . $file_link;
			}
			$result .= qq!<div class="diff from_file">$line</div>\n!;
		}
	}

	#assert($to_line =~ m/^\+\+\+/) if DEBUG;
	my $line = $to_line;
	# no extra formatting for "^+++ /dev/null"
	if ($line =~ m!^\+\+\+ "?b/!) {
		my $file = esc_path($to->{'file'});
		$line = '+++ b/' .
			($to->{'href'}
			 ? $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $file)
			 : $file);
	}
	$result .= qq!<div class="diff to_file">$line</div>\n!;

	return $result;
}
2214
# create note for patch simplified by combined diff: a "diff --cc"
# header line for the to-file, followed by a "Simple merge" notice.
# The filename is a link to the blob unless the file was deleted.
sub format_diff_cc_simplified {
	my ($diffinfo, @parents) = @_;

	my $path = esc_path($diffinfo->{'to_file'});
	if (!is_deleted($diffinfo)) {
		$path = $cgi->a({-href => href(action=>"blob",
		                               hash_base=>$hash,
		                               hash=>$diffinfo->{'to_id'},
		                               file_name=>$diffinfo->{'to_file'}),
		                 -class => "path"},
		                $path);
	}

	return "<div class=\"diff header\">" .
	       "diff --cc " . $path .
	       "</div>\n" . # class="diff header"
	       "<div class=\"diff nodifferences\">" .
	       "Simple merge" .
	       "</div>\n"; # class="diff nodifferences"
}
2239
# Return the CSS class for a line of diff output: "chunk_header",
# "incomplete", "ctx", "add" or "rem", or an empty string if the line is
# none of these.  For a combined diff, recognized by $from->{'href'}
# being an array reference, the number of leading sign columns is the
# number of elements of that array; otherwise there is one sign column.
sub diff_line_class {
	my ($line, $from, $to) = @_;

	my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
		? scalar @{$from->{'href'}}
		: 1;

	return "chunk_header" if ($line =~ m/^\@\@{$num_sign} /);
	return "incomplete"   if ($line =~ m/^\\/);
	# the test for context must come before the tests for add/rem,
	# because their patterns accept lines made of spaces only as well
	return "ctx"          if ($line =~ m/^ {$num_sign}/);
	return "add"          if ($line =~ m/^[+ ]{$num_sign}/);
	return "rem"          if ($line =~ m/^[- ]{$num_sign}/);

	# fallback
	return "";
}
2268
# Turn a unified-diff chunk header ("@@ -a,b +c,d @@ section") into HTML.
# Assumes $from and $to are defined and correctly filled, and that $line
# really is a unified-diff chunk header.  Each range becomes a link to
# "<href>#l<start>" when the corresponding side has an 'href'; the
# trailing section text is escaped with esc_html().
sub format_unidiff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($from_text, $from_start, $from_lines,
            $to_text,   $to_start,   $to_lines,
            $section) =
                ($line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/);

        # an omitted line count is normalised to 0
        $from_lines = 0 if !defined $from_lines;
        $to_lines   = 0 if !defined $to_lines;

        if ($from->{'href'}) {
                my $from_url = $from->{'href'} . "#l" . $from_start;
                $from_text = $cgi->a({-href=>$from_url, -class=>"list"}, $from_text);
        }
        if ($to->{'href'}) {
                my $to_url = $to->{'href'} . "#l" . $to_start;
                $to_text = $cgi->a({-href=>$to_url, -class=>"list"}, $to_text);
        }

        my $chunk_info = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>";
        my $section_html = "<span class=\"section\">" .
                           esc_html($section, -nbsp=>1) . "</span>";
        return $chunk_info . $section_html;
}
2292
# Turn a combined-diff chunk header ("@@@ -a,b -c,d +e,f @@@ section")
# into HTML.  Assumes $from and $to are defined and correctly filled, and
# that $line really is a combined-diff chunk header.  The last range is
# the "to" side; every earlier range belongs to one parent and is linked
# through the matching entry of $from->{'href'} when that entry is set.
sub format_cc_diff_chunk_header {
        my ($line, $from, $to) = @_;

        my ($prefix, $ranges, $section) = ($line =~ m/^(\@+) (.*?) \@+(.*)$/);

        # split "-a,b -c,d +e,f" into range texts and their start lines
        # (the leading sign is dropped before looking for the start)
        my (@range_text, @range_start);
        foreach my $range (split(' ', $ranges)) {
                my ($start) = split(',', substr($range, 1));
                push @range_text,  $range;
                push @range_start, $start;
        }

        # the final range describes the result, not a parent
        my $to_text  = pop @range_text;
        my $to_start = pop @range_start;

        my @pieces = ($prefix);
        foreach my $i (0 .. $#range_text) {
                my $piece = $range_text[$i];
                if ($from->{'href'}[$i]) {
                        $piece = $cgi->a({-href=>"$from->{'href'}[$i]#l$range_start[$i]",
                                          -class=>"list"}, $range_text[$i]);
                }
                push @pieces, $piece;
        }

        my $to_piece = $to_text;
        if ($to->{'href'}) {
                $to_piece = $cgi->a({-href=>"$to->{'href'}#l$to_start",
                                     -class=>"list"}, $to_text);
        }

        return "<span class=\"chunk_info\">" .
               join(' ', @pieces, $to_piece, $prefix) .
               "</span>" .
               "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
}
2331
# Process one patch (diff) line; not meant for diff headers.
# Returns a two-element list: the CSS class from diff_line_class() and
# the HTML-formatted (but not wrapped) line.  Chunk headers get their
# dedicated formatter when both $from and $to are given; every other
# line is chomped, untabified and escaped with esc_html().
sub process_diff_line {
        my ($line, $from, $to) = @_;

        # the class is decided on the raw line, before any reformatting
        my $diff_class = diff_line_class($line, $from, $to);

        chomp $line;
        $line = untabify($line);

        if ($from && $to) {
                if ($line =~ m/^\@{2} /) {
                        # unified diff chunk header
                        $line = format_unidiff_chunk_header($line, $from, $to);
                        return ($diff_class, $line);
                }
                if ($line =~ m/^\@{3}/) {
                        # combined diff chunk header
                        $line = format_cc_diff_chunk_header($line, $from, $to);
                        return ($diff_class, $line);
                }
        }

        return $diff_class, esc_html($line, -nbsp=>1);
}
2354
# Generate the snapshot link(s) for the tree/commit given by $hash.
# Depending on how many entries @snapshot_fmts holds, returns
#   - undef when there are none,
#   - a single "_snapshot_" link whose tooltip names the format, or
#   - "snapshot (_fmt1_ _fmt2_ ...)" with one link per format.
sub format_snapshot_links {
        my ($hash) = @_;

        my $num_fmts = scalar @snapshot_fmts;

        # no snapshot format available
        return undef if ($num_fmts == 0);

        if ($num_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                my $fmt = $snapshot_fmts[0];
                return
                        $cgi->a({
                                -href => href(
                                        action=>"snapshot",
                                        hash=>$hash,
                                        snapshot_format=>$fmt
                                ),
                                -title => "in format: $known_snapshot_formats{$fmt}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names,
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links = map {
                $cgi->a({
                        -href => href(
                                action=>"snapshot",
                                hash=>$hash,
                                snapshot_format=>$_
                        )
                }, $known_snapshot_formats{$_}{'display'})
        } @snapshot_fmts;

        return "snapshot (" . join(' ', @links) . ")";
}
2389
2390 ## ......................................................................
2391 ## functions returning values to be passed, perhaps after some
2392 ## transformation, to other functions; e.g. returning arguments to href()
2393
# Return a hash suitable for passing to href() to build a feed URL for
# the current view; the '-title' key carries a description of the link.
# $format (default 'Atom') is lowercased to become the 'action'.
# Returns nothing when no project is selected, when there is no action,
# or for the tags/heads/forks/tag/search views.
sub get_feed_info {
        my $format = shift || 'Atom';
        my %res = (action => lc($format));

        # feed links are possible only for project views
        return unless (defined $project);
        # some views link to OPML or to the generic project feed instead,
        # or have no specific feed yet
        return unless ($action);
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # Branch refs use the full 'refs/heads/' name to tell them apart
        # from tag links; $hash_base is checked before $hash.
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                next unless defined $ref;
                if ($ref =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $type;
        if (defined $file_name) {
                $type = "history of $file_name"
                      . ($action eq 'tree' ? "/" : "")
                      . (defined $branch ? " on '$branch'" : "");
        } else {
                $type = defined $branch ? "log of $branch" : 'log';
        }

        $res{-title} = $type;
        $res{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
        $res{'file_name'} = $file_name;

        return %res;
}
2429
2430 ## ----------------------------------------------------------------------
2431 ## git utility subroutines, invoking git commands
2432
# Return, as a list, the path to the core git executable ($GIT) and the
# --git-dir parameter for the current $git_dir.  Every call also bumps
# the $number_of_git_cmds counter.
sub git_cmd {
        $number_of_git_cmds += 1;
        return ($GIT, "--git-dir=$git_dir");
}
2438
# Quote the given arguments for passing them to the shell and return
# them joined by single spaces:
#   quote_command("command", "arg 1", "arg with ' and ! characters")
#   => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Try to avoid using this function wherever possible.
sub quote_command {
        my @quoted;
        foreach my $arg (@_) {
                # close the quote, emit the escaped character, reopen the quote
                (my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }
        return join(' ', @quoted);
}
2447
# Get the full hash that HEAD of the given project resolves to
# (see git_get_hash for the return value).
sub git_get_head_hash {
        my $project = shift;
        return git_get_full_hash($project, 'HEAD');
}
2452
# Resolve ($project, $hash) to an object name; all arguments are handed
# to git_get_hash unchanged, with no extra rev-parse options.
sub git_get_full_hash {
        my @args = @_;
        return git_get_hash(@args);
}
2456
# Like git_get_full_hash, but appends '--short=7' to the arguments
# passed on to git_get_hash.
sub git_get_short_hash {
        my @args = @_;
        return git_get_hash(@args, '--short=7');
}
2460
# Run "git rev-parse --verify -q @options $hash" in the repository
# "$projectroot/$project" and return the first output line (chomped),
# or undef when the command cannot be started or prints nothing.
# The global $git_dir is pointed at the project for the duration of the
# call; its previous value is put back only if it was defined.
sub git_get_hash {
        my ($project, $hash, @options) = @_;

        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        my $retval = undef;
        my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @cmd) {
                $retval = <$fd>;
                chomp $retval if defined $retval;
                close $fd;
        }

        $git_dir = $saved_git_dir if (defined $saved_git_dir);

        return $retval;
}
2477
# Get the type of the given object, as printed by "git cat-file -t".
# Returns nothing when the command cannot be started or when closing
# the pipe reports failure.
sub git_get_type {
        my ($hash) = @_;

        open(my $fd, "-|", git_cmd(), "cat-file", '-t', $hash)
                or return;
        my $type = <$fd>;
        return unless (close $fd);

        chomp $type;
        return $type;
}
2488
2489 # repository configuration
2490 our $config_file = '';
2491 our %config;
2492
# Store $value under $key in the hash referenced by $hash, keeping
# earlier values: the first value is stored directly (not as [ <value> ]),
# a second value turns the entry into an anonymous array of both, and
# further values are appended to that array.
sub hash_set_multi {
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                if (ref $hash->{$key}) {
                        # already multi-valued
                        push @{$hash->{$key}}, $value;
                } else {
                        # second value: promote the scalar to an array
                        $hash->{$key} = [ $hash->{$key}, $value ];
                }
        } else {
                $hash->{$key} = $value;
        }
}
2506
# Return a hash of the git project configuration, read from
# "git config -z -l" for the current $git_dir.
# $section_regexp, when defined, limits the result to keys of matching
# sections (e.g. 'gitweb'); it is used as a regexp fragment anchored at
# the start of the key and followed by a dot.
# Keys that occur more than once are collected by hash_set_multi().
# Returns nothing when the git command cannot be started.
sub git_parse_project_config {
        my $section_regexp = shift;
        my %config;

        # Compile the section filter once per call.  (A /o match would
        # freeze the first $section_regexp ever seen, so a later call
        # with a different section would silently use the old filter.)
        my $section_filter;
        if (defined $section_regexp) {
                $section_filter = qr/^(?:$section_regexp)\./;
        }

        # records of "git config -z" output are NUL-terminated
        local $/ = "\0";

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline;
                # a key without a value leaves $value undefined
                my ($key, $value) = split(/\n/, $keyval, 2);

                next if (defined $section_filter && $key !~ $section_filter);
                hash_set_multi(\%config, $key, $value);
        }
        close $fh;

        return %config;
}
2529
# Convert a config value to a boolean.
# No value at all (undef), a number > 0, 'true' and 'yes' (any case) are
# true; everything else is treated as false, never as an error.
# Surrounding whitespace is ignored.
sub config_to_bool {
        my ($val) = @_;

        # "section.key" with no value
        return 1 unless defined $val;

        # strip leading and trailing whitespace
        for ($val) {
                s/^\s+//;
                s/\s+$//;
        }

        # section.key = 1
        return $val if ($val =~ /^\d+$/ && $val);
        # section.key = true
        return $val =~ /^(?:true|yes)$/i;
}
2545
# Convert a config value to a simple decimal number.
# An optional suffix of 'k', 'm' or 'g' (any case) multiplies the value
# by 1024, 1048576 or 1073741824.  A value without such a suffix is
# returned as is, with surrounding whitespace stripped.
sub config_to_int {
        my ($val) = @_;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier_for = (
                'k' =>       1024,
                'm' =>    1048576,
                'g' => 1073741824,
        );

        if ($val =~ /^([0-9]*)([kmg])$/i) {
                my ($num, $unit) = ($1, lc($2));
                # unknown unit is treated as 1
                my $factor = exists $multiplier_for{$unit}
                        ? $multiplier_for{$unit}
                        : 1;
                return $num * $factor;
        }
        return $val;
}
2565
# Convert a config value to an array reference, if needed: a reference
# is returned unchanged, a defined scalar is wrapped in a one-element
# array, and undef becomes an empty array.
sub config_to_multi {
        my ($val) = @_;

        return $val if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2572
# Look up the gitweb.<key> variable in the configuration of the current
# repository ($git_dir).
# $key may be given with or without the "gitweb." prefix.  $type is
# optional and may be 'bool' or 'int' (a leading "--" is ignored): 'bool'
# yields the string 'true' or 'false', 'int' goes through config_to_int().
# Any other type, or none, returns the stored value unchanged.
# Returns nothing when $git_dir is undefined, the key is empty or
# malformed, or the variable is not set.
# The parsed "gitweb" section is kept in %config and re-read only when
# $git_dir/config differs from the remembered $config_file.
sub git_get_project_config {
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        # only subsection, if exists, is case sensitive,
        # and not lowercased by 'git config -z -l'
        if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
                $key = join(".", lc($1), $2, lc($3));
        } else {
                $key = lc($key);
        }
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check: anything but 'bool' and 'int' means "no type"
        if (defined $type) {
                $type =~ s/^--//;
                if ($type ne 'bool' && $type ne 'int') {
                        $type = undef;
                }
        }

        # (re)load the config if it was parsed for another repository
        my $wanted_config_file = "$git_dir/config";
        unless (defined $config_file &&
                $config_file eq $wanted_config_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_config_file;
        }

        # check if config variable (key) exists
        my $full_key = "gitweb.$key";
        return unless exists $config{$full_key};

        # ensure given type
        if (defined $type) {
                if ($type eq 'bool') {
                        # backward compatibility: 'git config --bool' returns true/false
                        return config_to_bool($config{$full_key}) ? 'true' : 'false';
                }
                if ($type eq 'int') {
                        return config_to_int($config{$full_key});
                }
        }
        return $config{$full_key};
}
2618
# Get the hash of the entry at $path in tree-ish $base, using
# "git ls-tree $base -- $path".
# $type, when given, must equal the entry's type field, otherwise undef
# is returned.  Also returns undef when $path is empty, when ls-tree
# prints nothing or fails, or when its output line is not in the
# expected format.  Failure to start git ends up in die_error(500, ...).
sub git_get_hash_by_path {
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        # drop trailing slashes
        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Take the captures from the match itself: reading $2/$3 after an
        # unchecked match would return stale values from some earlier
        # successful match whenever this line does not parse.
        my ($entry_type, $entry_hash) =
                ($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/)
                or return undef;

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2645
# Get the path of the entry with the given hash at the given tree-ish
# (ref), by scanning "git ls-tree -r -t -z $base".
# Used to get the 'from' filename for combined diff (merge commit) for
# renames.  Returns nothing when $base or $hash is empty, and undef when
# git cannot be started or no entry has that hash.
sub git_get_path_by_hash {
        my $base = shift || return;
        my $hash = shift || return;

        # records of "ls-tree -z" output are NUL-terminated
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # The pattern is anchored to the "<mode> <type> <hash>\t<path>"
                # layout and $hash is quoted, so only the object field can
                # match; /s lets the path contain newlines, which -z output
                # leaves unquoted.
                if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
                        my $path = $1;
                        close $fd;
                        return $path;
                }
        }
        close $fd;
        return undef;
}
2669
2670 ## ......................................................................
2671 ## git utility functions, directly accessing git repository
2672
# Get the value of a config variable for the project at $path, either
# from the first line of the file named $name in the repository
# ($GIT_DIR/$name), or, when that file cannot be opened, from the
# gitweb.$name variable of the repository config.
# Sets the global $git_dir to "$projectroot/$path".
sub git_get_file_or_project_config {
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        if (!open($fd, '<', "$git_dir/$name")) {
                # no such file: fall back to the repository config
                return git_get_project_config($name);
        }

        my $conf = <$fd>;
        close $fd;
        chomp $conf if (defined $conf);

        return $conf;
}
2689
# Description of the project at $path: taken from its 'description' file
# or gitweb.description config (see git_get_file_or_project_config).
sub git_get_project_description {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'description');
}
2694
# Category of the project at $path: taken from its 'category' file
# or gitweb.category config (see git_get_file_or_project_config).
sub git_get_project_category {
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'category');
}
2699
2700
# Return a hash reference mapping content tags ('ctags') of $project to
# their weights.  Sets the global $git_dir to "$projectroot/$project".
# Supported formats, tried in this order:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its first line is a number, use it as tag weight,
#   - otherwise (including an empty file) add the tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        my $val = <$ct>;
                        close $ct;
                        # an empty tag file yields no line at all
                        chomp $val if defined $val;

                        # the tag name is the file's basename
                        (my $ctag = $tagfile) =~ s#.*/##;
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2747
# Return a hash reference whose keys are content tags ('ctags') and
# whose values are the sum of the weights of that tag over every project
# in the list referenced by $projects (each project's 'ctags' field).
sub git_gather_all_ctags {
        my ($projects) = @_;
        my %total_weight;

        for my $pr (@$projects) {
                for my $tag (keys %{$pr->{'ctags'}}) {
                        $total_weight{$tag} += $pr->{'ctags'}{$tag};
                }
        }

        return \%total_weight;
}
2762
# Build the tag cloud data for the tags in the hash referenced by $ctags
# (tag name => weight).
# Tags differing only in case are merged under their lowercased name;
# the spelling with the highest individual weight is the one displayed.
# Returns an HTML::TagCloud object when that module can be loaded,
# otherwise a hash reference { <lc tag> => { count => ..., ctag => <link> } }.
# The tag equal to $input_params{'ctag'} is wrapped in a "match" span.
sub git_populate_project_tagcloud {
        my ($ctags) = @_;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $name (keys %$ctags) {
                my $weight = $ctags->{$name};
                my $merged = ($ctags_lc{lc $name} ||= {});
                $merged->{count} += $weight;
                if (!$merged->{topcount} || $merged->{topcount} < $weight) {
                        $merged->{topcount} = $weight;
                        $merged->{topname}  = $name;
                }
        }

        my $matched = $input_params{'ctag'};
        # wrap the title of the currently selected tag, leave others alone
        my $mark_match = sub {
                my ($ctag, $title) = @_;
                return $title unless (defined $matched && $matched eq $ctag);
                return qq(<span class="match">$title</span>);
        };

        my $cloud;
        my $have_tagcloud = eval { require HTML::TagCloud; 1; };
        if ($have_tagcloud) {
                $cloud = HTML::TagCloud->new;
                for my $ctag (sort keys %ctags_lc) {
                        # Pad the title with spaces so that the cloud looks
                        # less crammed.
                        my $title = esc_html($ctags_lc{$ctag}->{topname});
                        $title =~ s/ /&nbsp;/g;
                        $title =~ s/^/&nbsp;/g;
                        $title =~ s/$/&nbsp;/g;
                        $title = $mark_match->($ctag, $title);
                        $cloud->add($title, href(project=>undef, ctag=>$ctag),
                                    $ctags_lc{$ctag}->{count});
                }
        } else {
                $cloud = {};
                for my $ctag (keys %ctags_lc) {
                        my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
                        $title = $mark_match->($ctag, $title);
                        $cloud->{$ctag}{count} = $ctags_lc{$ctag}->{count};
                        $cloud->{$ctag}{ctag} =
                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                }
        }
        return $cloud;
}
2808
# Render the tag cloud $cloud as HTML, showing at most $count tags.
# $cloud is either an HTML::TagCloud object (rendered by its
# html_and_css method) or the plain hash reference built by
# git_populate_project_tagcloud, { <tag> => { count => ..., ctag => <link> } }.
# In the plain case the links are joined with ', ' inside a
# <div id="htmltagcloud">, centered when no $project is selected.
sub git_show_project_tagcloud {
        my ($cloud, $count) = @_;
        if (ref($cloud) eq 'HTML::TagCloud') {
                return $cloud->html_and_css($count);
        } else {
                # Most used tags first, so that the $count limit keeps the
                # popular tags rather than the rarest ones; ties are broken
                # by tag name to keep the output stable.
                my @tags = sort {
                        $cloud->{$b}->{'count'} <=> $cloud->{$a}->{'count'}
                                or $a cmp $b
                } keys %$cloud;
                return
                        '<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
                        join (', ', map {
                                $cloud->{$_}->{'ctag'}
                        } splice(@tags, 0, $count)) .
                        '</div>';
        }
}
2823
# Get the list of clone URLs of the project at $path: one per line of
# its 'cloneurl' file or, when that file cannot be opened, the values of
# the multi-valued gitweb.url config variable.
# Returns a list in list context and an array reference otherwise.
# Sets the global $git_dir to "$projectroot/$path".
sub git_get_project_url_list {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/cloneurl") {
                # no cloneurl file: use the repository config instead
                my $config_urls = config_to_multi(git_get_project_config('url'));
                return wantarray ? @{$config_urls} : $config_urls;
        }

        my @git_project_url_list = <$fd>;
        chomp @git_project_url_list;
        close $fd;

        return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2837
# Return the list of projects as hash references ({ path => ... }, plus
# 'owner' when read from a file) that pass check_export_ok().
# $projects_list is either a directory to scan for repositories or a file
# with one url-encoded "<path> <owner>" entry per line.
# $filter, when given, restricts the result to projects whose path starts
# with "$filter/".  With $paranoid set, a directory scan still starts at
# the top and filters every candidate path instead of descending directly
# into the $filter subdirectory.
sub git_get_projects_list {
        my $filter = shift || '';
        my $paranoid = shift;
        my @list;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                my $pfxlen = length("$dir");
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter && !$paranoid) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # paranoidly only filter here
                                if ($paranoid && $filter && $path !~ m!^\Q$filter\E/!) {
                                        # leave the callback with return: there is
                                        # no loop in this sub for 'next' to act on
                                        return;
                                }
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        # a repository was found, don't look inside it
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        # blank line: nothing to add
                        if (!defined $path) {
                                next PROJECT;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next PROJECT;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
2919
# Remove forks from the list of projects referenced by $projects and
# return the remaining projects as a list.
# A project is a fork when a leading part of its path, taken as whole
# directory components, is the path of another project with its ".git"
# suffix removed (forks of 'repo.git' are in the 'repo/' directory).
# As a side effect, every project that may have forks gets a 'forks'
# field listing the forks found for it.
# Written with help of Tree::Trie module (Perl Artistic License, GPL compatible).
sub filter_forks_from_projects_list {
        my $projects = shift;

        # prefix tree of directories (path components); the '' key of a
        # node is the end marker and holds the project living there
        my %trie;

        # generate trie out of those directories that might contain forks
        foreach my $pr (@$projects) {
                my $path = $pr->{'path'};
                $path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
                next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
                next unless ($path);      # skip '.git' repository: tests, git-instaweb
                next unless (-d "$projectroot/$path"); # containing directory exists
                $pr->{'forks'} = [];      # there can be 0 or more forks of project

                # descend along the path components, creating the nodes
                # that are not in the trie yet
                my $node = \%trie;
                foreach my $dir (split('/', $path)) {
                        $node->{$dir} = {} unless (exists $node->{$dir});
                        $node = $node->{$dir};
                }
                # create end marker, store $pr as a data
                $node->{''} = $pr unless (exists $node->{''});
        }

        # filter out forks, by finding shortest prefix match for paths
        my @filtered;
        foreach my $pr (@$projects) {
                my $node = \%trie;
                my $forked_from; # project owning the shortest matching prefix

                foreach my $dir (split('/', $pr->{'path'})) {
                        if (exists $node->{''}) {
                                # found [shortest] prefix, is a fork
                                $forked_from = $node->{''};
                                last;
                        }
                        # not in trie, cannot have prefix, not a fork
                        last unless (exists $node->{$dir});
                        # the dir is there, walk one step down the trie
                        $node = $node->{$dir};
                }

                if ($forked_from) {
                        push @{$forked_from->{'forks'}}, $pr;
                } else {
                        # either no match, or we ran out of path components
                        push @filtered, $pr;
                }
        }

        return @filtered;
}
2979
# Return the projects from the list referenced by $projlist that match
# the given options:
#   tagfilter  => keep projects having this content tag (case-insensitive)
#   searchtext => keep projects whose 'path' or 'descr_long' matches it
#                 (the text is used as a regular expression)
# With neither option set the whole list is returned untouched.
# fill_project_list_info is run here to fill in the fields that the
# requested filters look at.
sub search_projects_list {
        my ($projlist, %opts) = @_;
        my $tagfilter  = $opts{'tagfilter'};
        my $searchtext = $opts{'searchtext'};

        if (!$tagfilter && !$searchtext) {
                return @$projlist;
        }

        # ask only for the info the active filters need
        my @wanted_info;
        push @wanted_info, 'ctags'         if ($tagfilter);
        push @wanted_info, 'path', 'descr' if ($searchtext);
        fill_project_list_info($projlist, @wanted_info);

        my @projects;
 PROJECT:
        foreach my $pr (@$projlist) {

                if ($tagfilter) {
                        next PROJECT
                                if (ref($pr->{'ctags'}) ne 'HASH');
                        my @same_tag =
                                grep { lc($_) eq lc($tagfilter) } keys %{$pr->{'ctags'}};
                        next PROJECT
                                unless (@same_tag);
                }

                if ($searchtext) {
                        next PROJECT
                                unless ($pr->{'path'} =~ /$searchtext/ ||
                                        $pr->{'descr_long'} =~ /$searchtext/);
                }

                push @projects, $pr;
        }

        return @projects;
}
3015
# Cache of project owners read from the $projects_list file, keyed by
# (unescaped) project path; undef until the file has been looked at.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list file.
#
# Does nothing if the cache has already been initialised.  The cache is set
# to an empty hash before reading, so a missing or unreadable file is not
# retried.  Blank lines are skipped; a line naming a project without an
# owner stores undef for that project.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	return unless -f $projects_list;

	# do not read from an unopened handle if the file is unreadable
	open(my $fd, '<', $projects_list)
		or return;
	while (my $line = <$fd>) {
		chomp $line;
		my ($pr, $ow) = split ' ', $line;
		# blank line: nothing to record
		next unless defined $pr;
		$pr = unescape($pr);
		$gitweb_project_owner->{$pr} =
			defined $ow ? to_utf8(unescape($ow)) : undef;
	}
	close $fd;
	return;
}
3038
# Return the owner of $project, or undef if $project is false.
#
# Sources are tried in order: the cached projects list file, the project's
# 'owner' configuration value, and finally the owner of the repository
# directory.  Side effect: sets the global $git_dir to the project's path.
sub git_get_project_owner {
	my ($project) = @_;

	return undef unless $project;
	$git_dir = "$projectroot/$project";

	# load the projects list cache on first use
	git_get_project_list_from_file()
		unless defined $gitweb_project_owner;

	my $owner = exists $gitweb_project_owner->{$project}
		? $gitweb_project_owner->{$project}
		: undef;
	$owner = git_get_project_config('owner')
		unless defined $owner;
	$owner = get_file_owner("$git_dir")
		unless defined $owner;

	return $owner;
}
3062
# Return (age in seconds, age as string) of the most recently committed-to
# ref under refs/heads of the repository at "$projectroot/$path".
#
# Returns (undef, undef) when no committer line with a timestamp was read,
# and an empty list when running or closing the git command fails.
# Side effect: sets the global $git_dir.
sub git_get_last_activity {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";
	my @for_each_ref = (git_cmd(), 'for-each-ref',
	                    '--format=%(committer)',
	                    '--sort=-committerdate',
	                    '--count=1',
	                    'refs/heads');
	open(my $fd, "-|", @for_each_ref) or return;
	my $most_recent = <$fd>;
	close $fd or return;

	return (undef, undef)
		unless defined $most_recent;
	# the committer line ends in '<epoch> <timezone>'
	return (undef, undef)
		unless $most_recent =~ / (\d+) [-+][01]\d\d\d$/;

	my $age = time - $1;
	return ($age, age_string($age));
}
3083
# Return the remotes reported by 'git remote -v' as a hash (a hash reference
# in scalar context) keyed by remote name.  Each value is a hash holding a
# 'heads' slot (left undef here) plus one URL per parenthesised keyword that
# ends the corresponding output line.  When $wanted is given, only that
# remote is collected.  Returns nothing if the command cannot be run or
# closed cleanly.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and stop if
# and when we find what we want.
sub git_get_remotes_list {
	my $wanted = shift;
	my %remotes = ();

	# test open's own result to detect failure
	open my $fd, '-|' , git_cmd(), 'remote', '-v'
		or return;
	while (my $remote = <$fd>) {
		chomp $remote;
		# strip "\t<url> (<key>)" leaving the remote name; lines of any
		# other shape are skipped so that stale captures are never used
		next unless $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
		my ($url, $key) = ($1, $2);
		next if $wanted and not $remote eq $wanted;

		# explicit undef: an empty list here would make the hash
		# constructor odd-sized
		$remotes{$remote} ||= { 'heads' => undef };
		$remotes{$remote}{$key} = $url;
	}
	close $fd or return;
	return wantarray ? %remotes : \%remotes;
}
3108
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
#
# For every remote, 'heads' becomes a reference to the array of head entries
# (as returned by git_get_heads_list) whose name starts with "<remote>/";
# that prefix is removed from the entry's 'name' in the process.
sub fill_remote_heads {
	my $remotes = shift;
	# nothing to fill, and no reason to list any refs
	return unless %$remotes;

	my @heads = map { "remotes/$_" } keys %$remotes;
	my @remoteheads = git_get_heads_list(undef, @heads);
	foreach my $remote (keys %$remotes) {
		# \Q...\E: the remote name is literal text, not a pattern, so
		# e.g. remote 'foo.bar' must not claim the heads of 'fooxbar'
		$remotes->{$remote}{'heads'} = [ grep {
			$_->{'name'} =~ s!^\Q$remote\E/!!
			} @remoteheads ];
	}
}
3121
# Return a reference to a hash mapping object id to the list of ref names
# (without the leading 'refs/') reported for it by
# 'git show-ref --dereference'.  With $type given, only refs under
# "refs/$type" are requested and recorded.  Returns nothing if the command
# cannot be run or closed cleanly.
sub git_get_references {
	my $type = shift || "";
	my %refs;

	# use -- <pattern> if $type
	my @pattern = $type ? ("--", "refs/$type") : ();

	# 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
	# c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
	open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
		or return;

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
		my ($id, $refname) = ($1, $2);
		# autovivifies the list on the first ref seen for this id
		push @{$refs{$id}}, $refname;
	}
	close $fd or return;
	return \%refs;
}
3144
# Return the name 'git name-rev --tags' gives to $hash, with the leading
# 'tags/' removed.  Returns undef when $hash is false, when the command
# prints nothing, or when its output does not name a tag; returns nothing
# if the command cannot be started.
sub git_get_rev_name_tags {
	my $hash = shift || return undef;

	open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
		or return;
	my $name_rev = <$fd>;
	close $fd;

	# the command produced no output at all
	return undef unless defined $name_rev;

	# $hash is matched as literal text, not as a pattern
	if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
		return $1;
	} else {
		# catches also '$hash undefined' output
		return undef;
	}
}
3160
3161 ## ----------------------------------------------------------------------
3162 ## parse to hash functions
3163
# Break an epoch timestamp down into display fields.
#
# $epoch is seconds since the epoch; $tz is a '+hhmm' / '-hhmm' offset
# (defaults to "-0000").  Returns a hash with the UTC fields 'hour',
# 'minute', 'mday', 'day', 'month', 'rfc2822', 'mday-time' and 'iso-8601',
# plus 'hour_local', 'minute_local', 'tz_local' and 'iso-tz' computed by
# shifting the epoch by the given offset.
sub parse_date {
	my ($epoch, $tz) = @_;
	$tz ||= "-0000";

	my @months = qw(Jan Feb Mar Apr May Jun Jul Aug Sep Oct Nov Dec);
	my @days   = qw(Sun Mon Tue Wed Thu Fri Sat);

	# fields as seen in UTC
	my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
	my ($day_name, $month_name, $full_year) =
		($days[$wday], $months[$mon], 1900+$year);
	my %date = (
		'hour'      => $hour,
		'minute'    => $min,
		'mday'      => $mday,
		'day'       => $day_name,
		'month'     => $month_name,
		'rfc2822'   => sprintf("%s, %d %s %4d %02d:%02d:%02d +0000",
		                       $day_name, $mday, $month_name, $full_year,
		                       $hour, $min, $sec),
		'mday-time' => sprintf("%d %s %02d:%02d",
		                       $mday, $month_name, $hour, $min),
		'iso-8601'  => sprintf("%04d-%02d-%02dT%02d:%02d:%02dZ",
		                       $full_year, 1+$mon, $mday, $hour, $min, $sec),
	);

	# fields as seen in the given timezone: shift the epoch by the
	# offset and break it down as if it were UTC
	my ($tz_sign, $tz_hour, $tz_min) =
		($tz =~ m/^([-+])(\d\d)(\d\d)$/);
	my $direction = ($tz_sign eq '-' ? -1 : +1);
	my $offset    = (($tz_hour*60) + $tz_min)*60;
	my ($lsec, $lmin, $lhour, $lmday, $lmon, $lyear) =
		gmtime($epoch + $direction*$offset);
	@date{'hour_local', 'minute_local', 'tz_local'} = ($lhour, $lmin, $tz);
	$date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
	                          1900+$lyear, $lmon+1, $lmday,
	                          $lhour, $lmin, $lsec, $tz);
	return %date;
}
3197
# Parse the tag object $tag_id as printed by 'git cat-file tag'.
#
# Returns a hash with 'id', the header fields that were present ('object',
# 'type', 'name', 'author', 'author_epoch', 'author_tz', 'author_name',
# 'author_email') and 'comment', a reference to the array of lines that
# follow the header (read without removing their line endings; a line
# containing '--BEGIN' that ends the header is kept as the first comment
# line).  Returns nothing when the command fails or no 'tag' header line
# was found.
sub parse_tag {
	my ($tag_id) = @_;

	open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;

	my %tag = ('id' => $tag_id);
	my @comment;
 HEADER:
	while (my $line = <$fd>) {
		chomp $line;
		if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
			$tag{'object'} = $1;
			next HEADER;
		}
		if ($line =~ m/^type (.+)$/) {
			$tag{'type'} = $1;
			next HEADER;
		}
		if ($line =~ m/^tag (.+)$/) {
			$tag{'name'} = $1;
			next HEADER;
		}
		if ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
			@tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
			# split 'Name <email>' when the tagger has that shape
			if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				@tag{'author_name', 'author_email'} = ($1, $2);
			} else {
				$tag{'author_name'} = $tag{'author'};
			}
			next HEADER;
		}
		if ($line =~ m/--BEGIN/) {
			# header ended without a blank line; keep this line
			push @comment, $line;
			last HEADER;
		}
		# a blank line separates the header from the message
		last HEADER if $line eq "";
	}
	push @comment, <$fd>;
	$tag{'comment'} = \@comment;
	close $fd or return;

	return unless defined $tag{'name'};
	return %tag
}
3238
# Parse one record of 'git rev-list --header' output into a commit hash.
#
# $commit_text is the record text.  When $withparents is defined the parent
# ids are taken from the first line only (as printed with --parents);
# otherwise ids from 'parent' header lines are appended to whatever the
# first line lists.
#
# Returns a hash with 'id', 'tree', 'parents' (array ref), 'parent' (first
# parent), author/committer fields, 'title', 'title_short', 'comment'
# (array ref of message lines with the four-space indent removed once),
# 'age', 'age_string', 'age_string_date' and 'age_string_age'.  Returns
# nothing if the text is empty, does not start with an object id, or has
# no 'tree' line.
sub parse_commit_text {
	my ($commit_text, $withparents) = @_;
	my @commit_lines = split '\n', $commit_text;
	my %co;

	pop @commit_lines; # Remove '\0'

	if (! @commit_lines) {
		return;
	}

	my $header = shift @commit_lines;
	if ($header !~ m/^[0-9a-fA-F]{40}/) {
		return;
	}
	($co{'id'}, my @parents) = split ' ', $header;
	# header lines run up to the first empty line
	while (my $line = shift @commit_lines) {
		last if $line eq "\n";
		if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
			$co{'tree'} = $1;
		} elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
			push @parents, $1;
		} elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
			$co{'author'} = to_utf8($1);
			$co{'author_epoch'} = $2;
			$co{'author_tz'} = $3;
			if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'author_name'}  = $1;
				$co{'author_email'} = $2;
			} else {
				$co{'author_name'} = $co{'author'};
			}
		} elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
			$co{'committer'} = to_utf8($1);
			$co{'committer_epoch'} = $2;
			$co{'committer_tz'} = $3;
			if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
				$co{'committer_name'}  = $1;
				$co{'committer_email'} = $2;
			} else {
				$co{'committer_name'} = $co{'committer'};
			}
		}
	}
	if (!defined $co{'tree'}) {
		return;
	};
	$co{'parents'} = \@parents;
	$co{'parent'} = $parents[0];

	# remove added spaces (exactly once per line, so that indentation
	# belonging to the message itself is preserved)
	foreach my $line (@commit_lines) {
		$line =~ s/^    //;
	}

	# the title is the first non-empty message line
	foreach my $line (@commit_lines) {
		next if $line eq "";
		# work on a copy: the shortening below must not leak into
		# the message lines stored in $co{'comment'}
		my $title = $line;
		$co{'title'} = chop_str($title, 80, 5);
		# remove leading stuff of merges to make the interesting part visible
		if (length($title) > 50) {
			$title =~ s/^Automatic //;
			$title =~ s/^merge (of|with) /Merge ... /i;
			if (length($title) > 50) {
				$title =~ s/(http|rsync):\/\///;
			}
			if (length($title) > 50) {
				$title =~ s/(master|www|rsync)\.//;
			}
			if (length($title) > 50) {
				$title =~ s/kernel.org:?//;
			}
			if (length($title) > 50) {
				$title =~ s/\/pub\/scm//;
			}
		}
		$co{'title_short'} = chop_str($title, 50, 5);
		last;
	}
	if (! defined $co{'title'} || $co{'title'} eq "") {
		$co{'title'} = $co{'title_short'} = '(no commit message)';
	}
	$co{'comment'} = \@commit_lines;

	my $age = time - $co{'committer_epoch'};
	$co{'age'} = $age;
	$co{'age_string'} = age_string($age);
	my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
	# commits older than two weeks show the date first, newer ones the age
	if ($age > 60*60*24*7*2) {
		$co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
		$co{'age_string_age'} = $co{'age_string'};
	} else {
		$co{'age_string_date'} = $co{'age_string'};
		$co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
	}
	return %co;
}
3336
# Parse the single commit $commit_id via 'git rev-list --parents --header'.
#
# Returns the hash produced by parse_commit_text, or nothing when the
# command printed no record.  Calls die_error(500, ...) if the command
# cannot be started.
sub parse_commit {
	my ($commit_id) = @_;

	# records in --header output are NUL-terminated
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "rev-list",
		"--parents",
		"--header",
		"--max-count=1",
		$commit_id,
		"--"
		or die_error(500, "Open git-rev-list failed");
	# take the first record explicitly: passing <$fd> straight into the
	# argument list would, on empty output, shift the following argument
	# into the commit text position
	my ($commit_text) = <$fd>;
	close $fd;

	return unless defined $commit_text;

	my %co = parse_commit_text($commit_text, 1);
	return %co;
}
3355
# Parse a series of commits listed by 'git rev-list --header'.
#
# Starts at $commit_id, returns at most $maxcount commits (default 1) after
# skipping $skip (default 0), optionally limited to $filename; @args and
# the global @extra_options are passed through to rev-list.  Returns the
# list of commit hash references (an array reference in scalar context).
# Calls die_error(500, ...) if the command cannot be started.
sub parse_commits {
	my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

	$maxcount = 1 unless $maxcount;
	$skip     = 0 unless $skip;

	# records in --header output are NUL-terminated
	local $/ = "\0";

	my @rev_list = (git_cmd(), "rev-list",
	                "--header",
	                @args,
	                "--max-count=$maxcount",
	                "--skip=$skip",
	                @extra_options,
	                $commit_id,
	                "--");
	push @rev_list, $filename if $filename;

	open(my $fd, "-|", @rev_list)
		or die_error(500, "Open git-rev-list failed");

	my @cos;
	while (my $record = <$fd>) {
		my %co = parse_commit_text($record);
		push @cos, \%co;
	}
	close $fd;

	return wantarray ? @cos : \@cos;
}
3383
# parse line of git-diff-tree "raw" output
#
# Three line shapes are recognised: an ordinary raw diff line, a combined
# diff line (for a merge commit), and a bare commit id.  Returns a hash
# (a hash reference in scalar context) with the fields of the recognised
# shape; the hash is empty when the line matches none of them.
sub parse_difftree_raw_line {
	my $line = shift;
	my %res;

	# ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M	ls-files.c'
	# ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M	rev-tree.c'
	if (my @plain = ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/)) {
		my $paths = pop @plain;
		@res{qw(from_mode to_mode from_id to_id status similarity)} = @plain;
		if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
			($res{'from_file'}, $res{'to_file'}) = map { unquote($_) } split("\t", $paths);
		} else {
			$res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($paths);
		}
	}
	# '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR	git-gui/git-gui.sh'
	# combined diff (for merge commit)
	elsif (my @combined = ($line =~ m/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$/)) {
		my ($colons, $modes, $ids, $statuses, $path) = @combined;
		# the last mode and id describe the result, the rest the parents
		my @from_modes = split(' ', $modes);
		my @from_ids   = split(' ', $ids);
		$res{'nparents'}  = length($colons);
		$res{'to_mode'}   = pop @from_modes;
		$res{'from_mode'} = \@from_modes;
		$res{'to_id'}     = pop @from_ids;
		$res{'from_id'}   = \@from_ids;
		$res{'status'}    = [ split('', $statuses) ];
		$res{'to_file'}   = unquote($path);
	}
	# 'c512b523472485aef4fff9e57b229d9d243c967f'
	elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
		$res{'commit'} = $1;
	}

	return wantarray ? %res : \%res;
}
3422
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
#
# A hash reference is handed back untouched; anything else is passed to
# parse_difftree_raw_line and its result returned.
sub parsed_difftree_line {
	my ($line_or_ref) = @_;

	# pre-parsed (or generated by hand)
	return $line_or_ref
		if ref($line_or_ref) eq "HASH";

	return parse_difftree_raw_line($line_or_ref);
}
3435
# parse line of git-ls-tree output
#
# Options (passed as key/value pairs after the line):
#   '-l' - the line has the size column of 'ls-tree -l'
#   '-z' - the name is taken verbatim instead of being run through unquote
# Returns a hash (a hash reference in scalar context) with 'mode', 'type',
# 'hash', 'name' and, with '-l', 'size'.  A line that does not have the
# expected shape yields an empty hash.
sub parse_ls_tree_line {
	my $line = shift;
	my %opts = @_;
	my %res;
	my $name;

	# captures are copied only after a successful match, so that a
	# malformed line never picks up values left over from earlier matches
	if ($opts{'-l'}) {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717	panic.c'
		if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s) {
			@res{'mode', 'type', 'hash', 'size'} = ($1, $2, $3, $4);
			$name = $5;
		}
	} else {
		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
		if ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s) {
			@res{'mode', 'type', 'hash'} = ($1, $2, $3);
			$name = $4;
		}
	}

	if (defined $name) {
		$res{'name'} = $opts{'-z'} ? $name : unquote($name);
	}

	return wantarray ? %res : \%res;
}
3471
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# $diffinfo is a parsed difftree line.  $from and $to are hash references
# that receive 'file' and 'href' entries for the pre-image(s) and the
# post-image; @parents holds the parent ids used for combined diffs.  For a
# combined diff (one with 'nparents') the $from entries are arrays with one
# element per parent.  'href' is removed (or undef for a parent) where the
# file is new on that side or deleted in the result.
sub parse_from_to_diffinfo {
	my ($diffinfo, $from, $to, @parents) = @_;

	if (!$diffinfo->{'nparents'}) {
		# ordinary (not combined) diff
		$from->{'file'} = $diffinfo->{'from_file'};
		if ($diffinfo->{'status'} eq "A") { # new (added) file
			delete $from->{'href'};
		} else {
			$from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
			                       hash=>$diffinfo->{'from_id'},
			                       file_name=>$from->{'file'});
		}
	} else {
		# combined diff
		$from->{'file'} = [];
		$from->{'href'} = [];
		fill_from_file_info($diffinfo, @parents)
			unless exists $diffinfo->{'from_file'};
		foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
			# fall back to the result name when this parent has none
			my $parent_file = $diffinfo->{'from_file'}[$i];
			$from->{'file'}[$i] =
				defined $parent_file ? $parent_file : $diffinfo->{'to_file'};
			$from->{'href'}[$i] =
				$diffinfo->{'status'}[$i] ne "A" # not new (added) file
				? href(action=>"blob",
				       hash_base=>$parents[$i],
				       hash=>$diffinfo->{'from_id'}[$i],
				       file_name=>$from->{'file'}[$i])
				: undef;
		}
	}

	$to->{'file'} = $diffinfo->{'to_file'};
	if (is_deleted($diffinfo)) {
		delete $to->{'href'};
	} else { # file exists in result
		$to->{'href'} = href(action=>"blob", hash_base=>$hash,
		                     hash=>$diffinfo->{'to_id'},
		                     file_name=>$to->{'file'});
	}
}
3517
3518 ## ......................................................................
3519 ## parse to array of hashes functions
3520
# List refs of the given classes (default: 'heads'), most recently
# committed first, using 'git for-each-ref'.
#
# With a true $limit, one entry more than $limit is requested from git.
# Each entry is a hash reference with 'fullname', 'name' (without the
# leading refs/heads/ or refs/remotes/), 'id', 'title', 'epoch' and 'age'.
# Returns the list of entries (an array reference in scalar context), or
# nothing if the command cannot be started.
sub git_get_heads_list {
	my ($limit, @classes) = @_;
	@classes = ('heads') unless @classes;
	my @patterns = map { "refs/$_" } @classes;
	my @count_opt = $limit ? ('--count='.($limit+1)) : ();

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		@count_opt, '--sort=-committerdate',
		'--format=%(objectname) %(refname) %(subject)%00%(committer)',
		@patterns
		or return;

	my @headslist;
	while (my $line = <$fd>) {
		chomp $line;
		# ref data and committer data are separated by a NUL
		my ($refinfo, $committerinfo) = split(/\0/, $line);
		my ($hash, $fullname, $title) = split(' ', $refinfo, 3);
		my (undef, $epoch) =
			($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
		(my $name = $fullname) =~ s!^refs/(?:head|remote)s/!!;
		my $age = $epoch ? age_string(time - $epoch) : "unknown";

		push @headslist, {
			'fullname' => $fullname,
			'name'     => $name,
			'id'       => $hash,
			'title'    => $title || '(no commit message)',
			'epoch'    => $epoch,
			'age'      => $age,
		};
	}
	close $fd;

	return wantarray ? @headslist : \@headslist;
}
3559
# List refs under refs/tags, most recently created first, using
# 'git for-each-ref'.
#
# With a true $limit, one entry more than $limit is requested from git.
# Each entry is a hash reference with 'fullname', 'name' (without the
# leading refs/tags/), 'type', 'id', 'reftype' and 'refid'; tag objects
# also get 'subject', and tags and commits get 'epoch' and 'age'.
# Returns the list of entries (an array reference in scalar context), or
# nothing if the command cannot be started.
sub git_get_tags_list {
	my ($limit) = @_;
	my @count_opt = $limit ? ('--count='.($limit+1)) : ();

	open my $fd, '-|', git_cmd(), 'for-each-ref',
		@count_opt, '--sort=-creatordate',
		'--format=%(objectname) %(objecttype) %(refname) '.
		'%(*objectname) %(*objecttype) %(subject)%00%(creator)',
		'refs/tags'
		or return;

	my @tagslist;
	while (my $line = <$fd>) {
		chomp $line;
		# ref data and creator data are separated by a NUL
		my ($refinfo, $creatorinfo) = split(/\0/, $line);
		my ($id, $type, $fullname, $refid, $reftype, $title) = split(' ', $refinfo, 6);
		my (undef, $epoch) =
			($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
		(my $name = $fullname) =~ s!^refs/tags/!!;

		my %ref_item = (
			'fullname' => $fullname,
			'type'     => $type,
			'id'       => $id,
			'name'     => $name,
		);

		if ($type eq "tag") {
			# tag object: report what it points at
			@ref_item{'subject', 'reftype', 'refid'} = ($title, $reftype, $refid);
		} else {
			# ref points directly at the object
			@ref_item{'reftype', 'refid'} = ($type, $id);
		}

		if ($type eq "tag" || $type eq "commit") {
			$ref_item{'epoch'} = $epoch;
			$ref_item{'age'} = $epoch ? age_string(time - $epoch) : "unknown";
		}

		push @tagslist, \%ref_item;
	}
	close $fd;

	return wantarray ? @tagslist : \@tagslist;
}
3608
3609 ## ----------------------------------------------------------------------
3610 ## filesystem-related functions
3611
# Return the owner of $path: the GECOS field of the owning user, cut at the
# first ',' or ';' and passed through to_utf8.
# Returns undef when $path cannot be stat'ed or the owning uid has no
# GECOS entry.
sub get_file_owner {
	my $path = shift;

	my $st_uid = (stat($path))[4];
	# stat failed: an undefined uid would otherwise be looked up as uid 0
	# and report that account as the owner
	return undef unless defined $st_uid;

	my $gcos = (getpwuid($st_uid))[6];
	if (!defined $gcos) {
		return undef;
	}
	my $owner = $gcos;
	# keep only the part before the first ',' or ';'
	$owner =~ s/[,;].*$//;
	return to_utf8($owner);
}
3624
# Print the contents of $filename, each line passed through to_utf8.
# The file is expected to exist; if it cannot be opened nothing is printed.
sub insert_file {
	my $filename = shift;

	# do not read from an unopened handle when the open fails
	open my $fd, '<', $filename
		or return;
	print map { to_utf8($_) } <$fd>;
	close $fd;
}
3633
3634 ## ......................................................................
3635 ## mimetype related functions
3636
# Look up the MIME type for $filename's extension in the mime.types-style
# file $mimemap (lines of '<mimetype> <ext> [<ext> ...]', '#' starts a
# comment line).  When an extension is listed more than once the last
# listing wins.  Returns undef when the map is not readable, the filename
# has no '.', or the extension is not listed.
sub mimetype_guess_file {
	my $filename = shift;
	my $mimemap = shift;
	-r $mimemap or return undef;

	# without a successful match there is no extension to look up
	# (and $1 would hold whatever an earlier match left behind)
	$filename =~ /\.([^.]*)$/
		or return undef;
	my $wanted_ext = $1;

	my %mimemap;
	open(my $mh, '<', $mimemap) or return undef;
	# lexical loop variable: leave the caller's $_ alone
	while (my $line = <$mh>) {
		next if $line =~ m/^#/; # skip comments
		my ($mimetype, @exts) = split(/\s+/, $line);
		foreach my $ext (@exts) {
			$mimemap{$ext} = $mimetype;
		}
	}
	close($mh);

	return $mimemap{$wanted_ext};
}
3656
# Guess the MIME type of $filename from its extension.
#
# Consults $mimetypes_file first when it is set (a relative path is taken
# relative to the current project), then '/etc/mime.types'.  Returns undef
# when the filename has no '.' or no map knows the extension.
sub mimetype_guess {
	my ($filename) = @_;
	return undef if $filename !~ /\./;

	my $mime;
	if ($mimetypes_file) {
		# a relative path is relative to project
		my $file = ($mimetypes_file =~ m!^/!)
			? $mimetypes_file
			: "$projectroot/$project/$mimetypes_file";
		$mime = mimetype_guess_file($filename, $file);
	}
	$mime = mimetype_guess_file($filename, '/etc/mime.types')
		unless $mime;
	return $mime;
}
3673
# Determine the MIME type of a blob.
#
# $fd is a filehandle on the blob contents, $filename its name (optional).
# A type guessed from the filename wins; otherwise, without a filehandle,
# $default_blob_plain_mimetype is returned; otherwise content that passes
# the -T text test is 'text/plain', and the rest is typed by a few known
# image extensions or falls back to 'application/octet-stream'.
sub blob_mimetype {
	my ($fd, $filename) = @_;

	if ($filename) {
		my $mime = mimetype_guess($filename);
		return $mime if $mime;
	}

	# just in case
	return $default_blob_plain_mimetype unless $fd;

	return 'text/plain'               if -T $fd;
	return 'application/octet-stream' unless $filename;
	return 'image/png'                if $filename =~ m/\.png$/i;
	return 'image/gif'                if $filename =~ m/\.gif$/i;
	return 'image/jpeg'               if $filename =~ m/\.jpe?g$/i;
	return 'application/octet-stream';
}
3700
# Return the content type to send for a blob: $type if given, otherwise the
# result of blob_mimetype($fd, $file_name).  For 'text/plain' the charset
# from $default_text_plain_charset is appended when that is defined.
sub blob_contenttype {
	my ($fd, $file_name, $type) = @_;

	$type = blob_mimetype($fd, $file_name) unless $type;

	return $type
		unless $type eq 'text/plain' && defined $default_text_plain_charset;

	return "$type; charset=$default_text_plain_charset";
}
3711
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# The basename of $file_name (with a trailing '.in' removed) is looked up
# in %highlight_basename first, then its extension in %highlight_ext.
# Returns undef when $highlight is false, $file_name is undefined, or
# neither table has an entry.  $mimetype is not used.
sub guess_file_syntax {
	my ($highlight, $mimetype, $file_name) = @_;
	return undef unless ($highlight && defined $file_name);
	my $basename = basename($file_name, '.in');
	return $highlight_basename{$basename}
		if exists $highlight_basename{$basename};

	# a name without '.' has no extension; without this check $1 would
	# still hold the capture of some earlier, unrelated match
	$basename =~ /\.([^.]*)$/
		or return undef;
	my $ext = $1 or return undef;
	return $highlight_ext{$ext}
		if exists $highlight_ext{$ext};

	return undef;
}
3728
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# When highlighting applies, $fd is closed and reopened on a pipeline that
# feeds 'git cat-file blob $hash' (the global $hash) into $highlight_bin
# with the given $syntax.  Calls die_error(500, ...) if the pipeline
# cannot be opened.
sub run_highlighter {
	my ($fd, $highlight, $syntax) = @_;
	unless ($highlight && defined $syntax) {
		return $fd;
	}

	close $fd;
	my $blob_cmd      = quote_command(git_cmd(), "cat-file", "blob", $hash);
	my $highlight_cmd = quote_command($highlight_bin).
	                    " --replace-tabs=8 --fragment --syntax $syntax";
	open $fd, "$blob_cmd | $highlight_cmd |"
		or die_error(500, "Couldn't open file or run syntax highlighter");
	return $fd;
}
3742
3743 ## ======================================================================
3744 ## functions printing HTML: header, footer, error page
3745
# Build the page title from the site name and, as far as they are defined,
# the current project, action and file name (or, without a project, the
# project filter).
sub get_page_title {
	my $title = to_utf8($site_name);

	if (!defined $project) {
		$title .= " - projects in '" . esc_path($project_filter) . "'"
			if defined $project_filter;
		return $title;
	}
	$title .= " - " . to_utf8($project);

	if (defined $action) {
		$title .= "/$action"; # $action is US-ASCII (7bit ASCII)

		if (defined $file_name) {
			$title .= " - " . esc_path($file_name);
			# show a tree as a directory
			$title .= "/"
				if $action eq "tree" && $file_name !~ m|/$|;
		}
	}

	return $title;
}
3768
# Return the content type to use for HTML pages: 'application/xhtml+xml'
# when the request explicitly accepts it, 'text/html' otherwise.
sub get_content_type_html {
	# require explicit support from the UA if we are to send the page as
	# 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
	# we have to do this because MSIE sometimes globs '*/*', pretending to
	# support xhtml+xml but choking when it gets what it asked for.
	my $accept = $cgi->http('HTTP_ACCEPT');
	my $wants_xhtml =
		defined $accept &&
		$accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
		$cgi->Accept('application/xhtml+xml') != 0;

	return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3782
# Print the <link rel="alternate"> elements that go into the page <head>.
#
# With a project selected, an RSS and an Atom feed link are printed, each in
# two variants: the full log, and the log without merges.  The link
# parameters come from get_feed_info(); the feed title defaults to 'log'.
# Without a project, links to the plain-text project index and to the OPML
# project list are printed instead.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # %href_params outlives this iteration: drop the
                        # '--no-merges' option left over from the previous
                        # format, otherwise the "full" link of the second
                        # feed would silently exclude merges as well
                        $href_params{'extra_options'} = undef;
                        $href_params{'action'} = $type;
                        $link_attr{'-href'} = href(%href_params);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        # second variant of the same feed: without merges
                        $href_params{'extra_options'} = '--no-merges';
                        $link_attr{'-href'} = href(%href_params);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3827
# Print the <link> elements of the page <head>: stylesheets, feed links
# (only for a '200 OK' response) and the favicon.
#
# Parameter: the HTTP status line of the response being generated.
sub print_header_links {
        my ($status) = @_;

        # A defined $stylesheet (the older, single-valued config variable)
        # takes precedence, for backwards compatibility with config files
        # that set it; otherwise every non-empty entry of @stylesheets is used.
        my @css_urls = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $css_url (@css_urls) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($css_url).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
                if defined $favicon;
}
3847
# Print one breadcrumb link per path component given as argument.
#
# Each link points to the 'project_list' action filtered by the directory
# prefix accumulated so far, and is followed by " / ".
# Empty components are skipped; a component named "0" is a valid directory
# name and is printed like any other (a plain truthiness test on the
# component would end the breadcrumbs there).
sub print_nav_breadcrumbs_path {
        my @parts = @_;
        my $dirprefix;

        foreach my $part (@parts) {
                next unless (defined $part && length $part);

                $dirprefix = defined $dirprefix ? "$dirprefix/$part" : $part;
                print $cgi->a({-href => href(project => undef,
                                             project_filter => $dirprefix,
                                             action => "project_list")},
                              esc_html($part)) . " / ";
        }
}
3859
# Print the breadcrumb trail shown in the page header.
#
# The trail starts with the home link.  With a project selected it
# continues with the project's directory components, the project itself
# (linked to its summary), the current action and, if given, the
# -action_extra option.  Without a project, the components of the active
# project filter (if any) are printed instead.
#
# Options:
#   -action_extra => text appended after the action; when present the
#                    action itself is printed as a link
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $action_extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";

        if (!defined $project) {
                print_nav_breadcrumbs_path(split '/', $project_filter)
                        if defined $project_filter;
                return;
        }

        my @project_dirs = split '/', $project;
        my $project_leaf = pop @project_dirs;
        print_nav_breadcrumbs_path(@project_dirs);
        print $cgi->a({-href => href(action=>"summary")}, esc_html($project_leaf));

        if (defined $action) {
                my $action_print = $action;
                $action_print = $cgi->a({-href => href(action=>$action)}, $action)
                        if defined $action_extra;
                print " / $action_print";
        }
        print " / $action_extra"
                if defined $action_extra;
        print "\n";
}
3885
# Print the search form shown below the page header.
#
# The form submits (GET) the 'search' action for the current project,
# together with the hash to search from ($hash_base, else $hash, else
# "HEAD"), the search type, the search text and the 're' checkbox.
# With the 'pathinfo' feature enabled the project is encoded in the form's
# action URL; otherwise it is passed as the hidden 'p' parameter.
#
# Side effect: an undefined global $searchtext is set to "".
sub print_search_form {
        if (!defined $searchtext) {
                $searchtext = "";
        }

        my $search_hash =
                defined $hash_base ? $hash_base :
                defined $hash      ? $hash      :
                                     "HEAD";

        # NOTE: this lexical shadows the global $action on purpose;
        # here it is the form's target URL
        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if ($use_pathinfo) {
                $action .= "/".esc_url($project);
        }

        # start_form() is the supported spelling; the 'startform' alias is
        # deprecated and no longer exists in newer CGI.pm releases
        print $cgi->start_form(-method => "get", -action => $action) .
              "<div class=\"search\">\n" .
              ($use_pathinfo ? '' :
               $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
              " search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
3921
# Print the HTTP header (unless suppressed) and the top of the HTML page:
# XML prolog, doctype, <head>, optional site header file, page header with
# logo and breadcrumbs, and the search form when a project is selected and
# the 'search' feature is enabled.
#
# Parameters:
#   status  - HTTP status line, defaults to "200 OK"
#   expires - value for the -expires argument of the HTTP header
#   options - -no_http_header => true to skip printing the HTTP header;
#             all options are also handed to print_nav_breadcrumbs()
sub git_header_html {
        my ($status, $expires, %opts) = @_;
        $status ||= "200 OK";

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        $mod_perl_version = " $ENV{'MOD_PERL'}"
                if $ENV{'MOD_PERL'};
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # the stylesheet, favicon etc urls won't work correctly with path_info
        # unless we set the appropriate base URL
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        # optional site-wide header, included only if the file exists
        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $cgi->img({-src => esc_url($logo),
                                         -width => 72, -height => 27,
                                         -alt => "git",
                                         -class => "logo"}));
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        # the feature is looked up unconditionally, the form needs a project
        my $have_search = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $have_search);
}
3980
# Print the bottom of the HTML page: the page footer (project description
# and feed links, or OPML/TXT links when no project is selected), optional
# timing information, optional site footer file, the JavaScript includes
# and the closing </body></html> tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                # no project selected: link to the project lists instead of feeds
                print $cgi->a({-href => href(project=>undef, action=>"opml",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index",
                                             project_filter => $project_filter),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # nothing specific came back from get_feed_info():
                # mark the feed links as generic
                $feed_class .= ' generic'
                        unless %href_params;
                $href_params{'-title'} ||= 'log';

                for my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        print $cgi->a({-href => href(%href_params),
                                      -title => "$href_params{'-title'} $format feed",
                                      -class => $feed_class}, $format)."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print 'This page took <span id="generating_time" class="time_span">'.
                      tv_interval($t0, [ gettimeofday() ]).
                      ' seconds </span> and <span id="generating_cmd">'.
                      $number_of_git_cmds.
                      "</span> git commands  to generate.\n";
                print "</div>\n"; # id="generating_info"
        }

        # optional site-wide footer, included only if the file exists
        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        if (defined $action && $action eq 'blame_incremental') {
                # incremental blame: start fetching blame data for this page
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
                      qq!           "!. href() .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # onload handler: optional link fixing and timezone setup
                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!;
                print qq!       fixLinks();\n!
                        if gitweb_check_feature('javascript-actions');
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        # 'expires' is in days
                        print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!.
                              qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }
                print qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4059
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# The status code defaults to 500 and the message to "Internal Server
# Error".  The message is HTML-escaped; the detailed description is printed
# as-is.  Any further arguments are options, which are also passed on to
# git_header_html(); unless -error_handler is set among them, control jumps
# to the DONE_GITWEB label after the page has been printed.
# A status code outside the list above is sent as '500 Internal Server
# Error' (the page body still shows the code that was passed in).
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # An unknown code must not reach git_header_html() as undef: that
        # would fall back to "200 OK" and serve the error page as a success.
        my $http_status = $http_responses{$status} || $http_responses{500};

        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4103
4104 ## ----------------------------------------------------------------------
4105 ## functions printing or outputting HTML: navigation
4106
# Print the main navigation bar (<div class="page_nav">).
#
# Parameters:
#   current  - name of the current view; printed as plain text, not a link
#   suppress - name of a standard view to leave out (false value: none)
#   head     - hash used for the commit/commitdiff links and, for some
#              current views, for the shortlog/log links as well
#   treehead - 'hash' parameter of the tree link
#   treebase - 'hash_base' parameter of the tree link
#   extra    - HTML printed on a second line (pager or formats)
#
# Entries configured through the 'actions' feature are inserted after the
# view they name as position; in their link %n, %f, %h, %b and %% are
# replaced by the project name, the project's filesystem path, the tree
# head, the tree base and a literal '%'.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' unless defined $extra; # pager or formats

        # standard views, minus the one the caller asked to hide
        my @navs = grep { !$suppress || $_ ne $suppress }
                qw(summary shortlog log commit commitdiff tree);

        # href() parameters of every view
        my %arg;
        $arg{$_} = { action => $_ } foreach @navs;

        if (defined $head) {
                $arg{$_}{'hash'} = $head foreach qw(commit commitdiff);
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        $arg{$_}{'hash'} = $head foreach qw(shortlog log);
                }
        }

        $arg{'tree'}{'hash'} = $treehead if defined $treehead;
        $arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        # custom actions come as a flat list of (label, link, position) triples
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # insert the label right after the view named by $pos
                my @with_custom;
                foreach my $nav (@navs) {
                        push @with_custom, $nav;
                        push @with_custom, $label if $nav eq $pos;
                }
                @navs = @with_custom;

                # expand the %-placeholders of the link
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @entries;
        foreach my $nav (@navs) {
                if ($nav eq $current) {
                        push @entries, $nav;
                        next;
                }
                # custom actions carry a ready-made link in '_href'
                push @entries,
                        $cgi->a({-href => ($arg{$nav}{_href} ? $arg{$nav}{_href} : href(%{$arg{$nav}}))}, "$nav");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @entries);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4156
# Returns a submenu for the navigation of the refs views (tags, heads,
# remotes): the views joined by " | ", each one a link except the current
# view, which is plain text.  The remotes view is only included if the
# 'remote_heads' feature is enabled.
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                push @entries, ($view eq $current)
                        ? $view
                        : $cgi->a({-href => href(action=>$view)}, $view);
        }
        return join(" | ", @entries);
}
4169
# Returns the "first . prev . next" paging navigation as an HTML string.
#
# Parameters:
#   action        - accepted for the callers' sake, not used here
#   page          - current page number; "first" and "prev" are links
#                   only when it is greater than 0
#   has_next_link - true if "next" should be a link
#
# The links replay the current request with only the page changed.
sub format_paging_nav {
        my (undef, $page, $has_next_link) = @_;

        my $first = "first";
        my $prev  = "prev";
        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                  -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        my $next = "next";
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return $first . " &sdot; " . $prev . " &sdot; " . $next;
}
4195
4196 ## ......................................................................
4197 ## functions printing or outputting HTML: div
4198
# Print a <div class="header"> containing a single link.
#
# Parameters:
#   action    - action the link points to; also the link text when no
#               title is given
#   title     - link text, printed as given
#   hash      - 'hash' link parameter, added only if true
#   hash_base - 'hash_base' link parameter, added only if true
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = (
                'action' => $action,
                ($hash      ? ('hash'      => $hash)      : ()),
                ($hash_base ? ('hash_base' => $hash_base) : ()),
        );
        my $label = $title ? $title : $action;

        print "<div class=\"header\">\n" .
              $cgi->a({-href => href(%args), -class => "title"}, $label) .
              "\n</div>\n";
}
4212
# Returns a table row of class "metadata_url" with two cells: the given
# name and the given URL.  Both values are inserted as given, without
# any escaping.
sub format_repo_url {
        my ($name, $url) = @_;
        my $cells = "<td>$name</td>" . "<td>$url</td>";
        return '<tr class="metadata_url">' . $cells . "</tr>\n";
}
4217
# Group output by placing it in a DIV element and adding a header.
# Options for start_div() can be provided by passing a hash reference as the
# first parameter to the function.
# Options to git_print_header_div() can be provided by passing an array
# reference. This must follow the options to start_div if they are present.
# The content can be a scalar, which is output as-is, a scalar reference, which
# is output after html escaping, an IO handle passed as *handle, \*handle,
# *handle{IO} or a filehandle object, or a function reference. In the latter
# case all following parameters will be taken as argument to the content
# function call.
sub git_print_section {
        my ($div_args, $header_args, $content);
        my $arg = shift;
        if (ref($arg) eq 'HASH') {
                $div_args = $arg;
                $arg = shift;
        }
        if (ref($arg) eq 'ARRAY') {
                $header_args = $arg;
                $arg = shift;
        }
        $content = $arg;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        # Recognize handles by their underlying type rather than by class
        # name: *handle{IO} is blessed into IO::File on perl >= 5.12 (it
        # used to be IO::Handle), and a bare *handle is not a reference at
        # all, so it has to be detected before the plain scalar case.
        require Scalar::Util;
        my $reftype = Scalar::Util::reftype($content) || '';
        my $is_handle = $reftype eq 'GLOB'
                     || $reftype eq 'IO'
                     || ref(\$content) eq 'GLOB';

        if (ref($content) eq 'CODE') {
                $content->(@_);
        } elsif (ref($content) eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($is_handle) {
                print <$content>;
        } elsif (!ref($content) && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4255
# Returns the HTML for a timestamp: the RFC 2822 date followed by the
# local time and timezone in parentheses.
#
# Parameter: reference to a date hash; the keys 'rfc2822', 'hour_local',
# 'minute_local' and 'tz_local' are read.
#
# When the 'javascript-timezone' feature supplies a CSS class name, the
# RFC 2822 part is wrapped in a <span> of that class.  Local hours before
# 6 are wrapped in <span class="atnight">.
sub format_timestamp_html {
        my ($date) = @_;

        # only the third value of the feature is needed here
        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');
        my $stamp = $datetime_class
                ? qq!<span class="$datetime_class">$date->{'rfc2822'}</span>!
                : $date->{'rfc2822'};

        my $localtime_format = ($date->{'hour_local'} < 6)
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';

        return $stamp . ' ' .
               sprintf($localtime_format,
                       $date->{'hour_local'}, $date->{'minute_local'}, $date->{'tz_local'});
}
4276
# Outputs the author name and date in long form: the author name as a
# search link, the author timestamp in brackets and the author's avatar,
# all wrapped in one element of class "author_date".
#
# Parameters: a commit hash reference, followed by options:
#   -tag => name of the wrapping element (defaults to 'div')
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $author_link = format_search_author($author, "author", esc_html($author));
        my $timestamp   = format_timestamp_html(\%ad);
        my $avatar      = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $author_link .
              " [" . $timestamp . "]" .
              $avatar .
              "</$tag>\n";
}
4291
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
# Every person takes two rows: name, e-mail and avatar (the avatar cell
# spans both rows) in the first, the timestamp in the second.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') if !@people;

        for my $who (@people) {
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});
                my $person_name  = $co->{"${who}_name"};
                my $person_email = $co->{"${who}_email"};

                my $name_link  = format_search_author($person_name, $who,
                                                      esc_html($person_name));
                my $email_link = format_search_author($person_email, $who,
                                                      esc_html("<" . $person_email . ">"));
                my $avatar     = git_get_avatar($person_email, -size => 'double');
                my $timestamp  = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>" .
                      $name_link . " " . $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $timestamp .
                      "</td>" .
                      "</tr>\n";
        }
}
4319
# Print the path of the displayed object as <div class="page_path">.
#
# Parameters:
#   name - path of the object within the repository (may be undefined)
#   type - 'blob' or 'tree' make the last path component a link (to the
#          'blob_plain' and 'tree' actions respectively); with any other
#          value it is printed as plain text
#   hb   - hash base used by every generated link
#
# The path starts with a link to the tree root labelled "[<project>]";
# every leading directory of the name links to its 'tree' view.
sub git_print_page_path {
        my ($name, $type, $hb) = @_;

        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        # test the length, not the truth value: a top-level
                        # directory named "0" must still get a separator
                        $fullname .= (length($fullname) ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # the links below describe the path passed in as $name, so
                # they use it rather than the global $file_name
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4357
# Print the lines of a commit message as HTML, one line per <br/>.
#
# Parameters: a reference to the array of message lines, followed by options:
#   -remove_title     => drop the first line (the title)
#   -remove_signoff   => drop signoff lines instead of printing them
#   -final_empty_line => end the output with a single empty line
#
# Signoff lines (Signed-off-by, Acked-by, Cc) are wrapped in
# <span class="signoff">.  Runs of empty lines are collapsed into one, and
# empty lines directly after a printed signoff line are dropped.
# NOTE: the title and leading empty lines are removed from the caller's
# array itself.
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $after_signoff = 0; # previous printed line was a signoff line
        my $empty = 0;         # previous printed line was empty
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        # a removed signoff line leaves the state alone, so
                        # the empty lines around it still collapse into one
                        next if $opts{'-remove_signoff'};

                        print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                        $after_signoff = 1;
                        $empty = 0;
                        next;
                }

                # print only one empty line
                # do not print empty line after signoff
                if ($line eq "") {
                        next if ($empty || $after_signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                }
                # only reset once a line is really printed; skipped empty
                # lines must not end the "after signoff" state
                $after_signoff = 0;

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4406
# return link target (what link points to): the whole content of the blob
# with the given hash, as output by "cat-file blob" run through git_cmd().
# Returns nothing if the command cannot be started or if closing its
# pipe fails.
sub git_get_link_target {
        my ($hash) = @_;

        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;

        # slurp the whole output at once
        my $link_target = do { local $/; <$fd> };

        close $fd
                or return;

        return $link_target;
}
4424
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# An undefined or empty basedir means the link is in the top tree.
# '//', '/./' and '/../' are resolved; a link that leads outside of the
# top directory cannot be normalized.  Path components are compared as
# strings, so a file or directory named "0" is kept.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir);
        # without a basedir we already are in the top tree
        my $path = (defined $basedir && length($basedir))
                ? $basedir . '/' . $link_target
                : $link_target;

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and ''
                next if ($part eq '' || $part eq '.');

                if ($part eq '..') {
                        # link leads outside repository (outside top dir)
                        return unless @path_parts;
                        pop @path_parts;
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
4464
4465 # print tree entry (row of git_tree), but without encompassing <tr> element
4466 sub git_print_tree_entry {
4467         my ($t, $basedir, $hash_base, $have_blame) = @_;
4468
4469         my %base_key = ();
4470         $base_key{'hash_base'} = $hash_base if defined $hash_base;
4471
4472         # The format of a table row is: mode list link.  Where mode is
4473         # the mode of the entry, list is the name of the entry, an href,
4474         # and link is the action links of the entry.
4475
4476         print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
4477         if (exists $t->{'size'}) {
4478                 print "<td class=\"size\">$t->{'size'}</td>\n";
4479         }
4480         if ($t->{'type'} eq "blob") {
4481                 print "<td class=\"list\">" .
4482                         $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
4483                                                file_name=>"$basedir$t->{'name'}", %base_key),
4484                                 -class => "list"}, esc_path($t->{'name'}));
4485                 if (S_ISLNK(oct $t->{'mode'})) {
4486                         my $link_target = git_get_link_target($t->{'hash'});
4487                         if ($link_target) {
4488                                 my $norm_target = normalize_link_target($link_target, $basedir);
4489                                 if (defined $norm_target) {
4490                                         print " -> " .
4491                                               $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
4492                                                                      file_name=>$norm_target),
4493                                                        -title => $norm_target}, esc_path($link_target));
4494                                 } else {
4495                                         print " -> " . esc_path($link_target);
4496                                 }
4497                         }
4498                 }
4499                 print "</td>\n";
4500                 print "<td class=\"link\">";
4501                 print $cgi->a({-href => href(action=>"blob", hash=>$t->{'hash'},
4502                                              file_name=>"$basedir$t->{'name'}", %base_key)},
4503                               "blob");
4504                 if ($have_blame) {
4505                         print " | " .
4506                               $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
4507                                                      file_name=>"$basedir$t->{'name'}", %base_key)},
4508                                       "blame");
4509                 }
4510                 if (defined $hash_base) {
4511                         print " | " .
4512                               $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
4513                                                      hash=>$t->{'hash'}, file_name=>"$basedir$t->{'name'}")},
4514                                       "history");
4515                 }
4516                 print " | " .
4517                         $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
4518                                                file_name=>"$basedir$t->{'name'}")},
4519                                 "raw");
4520                 print "</td>\n";
4521
4522         } elsif ($t->{'type'} eq "tree") {
4523                 print "<td class=\"list\">";
4524                 print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
4525                                              file_name=>"$basedir$t->{'name'}",
4526                                              %base_key)},
4527                               esc_path($t->{'name'}));
4528                 print "</td>\n";
4529                 print "<td class=\"link\">";
4530                 print $cgi->a({-href => href(action=>"tree", hash=>$t->{'hash'},
4531                                              file_name=>"$basedir$t->{'name'}",
4532                                              %base_key)},
4533                               "tree");
4534                 if (defined $hash_base) {
4535                         print " | " .
4536                               $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
4537                                                      file_name=>"$basedir$t->{'name'}")},
4538                                       "history");
4539                 }
4540                 print "</td>\n";
4541         } else {
4542                 # unknown object: we can only present history for it
4543                 # (this includes 'commit' object, i.e. submodule support)
4544                 print "<td class=\"list\">" .
4545                       esc_path($t->{'name'}) .
4546                       "</td>\n";
4547                 print "<td class=\"link\">";
4548                 if (defined $hash_base) {
4549                         print $cgi->a({-href => href(action=>"history",
4550                                                      hash_base=>$hash_base,
4551                                                      file_name=>"$basedir$t->{'name'}")},
4552                                       "history");
4553                 }
4554                 print "</td>\n";
4555         }
4556 }
4557
4558 ## ......................................................................
4559 ## functions printing large fragments of HTML
4560
# Fill in the pre-image (per-parent) filenames of a merge (combined) diff entry
#
# $diff    - hashref of a parsed combined difftree line; its 'nparents',
#            'status' and 'from_id' entries are read, 'from_file' is replaced
# @parents - parent commit ids, indexed like the per-parent arrays in $diff
#
# Only parents whose status is rename (R) or copy (C) get a name, looked up
# with git_get_path_by_hash(); every other slot stays undefined.
# Returns the very same $diff hashref, modified in place.
sub fill_from_file_info {
	my ($diff, @parents) = @_;

	# one slot per parent, all of them undefined to begin with
	my $from_file = $diff->{'from_file'} = [ ];
	$from_file->[$diff->{'nparents'} - 1] = undef;

	foreach my $n (0 .. $diff->{'nparents'} - 1) {
		my $status = $diff->{'status'}[$n];
		next unless ($status eq 'R' || $status eq 'C');

		$from_file->[$n] =
			git_get_path_by_hash($parents[$n], $diff->{'from_id'}[$n]);
	}

	return $diff;
}
4577
# Tell whether a parsed raw difftree line describes a file deletion
#
# $diffinfo - hashref of parsed raw diff format; only 'to_id' is examined
#
# A deletion is recorded with an all-zero post-image object id.  Both the
# 40 hex digit (SHA-1) and the 64 hex digit (SHA-256) null ids are recognized.
# Returns true for a deletion, false otherwise.
sub is_deleted {
	my $diffinfo = shift;
	my $to_id = $diffinfo->{'to_id'};

	return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4584
# Check whether a patch belongs to the [previous] raw difftree line, i.e.
# whether it is a continuation of a patch that was split in two
#
# $diffinfo  - hashref of parsed raw diff format (may be undef)
# $patchinfo - hashref of parsed patch diff format, with the same keys
#              as $diffinfo (may be undef)
#
# Returns true only if both are defined and name the same 'to_file'.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	# nothing to compare against: cannot be a continuation
	return !1 unless defined $diffinfo && defined $patchinfo;

	return $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4595
4596
# Print the table of files changed by a commit (the "difftree")
#
# $difftree - arrayref of raw difftree lines; each one is handed to
#             parsed_difftree_line()
# $hash     - id of the commit being shown; used as hash_base for links
#             to the post-image (result) side
# @parents  - parent commit ids; the first one is used as hash_base for
#             links to the pre-image side of an ordinary diff, and more
#             than one parent selects the combined (merge) diff layout
#
# Reads the global $action (rows link to "patchN" anchors only in the
# 'commitdiff' view) and prints through the global $cgi object.
# One table row is printed per difftree entry, in alternating
# "dark"/"light" classes.
sub git_difftree_body {
	my ($difftree, $hash, @parents) = @_;
	my ($parent) = $parents[0];
	my $have_blame = gitweb_check_feature('blame');
	print "<div class=\"list_head\">\n";
	if ($#{$difftree} > 10) {
		print(($#{$difftree} + 1) . " files changed:\n");
	}
	print "</div>\n";

	print "<table class=\"" .
	      (@parents > 1 ? "combined " : "") .
	      "diff_tree\">\n";

	# header only for combined diff in 'commitdiff' view
	my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
	if ($has_header) {
		# table header
		print "<thead><tr>\n" .
		       "<th></th><th></th>\n"; # filename, patchN link
		for (my $i = 0; $i < @parents; $i++) {
			my $par = $parents[$i];
			print "<th>" .
			      $cgi->a({-href => href(action=>"commitdiff",
			                             hash=>$hash, hash_parent=>$par),
			               -title => 'commitdiff to parent number ' .
			                          ($i+1) . ': ' . substr($par,0,7)},
			              $i+1) .
			      "&nbsp;</th>\n";
		}
		print "</tr></thead>\n<tbody>\n";
	}

	my $alternate = 1;
	# running number of the patch the next "patch" link points at
	my $patchno = 0;
	foreach my $line (@{$difftree}) {
		my $diff = parsed_difftree_line($line);

		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;

		if (exists $diff->{'nparents'}) { # combined diff

			fill_from_file_info($diff, @parents)
				unless exists $diff->{'from_file'};

			if (!is_deleted($diff)) {
				# file exists in the result (child) commit
				print "<td>" .
				      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash),
				              -class => "list"}, esc_path($diff->{'to_file'})) .
				      "</td>\n";
			} else {
				print "<td>" .
				      esc_path($diff->{'to_file'}) .
				      "</td>\n";
			}

			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print "<td class=\"link\">" .
				      $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | " .
				      "</td>\n";
			}

			# one cell per parent; meanwhile work out which of the
			# trailing "blob" / "history" links make sense
			my $has_history = 0;
			my $not_deleted = 0;
			for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
				my $hash_parent = $parents[$i];
				my $from_hash = $diff->{'from_id'}[$i];
				my $from_path = $diff->{'from_file'}[$i];
				my $status = $diff->{'status'}[$i];

				$has_history ||= ($status ne 'A');
				$not_deleted ||= ($status ne 'D');

				if ($status eq 'A') {
					print "<td  class=\"link\" align=\"right\"> | </td>\n";
				} elsif ($status eq 'D') {
					print "<td class=\"link\">" .
					      $cgi->a({-href => href(action=>"blob",
					                             hash_base=>$hash,
					                             hash=>$from_hash,
					                             file_name=>$from_path)},
					              "blob" . ($i+1)) .
					      " | </td>\n";
				} else {
					if ($diff->{'to_id'} eq $from_hash) {
						print "<td class=\"link nochange\">";
					} else {
						print "<td class=\"link\">";
					}
					print $cgi->a({-href => href(action=>"blobdiff",
					                             hash=>$diff->{'to_id'},
					                             hash_parent=>$from_hash,
					                             hash_base=>$hash,
					                             hash_parent_base=>$hash_parent,
					                             file_name=>$diff->{'to_file'},
					                             file_parent=>$from_path)},
					              "diff" . ($i+1)) .
					      " | </td>\n";
				}
			}

			print "<td class=\"link\">";
			if ($not_deleted) {
				print $cgi->a({-href => href(action=>"blob",
				                             hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "blob");
				print " | " if ($has_history);
			}
			if ($has_history) {
				print $cgi->a({-href => href(action=>"history",
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "history");
			}
			print "</td>\n";

			print "</tr>\n";
			next; # instead of 'else' clause, to avoid extra indent
		}
		# else ordinary diff

		# an all-zero mode marks a side that does not exist; the
		# corresponding variables are then left undefined
		my ($to_mode_oct, $to_mode_str, $to_file_type);
		my ($from_mode_oct, $from_mode_str, $from_file_type);
		if ($diff->{'to_mode'} ne ('0' x 6)) {
			$to_mode_oct = oct $diff->{'to_mode'};
			if (S_ISREG($to_mode_oct)) { # only for regular file
				$to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
			}
			$to_file_type = file_type($diff->{'to_mode'});
		}
		if ($diff->{'from_mode'} ne ('0' x 6)) {
			$from_mode_oct = oct $diff->{'from_mode'};
			if (S_ISREG($from_mode_oct)) { # only for regular file
				$from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
			}
			$from_file_type = file_type($diff->{'from_mode'});
		}

		if ($diff->{'status'} eq "A") { # created
			my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
			$mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
			$mode_chng   .= "]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			              "blob");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "D") { # deleted
			# the file exists only in the parent, so links are based on $parent
			my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'}),
			               -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
			my $mode_chnge = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				$mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
				if ($from_file_type ne $to_file_type) {
					$mode_chnge .= " from $from_file_type to $to_file_type";
				}
				if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
					if ($from_mode_str && $to_mode_str) {
						$mode_chnge .= " mode: $from_mode_str->$to_mode_str";
					} elsif ($to_mode_str) {
						$mode_chnge .= " mode: $to_mode_str";
					}
				}
				$mode_chnge .= "]</span>\n";
			}
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chnge</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only mode changed)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "diff") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			               "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
			my %status_name = ('R' => 'moved', 'C' => 'copied');
			my $nstatus = $status_name{$diff->{'status'}};
			my $mode_chng = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				# mode also for directories, so we cannot use $to_mode_str
				$mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
			}
			print "<td>" .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
			                             hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
			              -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
			      "<td><span class=\"file_status $nstatus\">[$nstatus from " .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
			                             hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
			              -class => "list"}, esc_path($diff->{'from_file'})) .
			      " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
			      "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only pure rename or copy)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
				              "diff") .
				      " | ";
			}
			# the post-image (to_id / to_file) belongs to $hash, not to
			# $parent: same base as the file name link in the first column
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'to_file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'to_file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                            file_name=>$diff->{'to_file'})},
			              "history");
			print "</td>\n";

		} # we should not encounter Unmerged (U) or Unknown (X) status
		print "</tr>\n";
	}
	print "</tbody>" if $has_header;
	print "</table>\n";
}
4904
# Print one chunk of a patch in side-by-side layout
#
# @_ - list of [ $class, $line ] pairs; $class is 'chunk_header', 'ctx',
#      'rem', 'add' or 'incomplete', and $line is printed as given
#
# Chunk header lines are printed as they come.  Runs of context lines are
# printed in both the "old" and the "new" column; runs of removed and/or
# added lines are printed as one "rem", "add" or "chg" block, removed lines
# in the "old" column and added lines in the "new" one.
sub print_sidebyside_diff_chunk {
	my @chunk = @_;

	return unless @chunk;

	# an incomplete last line might be among removed or added lines, or
	# both, or among context lines: it takes the class of the line before it
	# (this rewrites the class stored in the caller's [class, line] pair)
	foreach my $n (1 .. $#chunk) {
		next unless $chunk[$n][0] eq 'incomplete';
		$chunk[$n][0] = $chunk[$n-1][0];
	}

	my (@context, @removed, @added);
	my %accumulator_for = (
		'ctx' => \@context,
		'rem' => \@removed,
		'add' => \@added,
	);

	# wrap the given lines in one column ("old" or "new") of a block
	my $column = sub {
		my ($side, @lines) = @_;
		return "<div class=\"$side\">" . join('', @lines) . '</div>';
	};

	# the trailing empty pair is a guardian: it flushes whatever is still
	# accumulated once the real lines are exhausted
	foreach my $entry (@chunk, ["", ""]) {
		my ($class, $line) = @$entry;

		# chunk headers go out as they are
		if ($class && $class eq 'chunk_header') {
			print $line;
			next;
		}

		my $at_end = !$class;

		# flush context lines when a rem/add block starts, or at end of chunk
		if (@context && ($at_end || $class eq 'rem' || $class eq 'add')) {
			print '<div class="chunk_block ctx">' .
			      $column->('old', @context) .
			      $column->('new', @context) .
			      '</div>';
			@context = ();
		}

		# flush rem/add lines when a context block starts, or at end of chunk
		if ((@removed || @added) && ($at_end || $class eq 'ctx')) {
			my $kind;
			if (!@added) {
				$kind = 'rem'; # pure removal
			} elsif (!@removed) {
				$kind = 'add'; # pure addition
			} else {
				$kind = 'chg'; # assume that it is change
			}
			print "<div class=\"chunk_block $kind\">" .
			      (@removed ? $column->('old', @removed) : '') .
			      (@added   ? $column->('new', @added)   : '') .
			      '</div>';
			@removed = @added = ();
		}

		# guardian value (or an empty line) ends the chunk
		last unless $line;

		# remember the line until its block is complete
		push @{$accumulator_for{$class}}, $line
			if exists $accumulator_for{$class};
	}
}
4993
4994 sub git_patchset_body {
4995         my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;
4996         my ($hash_parent) = $hash_parents[0];
4997
4998         my $is_combined = (@hash_parents > 1);
4999         my $patch_idx = 0;
5000         my $patch_number = 0;
5001         my $patch_line;
5002         my $diffinfo;
5003         my $to_name;
5004         my (%from, %to);
5005         my @chunk; # for side-by-side diff
5006
5007         print "<div class=\"patchset\">\n";
5008
5009         # skip to first patch
5010         while ($patch_line = <$fd>) {
5011                 chomp $patch_line;
5012
5013                 last if ($patch_line =~ m/^diff /);
5014         }
5015
5016  PATCH:
5017         while ($patch_line) {
5018
5019                 # parse "git diff" header line
5020                 if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
5021                         # $1 is from_name, which we do not use
5022                         $to_name = unquote($2);
5023                         $to_name =~ s!^b/!!;
5024                 } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
5025                         # $1 is 'cc' or 'combined', which we do not use
5026                         $to_name = unquote($2);
5027                 } else {
5028                         $to_name = undef;
5029                 }
5030
5031                 # check if current patch belong to current raw line
5032                 # and parse raw git-diff line if needed
5033                 if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
5034                         # this is continuation of a split patch
5035                         print "<div class=\"patch cont\">\n";
5036                 } else {
5037                         # advance raw git-diff output if needed
5038                         $patch_idx++ if defined $diffinfo;
5039
5040                         # read and prepare patch information
5041                         $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5042
5043                         # compact combined diff output can have some patches skipped
5044                         # find which patch (using pathname of result) we are at now;
5045                         if ($is_combined) {
5046                                 while ($to_name ne $diffinfo->{'to_file'}) {
5047                                         print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5048                                               format_diff_cc_simplified($diffinfo, @hash_parents) .
5049                                               "</div>\n";  # class="patch"
5050
5051                                         $patch_idx++;
5052                                         $patch_number++;
5053
5054                                         last if $patch_idx > $#$difftree;
5055                                         $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5056                                 }
5057                         }
5058
5059                         # modifies %from, %to hashes
5060                         parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);
5061
5062                         # this is first patch for raw difftree line with $patch_idx index
5063                         # we index @$difftree array from 0, but number patches from 1
5064                         print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
5065                 }
5066
5067                 # git diff header
5068                 #assert($patch_line =~ m/^diff /) if DEBUG;
5069                 #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
5070                 $patch_number++;
5071                 # print "git diff" header
5072                 print format_git_diff_header_line($patch_line, $diffinfo,
5073                                                   \%from, \%to);
5074
5075                 # print extended diff header
5076                 print "<div class=\"diff extended_header\">\n";
5077         EXTENDED_HEADER:
5078                 while ($patch_line = <$fd>) {
5079                         chomp $patch_line;
5080
5081                         last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);
5082
5083                         print format_extended_diff_header_line($patch_line, $diffinfo,
5084                                                                \%from, \%to);
5085                 }
5086                 print "</div>\n"; # class="diff extended_header"
5087
5088                 # from-file/to-file diff header
5089                 if (! $patch_line) {
5090                         print "</div>\n"; # class="patch"
5091                         last PATCH;
5092                 }
5093                 next PATCH if ($patch_line =~ m/^diff /);
5094                 #assert($patch_line =~ m/^---/) if DEBUG;
5095
5096                 my $last_patch_line = $patch_line;
5097                 $patch_line = <$fd>;
5098                 chomp $patch_line;
5099                 #assert($patch_line =~ m/^\+\+\+/) if DEBUG;
5100
5101                 print format_diff_from_to_header($last_patch_line, $patch_line,
5102                                                  $diffinfo, \%from, \%to,
5103                                                  @hash_parents);
5104
5105                 # the patch itself
5106         LINE:
5107                 while ($patch_line = <$fd>) {
5108                         chomp $patch_line;
5109
5110                         next PATCH if ($patch_line =~ m/^diff /);
5111
5112                         my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
5113                         my $diff_classes = "diff";
5114                         $diff_classes .= " $class" if ($class);
5115                         $line = "<div class=\"$diff_classes\">$line</div>\n";
5116
5117                         if ($diff_style eq 'sidebyside' && !$is_combined) {
5118                                 if ($class eq 'chunk_header') {
5119                                         print_sidebyside_diff_chunk(@chunk);
5120                                         @chunk = ( [ $class, $line ] );
5121                                 } else {
5122                                         push @chunk, [ $class, $line ];
5123                                 }
5124                         } else {
5125                                 # default 'inline' style and unknown styles
5126                                 print $line;
5127                         }
5128                 }
5129
5130         } continue {
5131                 if (@chunk) {
5132                         print_sidebyside_diff_chunk(@chunk);
5133                         @chunk = ();
5134                 }
5135                 print "</div>\n"; # class="patch"
5136         }
5137
5138         # for compact combined (--cc) format, with chunk and patch simplification
5139         # the patchset might be empty, but there might be unprocessed raw lines
5140         for (++$patch_idx if $patch_number > 0;
5141              $patch_idx < @$difftree;
5142              ++$patch_idx) {
5143                 # read and prepare patch information
5144                 $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5145
5146                 # generate anchor for "patch" links in difftree / whatchanged part
5147                 print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5148                       format_diff_cc_simplified($diffinfo, @hash_parents) .
5149                       "</div>\n";  # class="patch"
5150
5151                 $patch_number++;
5152         }
5153
5154         if ($patch_number == 0) {
5155                 if (@hash_parents > 1) {
5156                         print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
5157                 } else {
5158                         print "<div class=\"diff nodifferences\">No differences found</div>\n";
5159                 }
5160         }
5161
5162         print "</div>\n"; # class="patchset"
5163 }
5164
5165 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5166
# Print the "search projects" form shown on the projects list page.
#
# Parameters (both optional):
#   $searchtext        - text to pre-fill the search field with
#   $search_use_regexp - true if the 're' (regexp) checkbox starts checked
#
# Reads the globals $cgi, $my_uri and $project_filter and prints the
# form directly; returns nothing useful.
sub git_project_search_form {
        # Take the values from the caller: a bare declaration would leave both
        # undefined, so the form could never be pre-filled explicitly.
        my ($searchtext, $search_use_regexp) = @_;

        my $limit = '';
        if ($project_filter) {
                $limit = " in '$project_filter/'";
        }

        print "<div class=\"projsearch\">\n";
        # start_form pairs with end_form used below; the legacy 'startform'
        # spelling is not available in newer CGI.pm releases
        print $cgi->start_form(-method => 'get', -action => $my_uri) .
              $cgi->hidden(-name => 'a', -value => 'project_list')  . "\n";
        print $cgi->hidden(-name => 'pf', -value => $project_filter). "\n"
                if (defined $project_filter);
        print $cgi->textfield(-name => 's', -value => $searchtext,
                              -title => "Search project by name and description$limit",
                              -size => 60) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>\n" .
              $cgi->submit(-name => 'btnS', -value => 'Search') .
              $cgi->end_form() . "\n" .
              # link that drops the search text but keeps the project filter
              $cgi->a({-href => href(project => undef, searchtext => undef,
                                     project_filter => $project_filter)},
                      esc_html("List all projects$limit")) . "<br />\n";
        print "</div>\n";
}
5194
# Tell whether a project entry still lacks any of the requested fields.
#
# Returns 1 as soon as one of @keys does not exist in %$project_info,
# and an empty list / undef otherwise (also when @keys is empty).
# Only the presence of a key matters, not whether its value is defined.
sub project_info_needs_filling {
        my ($project_info, @keys) = @_;

        for my $wanted (@keys) {
                return 1 unless exists $project_info->{$wanted};
        }

        # every requested key is already present
        return;
}
5208
# Fill in per-project information (age, description, owner, ctags,
# category) for every project in the list.
#
# With no extra arguments all fields are filled; with a list of field
# names only those fields are considered.  A field group is (re)computed
# only when at least one of its wanted keys is missing from the entry.
#
# Projects for which git_get_last_activity() returns nothing are left
# out of the returned list.  That check only happens when 'age' or
# 'age_string' has to be filled, so it is the only way an entry is
# dropped.
#
# USAGE:
# * fill_project_list_info(\@project_list, 'descr_long', 'ctags')
#   makes sure 'descr_long' and 'ctags' are filled
# * @project_list = fill_project_list_info(\@project_list)
#   makes sure every field is filled (and drops invalid projects)
#
# NOTE: the entries of $projlist are modified in place, but no entry is
# removed from $projlist itself; only the returned list is shortened.
sub fill_project_list_info {
        my ($projlist, @wanted_keys) = @_;

        # selector for the keys the caller is interested in:
        # identity when nothing specific was requested
        my %is_wanted = map { $_ => 1 } @wanted_keys;
        my $filter_set = @wanted_keys
                ? sub { return grep { $is_wanted{$_} } @_; }
                : sub { return @_; };

        my $show_ctags = gitweb_check_feature('ctags');
        my @projects;

 PROJECT:
        foreach my $pr (@$projlist) {
                if (project_info_needs_filling($pr, $filter_set->('age', 'age_string'))) {
                        my @activity = git_get_last_activity($pr->{'path'});
                        # no activity information: skip this project
                        next PROJECT unless @activity;
                        @{$pr}{'age', 'age_string'} = @activity;
                }

                if (project_info_needs_filling($pr, $filter_set->('descr', 'descr_long'))) {
                        my $descr = to_utf8(git_get_project_description($pr->{'path'}) || "");
                        $pr->{'descr_long'} = $descr;
                        $pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
                }

                if (project_info_needs_filling($pr, $filter_set->('owner'))) {
                        $pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
                }

                if ($show_ctags &&
                    project_info_needs_filling($pr, $filter_set->('ctags'))) {
                        $pr->{'ctags'} = git_get_project_ctags($pr->{'path'});
                }

                if ($projects_list_group_categories &&
                    project_info_needs_filling($pr, $filter_set->('category'))) {
                        my $cat = git_get_project_category($pr->{'path'}) ||
                                  $project_list_default_category;
                        $pr->{'category'} = to_utf8($cat);
                }

                push @projects, $pr;
        }

        return @projects;
}
5269
# Return the projects of @$projlist sorted according to $order.
#
# Known orders are 'project' (by path), 'descr' (by long description),
# 'owner' (all three compared as strings) and 'age' (compared as a
# number).  For any other $order the list is returned unchanged.
# The input array itself is never modified.
sub sort_projects_list {
        my ($projlist, $order) = @_;

        # sort order name => project field to compare and how to compare it
        my %order_info = (
                project => { key => 'path', type => 'str' },
                descr => { key => 'descr_long', type => 'str' },
                owner => { key => 'owner', type => 'str' },
                age => { key => 'age', type => 'num' }
        );

        my $oi = $order_info{$order};
        return @$projlist unless defined $oi;

        my $field = $oi->{'key'};
        my $compare = $oi->{'type'} eq 'str'
                ? sub { $_[0]->{$field} cmp $_[1]->{$field} }
                : sub { $_[0]->{$field} <=> $_[1]->{$field} };

        # sort into an array first, so that the result is well defined
        # in scalar context too
        my @projects = sort { $compare->($a, $b) } @$projlist;
        return @projects;
}
5290
# Group the projects $projlist->[$from .. $to] by their 'category' field.
#
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# Returns a hash (in list context) or a hash reference (otherwise) that
# maps each category to an array ref of the projects in it, in their
# original relative order.
sub build_projlist_by_category {
        my ($projlist, $from, $to) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my %categories;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];
                push @{$categories{ $pr->{'category'} }}, $pr;
        }

        return \%categories unless wantarray;
        return %categories;
}
5307
# Print the 'sort by' <th> element built by format_sort_th();
# takes the same ($name, $order, $header) arguments.
sub print_sort_th {
        my ($name, $order, $header) = @_;
        print format_sort_th($name, $order, $header);
}
5313
# Build the <th> element for a sortable column.
#
#   $name   - name of the sort order this column stands for
#   $order  - sort order currently in effect
#   $header - column caption; defaults to ucfirst($name) when false
#
# The caption is plain text when the column is the current sort order,
# and a link replaying the current view with order=$name otherwise.
# $header is inserted as is, without HTML escaping.
sub format_sort_th {
        my ($name, $order, $header) = @_;
        $header ||= ucfirst($name);

        # already sorted by this column: nothing to link to
        return "<th>$header</th>\n" if $order eq $name;

        my $sort_link = $cgi->a({-href => href(-replay=>1, order=>$name),
                                 -class => "header"}, $header);
        return "<th>" . $sort_link . "</th>\n";
}
5330
# Print the table rows (<tr>) for projects $projlist->[$from .. $to].
#
# $from defaults to 0; $to defaults to (and is capped at) the last index.
# When $check_forks is true every row starts with an extra cell that
# holds a "+" marker for projects which have a 'forks' entry.
# Rows alternate between the "dark" and "light" classes, starting dark.
sub git_project_list_rows {
        my ($projlist, $from, $to, $check_forks) = @_;

        $from = 0 unless defined $from;
        $to = $#$projlist if (!defined $to || $#$projlist < $to);

        my $alternate = 1;
        foreach my $idx ($from .. $to) {
                my $pr = $projlist->[$idx];

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                if ($check_forks) {
                        print "<td>";
                        if ($pr->{'forks'}) {
                                my $nforks = scalar @{$pr->{'forks'}};
                                my $marker;
                                if ($nforks > 0) {
                                        # link to the list of forks
                                        $marker = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks"),
                                                           -title => "$nforks forks"}, "+");
                                } else {
                                        $marker = $cgi->span({-title => "$nforks forks"}, "+");
                                }
                                print $marker;
                        }
                        print "</td>\n";
                }

                # project name, description and owner cells
                my $name_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                         -class => "list"}, esc_html($pr->{'path'}));
                my $descr_link = $cgi->a({-href => href(project=>$pr->{'path'}, action=>"summary"),
                                          -class => "list", -title => $pr->{'descr_long'}},
                                         esc_html($pr->{'descr'}));
                print "<td>" . $name_link . "</td>\n" .
                      "<td>" . $descr_link . "</td>\n" .
                      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";

                # age cell
                my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
                print "<td class=\"". age_class($pr->{'age'}) . "\">" . $age_text . "</td>\n";

                # per-project action links, "forks" only where applicable
                my @links;
                foreach my $action ("summary", "shortlog", "log", "tree") {
                        push @links, $cgi->a({-href => href(project=>$pr->{'path'}, action=>$action)}, $action);
                }
                if ($pr->{'forks'}) {
                        push @links, $cgi->a({-href => href(project=>$pr->{'path'}, action=>"forks")}, "forks");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
                      "</tr>\n";
        }
}
5379
# Print the projects table (and, if enabled, the tag cloud) for a list
# of projects.
#
#   $projlist  - array ref of project entries (not modified; a copy of
#                the list is filtered, filled and sorted)
#   $order     - sort order; defaults to $default_projects_order
#   $from, $to - window of the final list to show; default to the
#                whole list, $to is capped at the last index
#   $extra     - if defined, printed (unescaped) in a final table row
#   $no_header - if true, the header row with sort links is omitted
#
# Reads the globals $cgi, $searchtext, %input_params,
# $default_projects_order and $projects_list_group_categories.
# Prints a "No such projects found" notice instead of a table when the
# window is empty.
sub git_project_list_body {
        my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
        my @projects = @$projlist;

        my $check_forks = gitweb_check_feature('forks');
        my $show_ctags  = gitweb_check_feature('ctags');
        my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
        # fork handling is switched off while searching or filtering by tag
        $check_forks = undef
                if ($tagfilter || $searchtext);

        # filtering out forks before filling info allows to do less work
        @projects = filter_forks_from_projects_list(\@projects)
                if ($check_forks);
        # search_projects_list pre-fills required info
        @projects = search_projects_list(\@projects,
                                         'searchtext' => $searchtext,
                                         'tagfilter'  => $tagfilter)
                if ($tagfilter || $searchtext);
        # fill the rest
        @projects = fill_project_list_info(\@projects);

        $order ||= $default_projects_order;
        $from = 0 unless defined $from;
        $to = $#projects if (!defined $to || $#projects < $to);

        # short circuit
        if ($from > $to) {
                print "<center>\n".
                      "<b>No such projects found</b><br />\n".
                      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
                      "</center>\n<br />\n";
                return;
        }

        @projects = sort_projects_list(\@projects, $order);

        if ($show_ctags) {
                my $ctags = git_gather_all_ctags(\@projects);
                my $cloud = git_populate_project_tagcloud($ctags);
                print git_show_project_tagcloud($cloud, 64);
        }

        print "<table class=\"project_list\">\n";
        unless ($no_header) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<th></th>\n";
                }
                print_sort_th('project', $order, 'Project');
                print_sort_th('descr', $order, 'Description');
                print_sort_th('owner', $order, 'Owner');
                print_sort_th('age', $order, 'Last Change');
                print "<th></th>\n" . # for links
                      "</tr>\n";
        }

        if ($projects_list_group_categories) {
                # only display categories with projects in the $from-$to window
                @projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
                # @projects now holds just that window, re-indexed from 0, so
                # the whole array is grouped; applying $from/$to a second time
                # would drop the first $from projects of the window
                my %categories = build_projlist_by_category(\@projects);
                foreach my $cat (sort keys %categories) {
                        # projects without a category get no heading row
                        unless ($cat eq "") {
                                print "<tr>\n";
                                if ($check_forks) {
                                        print "<td></td>\n";
                                }
                                print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
                                print "</tr>\n";
                        }

                        git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
                }
        } else {
                git_project_list_rows(\@projects, $from, $to, $check_forks);
        }

        if (defined $extra) {
                print "<tr>\n";
                if ($check_forks) {
                        print "<td></td>\n";
                }
                print "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5467
# Print the 'log' view entries for commits $commitlist->[$from .. $to].
#
#   $commitlist - array ref of parsed commits (hash refs); empty
#                 entries are skipped
#   $from, $to  - window to show; $from defaults to 0, $to defaults to
#                 (and is capped at) the last index
#   $refs       - passed to format_ref_marker() for each commit
#   $extra      - if true, printed (unescaped) in a trailing
#                 "page_nav" div
#
# Relies on global state such as $cgi; the links built by href() carry
# no explicit project (presumably taken from the current request).
sub git_log_body {
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        # honour $from, as the shortlog/history/tags/heads bodies do
        for (my $i = $from; $i <= $to; $i++) {
                my %co = %{$commitlist->[$i]};
                next if !%co;
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);
                git_print_header_div('commit',
                               "<span class=\"age\">$co{'age_string'}</span>" .
                               esc_html($co{'title'}) . $ref,
                               $commit);
                print "<div class=\"title_text\">\n" .
                      "<div class=\"log_link\">\n" .
                      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
                      "<br/>\n" .
                      "</div>\n";
                # authorship goes inside the still open "title_text" div
                git_print_authorship(\%co, -tag => 'span');
                print "<br/>\n</div>\n";

                print "<div class=\"log_body\">\n";
                git_print_log($co{'comment'}, -final_empty_line=> 1);
                print "</div>\n";
        }
        if ($extra) {
                print "<div class=\"page_nav\">\n";
                print "$extra\n";
                print "</div>\n";
        }
}
5506
# Print the 'shortlog' table for commits $commitlist->[$from .. $to].
#
#   $from, $to - window to show; $from defaults to 0, $to defaults to
#                (and is capped at) the last index
#   $refs      - passed to format_ref_marker() for each commit
#   $extra     - if defined, printed (unescaped) in a final table row
#
# Rows alternate between the "dark" and "light" classes, starting dark.
# Relies on global state such as $cgi.
sub git_shortlog_body {
        my ($commitlist, $from, $to, $refs, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        print "<table class=\"shortlog\">\n";
        my $alternate = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                # date (age as tooltip), author, then the subject cell
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 10) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                # action links
                my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit");
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", $commit_link, $diff_link, $tree_link);

                my $snapshot_links = format_snapshot_links($commit);
                print " | " . $snapshot_links
                        if defined $snapshot_links;

                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5550
# Print the 'history' table of a file or directory for commits
# $commitlist->[$from .. $to].
#
#   $from, $to  - window to show; $from defaults to 0, $to defaults to
#                 (and is capped at) the last index
#   $refs       - passed to format_ref_marker() for each commit
#   $extra      - if defined, printed (unescaped) in a final table row
#   $file_name  - path whose history is shown
#   $file_hash  - hash of the current version of the file (may be undef)
#   $ftype      - object type, used both as link action and link text
#
# Warning: assumes the type (blob or tree) stays the same throughout
# the history.  Empty commit entries are skipped.  Also reads the
# globals $cgi and $hash_base.
sub git_history_body {
        my ($commitlist, $from, $to, $refs, $extra,
            $file_name, $file_hash, $ftype) = @_;

        $from = 0 unless defined $from;
        $to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

        print "<table class=\"history\">\n";
        my $alternate = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                my $commit = $co{'id'};
                my $ref = format_ref_marker($refs, $commit);

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                # the author column is wider here than in the shortlog view
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 3) . "<td>";
                print format_subject_html($co{'title'}, $co{'title_short'},
                                          href(action=>"commit", hash=>$commit), $ref);

                my $object_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
                my $diff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $object_link . " | " . $diff_link;

                if ($ftype eq 'blob') {
                        # offer a diff only when this version differs from the current one
                        my $blob_parent = git_get_hash_by_path($commit, $file_name);
                        if (defined $file_hash && defined $blob_parent &&
                            $file_hash ne $blob_parent) {
                                print " | " .
                                        $cgi->a({-href => href(action=>"blobdiff",
                                                               hash=>$file_hash, hash_parent=>$blob_parent,
                                                               hash_base=>$hash_base, hash_parent_base=>$commit,
                                                               file_name=>$file_name)},
                                                "diff to current");
                        }
                }
                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"4\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5610
# Print the 'tags' table for entries $taglist->[$from .. $to].
#
#   $from, $to - window to show; $from defaults to 0, $to defaults to
#                (and is capped at) the last index
#   $extra     - if defined, printed (unescaped) in a final table row
#
# Each row shows the age, the tag name linking to the tagged object,
# the (shortened) subject if there is one, a "tag" self link for tag
# objects, and links that depend on the type of the tagged object.
# Relies on global state such as $cgi.
sub git_tags_body {
        my ($taglist, $from, $to, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$taglist} if (!defined $to || $#{$taglist} < $to);

        print "<table class=\"tags\">\n";
        my $alternate = 1;
        foreach my $idx ($from .. $to) {
                my %tag = %{$taglist->[$idx]};
                my $comment = $tag{'subject'};
                my $comment_short = defined $comment ? chop_str($comment, 30, 5) : undef;

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                # age cell, left empty when the age is unknown
                print defined $tag{'age'} ? "<td><i>$tag{'age'}</i></td>\n" : "<td></td>\n";

                # tag name, linking to the object the tag points to
                print "<td>" .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
                               -class => "list name"}, esc_html($tag{'name'})) .
                      "</td>\n" .
                      "<td>";
                print format_subject_html($comment, $comment_short,
                                          href(action=>"tag", hash=>$tag{'id'}))
                        if defined $comment;
                print "</td>\n" .
                      "<td class=\"selflink\">";

                # only tag objects have a page of their own
                my $self_link = "&nbsp;";
                if ($tag{'type'} eq "tag") {
                        $self_link = $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
                }
                print $self_link;

                print "</td>\n" .
                      "<td class=\"link\">" . " | " .
                      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'});
                if ($tag{'reftype'} eq "commit") {
                        my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog");
                        my $log_link = $cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
                        print " | " . $shortlog_link .
                              " | " . $log_link;
                } elsif ($tag{'reftype'} eq "blob") {
                        print " | " . $cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
                }
                print "</td>\n" .
                      "</tr>";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"5\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5673
# Print the 'heads' table for entries $headlist->[$from .. $to].
#
#   $head_at   - id of the current head, if known; the name cell of
#                every head with that id gets the "current_head" class
#   $from, $to - window to show; $from defaults to 0, $to defaults to
#                (and is capped at) the last index
#   $extra     - if defined, printed (unescaped) in a final table row
#
# Rows alternate between the "dark" and "light" classes, starting dark.
# Relies on global state such as $cgi.
sub git_heads_body {
        my ($headlist, $head_at, $from, $to, $extra) = @_;

        $from = 0 unless defined $from;
        $to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

        print "<table class=\"heads\">\n";
        my $alternate = 1;
        foreach my $idx ($from .. $to) {
                my %ref = %{$headlist->[$idx]};
                my $curr = defined $head_at && $ref{'id'} eq $head_at;

                print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
                $alternate ^= 1;

                my $name_cell = $curr ? "<td class=\"current_head\">" : "<td>";
                my $name_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
                                         -class => "list name"},esc_html($ref{'name'}));
                my $shortlog_link = $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog");
                my $log_link = $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log");
                my $tree_link = $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree");

                print "<td><i>$ref{'age'}</i></td>\n" .
                      $name_cell . $name_link .
                      "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", $shortlog_link, $log_link, $tree_link) .
                      "</td>\n" .
                      "</tr>";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5711
# Display a single remote block: a table with the URLs of the remote,
# followed by the table of its heads.
#
#   $remote - name of the remote (used for the "..." link)
#   $rdata  - hash ref with the keys 'heads' (array ref), 'fetch' and
#             'push' (URLs, either may be undefined)
#   $limit  - if defined, at most this many heads are requested from
#             git_heads_body(), and a "..." link to the full 'remotes'
#             view is added when there are more heads than that
#   $head   - passed on to git_heads_body() as the current head
sub git_remote_block {
        my ($remote, $rdata, $limit, $head) = @_;

        my $heads = $rdata->{'heads'};
        my $fetch = $rdata->{'fetch'};
        my $push = $rdata->{'push'};

        my $urls_table = "<table class=\"projects_list\">\n" ;

        if (defined $fetch) {
                # $push may be undefined here; check before comparing so that a
                # missing push URL neither warns nor counts as equal to $fetch
                if (defined $push && $fetch eq $push) {
                        $urls_table .= format_repo_url("URL", $fetch);
                } else {
                        $urls_table .= format_repo_url("Fetch URL", $fetch);
                        $urls_table .= format_repo_url("Push URL", $push) if defined $push;
                }
        } elsif (defined $push) {
                $urls_table .= format_repo_url("Push URL", $push);
        } else {
                $urls_table .= format_repo_url("", "No remote URL");
        }

        $urls_table .= "</table>\n";

        # link to the complete list when not all heads are requested
        my $dots;
        if (defined $limit && $limit < @$heads) {
                $dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
        }

        print $urls_table;
        git_heads_body($heads, $head, 0, $limit, $dots);
}
5745
# Display a list of remote names with the respective fetch and push URLs
#
# Parameters:
#   $remotedata - hashref keyed by remote name; each value is a hashref
#                 whose 'fetch' and 'push' entries (possibly undefined)
#                 are used as link targets
#   $limit      - when true and smaller than the number of remotes, only
#                 the first $limit remotes (sorted by name) are printed,
#                 followed by a "..." row linking to the "remotes" view
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	# truncate the list to the first $limit names
	$#remotes = $limit - 1 if $limited;

	# A plain foreach is used instead of "while (my $r = shift @remotes)":
	# the latter ends the loop at the first remote whose name is false in
	# boolean context (e.g. a remote called "0").
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# a missing URL is rendered as plain text instead of a link
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
5789
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#
# Parameters:
#   $remotedata - hashref keyed by remote name
#   $limit      - when true and smaller than the number of remotes, only
#                 the name list is shown (via git_remotes_list()); it is
#                 also forwarded to git_remote_block() as the heads limit
#   $head       - forwarded to git_remote_block()
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;
	if ($limit and $limit < keys %$remotedata) {
		git_remotes_list($remotedata, $limit);
	} else {
		fill_remote_heads($remotedata);
		# Walk the remotes sorted by name, as git_remotes_list() does;
		# iterating with each() would emit the sections in hash order,
		# which is not stable between runs.
		foreach my $remote (sort keys %$remotedata) {
			my $rdata = $remotedata->{$remote};
			git_print_section({-class=>"remote", -id=>$remote},
				["remotes", $remote, $remote], sub {
					git_remote_block($remote, $rdata, $limit, $head);
				});
		}
	}
}
5806
# Show one page of commits found by searching commit messages, authors or
# committers (selected by the global $searchtype) for $searchtext.
#
# %co (passed as a flat list) is a parsed commit; its 'tree' and 'title'
# entries are used for the navigation bar and the header.  Results are
# paged 100 per page using the global $page; one extra commit is requested
# so that the presence of a following page can be detected.
sub git_search_message {
	my %co = @_;

	# git-log option prefix for each supported search type
	my %option_for = (
		'commit'    => "--grep=",
		'author'    => "--author=",
		'committer' => "--committer=",
	);
	my $greptype = $option_for{$searchtype};
	$greptype .= $searchtext;

	my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
	my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
	                               $greptype, '--regexp-ignore-case',
	                               $match_mode);

	# "first" / "prev" are links on every page except the first one
	my $paging_nav;
	if ($page > 0) {
		my $first_link = $cgi->a({-href => href(-replay=>1, page=>undef)},
		                         "first");
		my $prev_link  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
		                          -accesskey => "p", -title => "Alt-p"}, "prev");
		$paging_nav = $first_link . " &sdot; " . $prev_link;
	} else {
		$paging_nav = "first &sdot; prev";
	}

	# the 101st commit, if present, means there is another page
	my $next_link = '';
	if ($#commitlist >= 100) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
	}
	$paging_nav .= " &sdot; " . ($next_link ne '' ? $next_link : "next");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);
	if ($page == 0 && !@commitlist) {
		print "<p>No match.</p>\n";
	} else {
		git_search_grep_body(\@commitlist, 0, 99, $next_link);
	}

	git_footer_html();
}
5856
# Pickaxe search: list commits found by "git log -S<searchtext>" together
# with the files touched in each of them.
#
# %co (passed as a flat list) is a parsed commit used for the page header;
# once the header is printed the hash is reused to hold the commit whose
# table row is currently being written.
sub git_search_changes {
	my %co = @_;

	local $/ = "\n";
	my @pickaxe_opts = ("-S$searchtext");
	push @pickaxe_opts, '--pickaxe-regex' if $search_use_regexp;
	open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
		'--pretty=format:%H', '--no-abbrev', '--raw', @pickaxe_opts
			or die_error(500, "Open git-log failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"pickaxe search\">\n";
	my $alternate = 1;
	undef %co;

	# Closes the file-list cell of the commit currently held in %co and
	# appends its "commit | tree" link cell; does nothing if no commit
	# row has been opened yet.
	my $finish_commit_row = sub {
		return unless %co;
		my $commit_link = $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
		                          "commit");
		my $tree_link   = $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
		                                         hash_base=>$co{'id'})},
		                          "tree");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $commit_link . " | " . $tree_link .
		      "</td>\n" .
		      "</tr>\n";
	};

	while (my $line = <$fd>) {
		chomp $line;
		next unless $line;

		my %set = parse_difftree_raw_line($line);
		if (defined $set{'commit'}) {
			# a new commit starts: finish the previous row, open a new one
			$finish_commit_row->();

			print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
			$alternate ^= 1;

			%co = parse_commit($set{'commit'});
			my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
			print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
			      "<td><i>$author</i></td>\n" .
			      "<td>" .
			      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
			              -class => "list subject"},
			              chop_and_escape_str($co{'title'}, 50) . "<br/>");
		} elsif (defined $set{'to_id'}) {
			# an all-zero target id is skipped
			next if ($set{'to_id'} =~ m/^0{40}$/);

			my $blob_href = href(action=>"blob", hash_base=>$co{'id'},
			                     hash=>$set{'to_id'}, file_name=>$set{'to_file'});
			print $cgi->a({-href => $blob_href, -class => "list"},
			              "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
			      "<br/>\n";
		}
	}
	close $fd;

	# finish last commit
	$finish_commit_row->();

	print "</table>\n";

	git_footer_html();
}
5939
# Search the contents of a tree with "git grep" and print the matching
# lines grouped by file.
#
# %co (passed as a flat list) is a parsed commit; its 'tree' is the tree
# that is searched, 'id' is used as hash_base for the blob links and
# 'title' for the page header.  The loop stops after a little over 1000
# output lines and a "listing trimmed" notice is printed.
sub git_search_files {
	my %co = @_;

	local $/ = "\n";
	open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
		$search_use_regexp ? ('-E', '-i') : '-F',
		$searchtext, $co{'tree'}
			or die_error(500, "Open git-grep failed");

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);

	print "<table class=\"grep_search\">\n";
	my $alternate = 1;
	my $matches = 0;
	my $lastfile = '';
	my $file_href;
	while (my $line = <$fd>) {
		chomp $line;
		my ($file, $lno, $ltext, $binary);
		last if ($matches++ > 1000);
		if ($line =~ /^Binary file (.+) matches$/) {
			$file = $1;
			$binary = 1;
		} else {
			# with -z the fields are NUL-separated: file, line number, text
			($file, $lno, $ltext) = split(/\0/, $line, 3);
		}
		# Drop the leading "<tree>:" from the file name.  This used to be
		# done for text matches only; presumably the binary notice carries
		# the same prefix (the substitution is a no-op if it does not).
		$file =~ s/^\Q$co{'tree'}\E://;

		if ($file ne $lastfile) {
			# first match in a new file: close the previous row, open a new one
			print "</td></tr>\n" if $lastfile;
			# toggle the row class; the former "if ($alternate++)" test was
			# always true, so every row came out as "dark"
			if ($alternate) {
				print "<tr class=\"dark\">\n";
			} else {
				print "<tr class=\"light\">\n";
			}
			$alternate ^= 1;
			$file_href = href(action=>"blob", hash_base=>$co{'id'},
			                  file_name=>$file);
			print "<td class=\"list\">".
				$cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
			print "</td><td>\n";
			$lastfile = $file;
		}
		if ($binary) {
			print "<div class=\"binary\">Binary file</div>\n";
		} else {
			$ltext = untabify($ltext);
			# highlight the matched part of the line
			if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
				$ltext = esc_html($1, -nbsp=>1);
				$ltext .= '<span class="match">';
				$ltext .= esc_html($2, -nbsp=>1);
				$ltext .= '</span>';
				$ltext .= esc_html($3, -nbsp=>1);
			} else {
				$ltext = esc_html($ltext, -nbsp=>1);
			}
			print "<div class=\"pre\">" .
				$cgi->a({-href => $file_href.'#l'.$lno,
				        -class => "linenr"}, sprintf('%4i', $lno)) .
				' ' .  $ltext . "</div>\n";
		}
	}
	if ($lastfile) {
		print "</td></tr>\n";
		if ($matches > 1000) {
			print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
		}
	} else {
		print "<div class=\"diff nodifferences\">No matches found</div>\n";
	}
	close $fd;

	print "</table>\n";

	git_footer_html();
}
6017
# Print the result table of a commit search: one row per commit with its
# age, author, title, the comment lines matching $search_regexp (with the
# match highlighted) and commit / commitdiff / tree links.
#
# Parameters:
#   $commitlist - arrayref of parsed commits (hashrefs)
#   $from, $to  - index range to display; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $extra      - optional HTML put into a final row (e.g. a "next" link)
sub git_search_grep_body {
	my ($commitlist, $from, $to, $extra) = @_;

	my $last_index = $#{$commitlist};
	$from = 0 if !defined $from;
	$to = $last_index unless (defined $to && $to <= $last_index);

	print "<table class=\"commit_search\">\n";
	my $alternate = 1;
	foreach my $i ($from .. $to) {
		my %co = %{$commitlist->[$i]};
		next unless %co;

		my $commit = $co{'id'};
		print "<tr class=\"" . ($alternate ? "dark" : "light") . "\">\n";
		$alternate ^= 1;

		my $subject_link =
			$cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
			         -class => "list subject"},
			        chop_and_escape_str($co{'title'}, 50) . "<br/>");
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 15, 5) .
		      "<td>" .
		      $subject_link;

		my $comment = $co{'comment'};
		foreach my $line (@$comment) {
			next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
			my ($lead, $match, $trail) = ($1, $2, $3);

			# shorten the match, then give the text on each side an
			# equal share of what is left of 80 characters (30 at most)
			$match = chop_str($match, 70, 5, 'center');
			my $contextlen = int((80 - length($match))/2);
			$contextlen = 30 if ($contextlen > 30);
			$lead  = chop_str($lead,  $contextlen, 10, 'left');
			$trail = chop_str($trail, $contextlen, 10, 'right');

			$_ = esc_html($_) for ($lead, $match, $trail);

			print "$lead<span class=\"match\">$match</span>$trail<br />";
		}

		my @links = (
			$cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit"),
			$cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff"),
			$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree"),
		);
		print "</td>\n" .
		      "<td class=\"link\">" .
		      join(" | ", @links);
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
6077
6078 ## ======================================================================
6079 ## ======================================================================
6080 ## actions
6081
# "project_list" action: print the list of projects, preceded by the
# optional $home_text include and the project search form.
#
# The optional 'order' input parameter must be exactly one of
# none, project, descr, owner or age; anything else is answered with
# a 400 error.  A 404 error is raised when no projects are found.
sub git_project_list {
	my $order = $input_params{'order'};
	# The pattern is anchored so that only the exact keywords pass; an
	# unanchored match would accept any string that merely contains one
	# of them.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project_filter, $strict_export);
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}

	git_project_search_form($searchtext, $search_use_regexp);
	git_project_list_body(\@list, $order);
	git_footer_html();
}
6104
# "forks" action: print the list of projects returned by
# git_get_projects_list() for the current project's path with a trailing
# ".git" removed.
#
# The optional 'order' input parameter must be exactly one of
# none, project, descr, owner or age; anything else is answered with
# a 400 error.  A 404 error is raised when no forks are found.
sub git_forks {
	my $order = $input_params{'order'};
	# The pattern is anchored so that only the exact keywords pass; an
	# unanchored match would accept any string that merely contains one
	# of them.
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my $filter = $project;
	$filter =~ s/\.git$//;
	my @list = git_get_projects_list($filter);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	git_print_header_div('summary', "$project forks");
	git_project_list_body(\@list, $order);
	git_footer_html();
}
6124
# "project_index" action: emit a plain-text index with one
# "<path> <owner>" line per project.  Both fields are percent-encoded
# (keeping '/') and spaces are written as '+'.
# A 404 error is raised when no projects are found.
sub git_project_index {
	my @projects = git_get_projects_list($project_filter, $strict_export);
	die_error(404, "No projects found") unless @projects;

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	foreach my $pr (@projects) {
		# look the owner up only if the project entry does not carry one yet
		$pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
			unless exists $pr->{'owner'};

		my @fields = ($pr->{'path'}, $pr->{'owner'});
		foreach my $field (@fields) {
			# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
			$field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
			$field =~ s/ /\+/g;
		}

		print "$fields[0] $fields[1]\n";
	}
}
6151
# "summary" action: project overview page.
#
# Prints a metadata table (description, owner, last change, repository
# URLs and, if the 'ctags' feature is on, the content tag cloud), the
# project's README.html (unless $prevent_xss is set), and then short
# sections for the shortlog, tags, heads, remotes (feature 'remote_heads')
# and forks (feature 'forks').  Each list section shows at most 16 entries
# and gets a "..." link to the full view when there are more.
sub git_summary {
	my $descr = git_get_project_description($project) || "none";
	my %co = parse_commit("HEAD");
	my %cd;
	%cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
	my $head = $co{'id'};
	my $remote_heads = gitweb_check_feature('remote_heads');

	my $owner = git_get_project_owner($project);

	my $refs = git_get_references();
	# These get_*_list functions return one more to allow us to see if
	# there are more ...
	my @taglist  = git_get_tags_list(16);
	my @headlist = git_get_heads_list(16);
	my %remotedata;
	%remotedata = git_get_remotes_list() if $remote_heads;

	my @forklist;
	my $forks_enabled = gitweb_check_feature('forks');
	if ($forks_enabled) {
		# find forks of a project
		(my $filter = $project) =~ s/\.git$//;
		@forklist = git_get_projects_list($filter);
		# filter out forks of forks
		if (@forklist) {
			@forklist = filter_forks_from_projects_list(\@forklist);
		}
	}

	# Returns undef when a list with the given last index fits into the
	# 16 displayed entries, otherwise a "..." link to the given action.
	my $more_link = sub {
		my ($last_index, $target_action) = @_;
		return $last_index <= 15
			? undef
			: $cgi->a({-href => href(action=>$target_action)}, "...");
	};

	git_header_html();
	git_print_page_nav('summary','', $head);

	print "<div class=\"title\">&nbsp;</div>\n";
	print "<table class=\"projects_list\">\n";
	print "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
	print "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
	if (defined $cd{'rfc2822'}) {
		print "<tr id=\"metadata_lchange\"><td>last change</td>" .
		      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
	}

	# use per project git URL list in $projectroot/$project/cloneurl
	# or make project git URL from git base URL and project name
	my @url_list = git_get_project_url_list($project);
	unless (@url_list) {
		@url_list = map { "$_/$project" } @git_base_url_list;
	}
	# only the first printed URL row carries the "URL" label
	my $url_tag = "URL";
	foreach my $git_url (grep { $_ } @url_list) {
		print format_repo_url($url_tag, $git_url);
		$url_tag = "";
	}

	# Tag cloud
	my $ctags_enabled = gitweb_check_feature('ctags');
	if ($ctags_enabled) {
		my $ctags = git_get_project_ctags($project);
		# without ability to add tags, don't show if there are none
		if (%$ctags) {
			my $cloud = git_populate_project_tagcloud($ctags);
			print "<tr id=\"metadata_ctags\">" .
			      "<td>content tags</td>" .
			      "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
			      "</tr>\n";
		}
	}

	print "</table>\n";

	# If XSS prevention is on, we don't include README.html.
	# TODO: Allow a readme in some safe format.
	if (!$prevent_xss && -s "$projectroot/$project/README.html") {
		print "<div class=\"title\">readme</div>\n" .
		      "<div class=\"readme\">\n";
		insert_file("$projectroot/$project/README.html");
		print "\n</div>\n"; # class="readme"
	}

	# we need to request one more than 16 (0..15) to check if
	# those 16 are all
	my @commitlist;
	@commitlist = parse_commits($head, 17) if $head;
	if (@commitlist) {
		git_print_header_div('shortlog');
		git_shortlog_body(\@commitlist, 0, 15, $refs,
		                  scalar $more_link->($#commitlist, "shortlog"));
	}

	if (@taglist) {
		git_print_header_div('tags');
		git_tags_body(\@taglist, 0, 15,
		              scalar $more_link->($#taglist, "tags"));
	}

	if (@headlist) {
		git_print_header_div('heads');
		git_heads_body(\@headlist, $head, 0, 15,
		               scalar $more_link->($#headlist, "heads"));
	}

	if (%remotedata) {
		git_print_header_div('remotes');
		git_remotes_body(\%remotedata, 15, $head);
	}

	if (@forklist) {
		git_print_header_div('forks');
		git_project_list_body(\@forklist, 'age', 0, 15,
		                      scalar $more_link->($#forklist, "forks"),
		                      'no_header');
	}

	git_footer_html();
}
6267
# "tag" action: show the tag object named by the global $hash -- a link
# to the tagged object, the authorship rows (when the tag has an author)
# and the tag message.  A 404 error is raised when the tag cannot be
# parsed.
sub git_tag {
	my %tag = parse_tag($hash);
	die_error(404, "Unknown tag object") unless %tag;

	my $head = git_get_head_hash($project);
	git_header_html();
	git_print_page_nav('','', $head,undef,$head);
	git_print_header_div('commit', esc_html($tag{'name'}), $hash);

	# the tagged object is linked twice: by its id and by its type
	my $object_cell =
		"<td>" . $cgi->a({-class => "list", -href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
		                 $tag{'object'}) . "</td>\n";
	my $type_cell =
		"<td class=\"link\">" . $cgi->a({-href => href(action=>$tag{'type'}, hash=>$tag{'object'})},
		                                $tag{'type'}) . "</td>\n";
	print "<div class=\"title_text\">\n" .
	      "<table class=\"object_header\">\n" .
	      "<tr>\n" .
	      "<td>object</td>\n" .
	      $object_cell .
	      $type_cell .
	      "</tr>\n";
	git_print_authorship_rows(\%tag, 'author') if defined($tag{'author'});
	print "</table>\n\n" .
	      "</div>\n";

	# tag message, one escaped line per <br/>
	print "<div class=\"page_body\">";
	for my $line (@{ $tag{'comment'} }) {
		chomp $line;
		print esc_html($line, -nbsp=>1) . "<br/>\n";
	}
	print "</div>\n";
	git_footer_html();
}
6302
6303 sub git_blame_common {
6304         my $format = shift || 'porcelain';
6305         if ($format eq 'porcelain' && $input_params{'javascript'}) {
6306                 $format = 'incremental';
6307                 $action = 'blame_incremental'; # for page title etc
6308         }
6309
6310         # permissions
6311         gitweb_check_feature('blame')
6312                 or die_error(403, "Blame view not allowed");
6313
6314         # error checking
6315         die_error(400, "No file name given") unless $file_name;
6316         $hash_base ||= git_get_head_hash($project);
6317         die_error(404, "Couldn't find base commit") unless $hash_base;
6318         my %co = parse_commit($hash_base)
6319                 or die_error(404, "Commit not found");
6320         my $ftype = "blob";
6321         if (!defined $hash) {
6322                 $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
6323                         or die_error(404, "Error looking up file");
6324         } else {
6325                 $ftype = git_get_type($hash);
6326                 if ($ftype !~ "blob") {
6327                         die_error(400, "Object is not a blob");
6328                 }
6329         }
6330
6331         my $fd;
6332         if ($format eq 'incremental') {
6333                 # get file contents (as base)
6334                 open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
6335                         or die_error(500, "Open git-cat-file failed");
6336         } elsif ($format eq 'data') {
6337                 # run git-blame --incremental
6338                 open $fd, "-|", git_cmd(), "blame", "--incremental",
6339                         $hash_base, "--", $file_name
6340                         or die_error(500, "Open git-blame --incremental failed");
6341         } else {
6342                 # run git-blame --porcelain
6343                 open $fd, "-|", git_cmd(), "blame", '-p',
6344                         $hash_base, '--', $file_name
6345                         or die_error(500, "Open git-blame --porcelain failed");
6346         }
6347
6348         # incremental blame data returns early
6349         if ($format eq 'data') {
6350                 print $cgi->header(
6351                         -type=>"text/plain", -charset => "utf-8",
6352                         -status=> "200 OK");
6353                 local $| = 1; # output autoflush
6354                 while (my $line = <$fd>) {
6355                         print to_utf8($line);
6356                 }
6357                 close $fd
6358                         or print "ERROR $!\n";
6359
6360                 print 'END';
6361                 if (defined $t0 && gitweb_check_feature('timed')) {
6362                         print ' '.
6363                               tv_interval($t0, [ gettimeofday() ]).
6364                               ' '.$number_of_git_cmds;
6365                 }
6366                 print "\n";
6367
6368                 return;
6369         }
6370
6371         # page header
6372         git_header_html();
6373         my $formats_nav =
6374                 $cgi->a({-href => href(action=>"blob", -replay=>1)},
6375                         "blob") .
6376                 " | ";
6377         if ($format eq 'incremental') {
6378                 $formats_nav .=
6379                         $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
6380                                 "blame") . " (non-incremental)";
6381         } else {
6382                 $formats_nav .=
6383                         $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
6384                                 "blame") . " (incremental)";
6385         }
6386         $formats_nav .=
6387                 " | " .
6388                 $cgi->a({-href => href(action=>"history", -replay=>1)},
6389                         "history") .
6390                 " | " .
6391                 $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
6392                         "HEAD");
6393         git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
6394         git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
6395         git_print_page_path($file_name, $ftype, $hash_base);
6396
6397         # page body
6398         if ($format eq 'incremental') {
6399                 print "<noscript>\n<div class=\"error\"><center><b>\n".
6400                       "This page requires JavaScript to run.\n Use ".
6401                       $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
6402                               'this page').
6403                       " instead.\n".
6404                       "</b></center></div>\n</noscript>\n";
6405
6406                 print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
6407         }
6408
6409         print qq!<div class="page_body">\n!;
6410         print qq!<div id="progress_info">... / ...</div>\n!
6411                 if ($format eq 'incremental');
6412         print qq!<table id="blame_table" class="blame" width="100%">\n!.
6413               #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
6414               qq!<thead>\n!.
6415               qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
6416               qq!</thead>\n!.
6417               qq!<tbody>\n!;
6418
6419         my @rev_color = qw(light dark);
6420         my $num_colors = scalar(@rev_color);
6421         my $current_color = 0;
6422
6423         if ($format eq 'incremental') {
6424                 my $color_class = $rev_color[$current_color];
6425
6426                 #contents of a file
6427                 my $linenr = 0;
6428         LINE:
6429                 while (my $line = <$fd>) {
6430                         chomp $line;
6431                         $linenr++;
6432
6433                         print qq!<tr id="l$linenr" class="$color_class">!.
6434                               qq!<td class="sha1"><a href=""> </a></td>!.
6435                               qq!<td class="linenr">!.
6436                               qq!<a class="linenr" href="">$linenr</a></td>!;
6437                         print qq!<td class="pre">! . esc_html($line) . "</td>\n";
6438                         print qq!</tr>\n!;
6439                 }
6440
6441         } else { # porcelain, i.e. ordinary blame
6442                 my %metainfo = (); # saves information about commits
6443
6444                 # blame data
6445         LINE:
6446                 while (my $line = <$fd>) {
6447                         chomp $line;
6448                         # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
6449                         # no <lines in group> for subsequent lines in group of lines
6450                         my ($full_rev, $orig_lineno, $lineno, $group_size) =
6451                            ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
6452                         if (!exists $metainfo{$full_rev}) {
6453                                 $metainfo{$full_rev} = { 'nprevious' => 0 };
6454                         }
6455                         my $meta = $metainfo{$full_rev};
6456                         my $data;
6457                         while ($data = <$fd>) {
6458                                 chomp $data;
6459                                 last if ($data =~ s/^\t//); # contents of line
6460                                 if ($data =~ /^(\S+)(?: (.*))?$/) {
6461                                         $meta->{$1} = $2 unless exists $meta->{$1};
6462                                 }
6463                                 if ($data =~ /^previous /) {
6464                                         $meta->{'nprevious'}++;
6465                                 }
6466                         }
6467                         my $short_rev = substr($full_rev, 0, 8);
6468                         my $author = $meta->{'author'};
6469                         my %date =
6470                                 parse_date($meta->{'author-time'}, $meta->{'author-tz'});
6471                         my $date = $date{'iso-tz'};
6472                         if ($group_size) {
6473                                 $current_color = ($current_color + 1) % $num_colors;
6474                         }
6475                         my $tr_class = $rev_color[$current_color];
6476                         $tr_class .= ' boundary' if (exists $meta->{'boundary'});
6477                         $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
6478                         $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
6479                         print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
6480                         if ($group_size) {
6481                                 print "<td class=\"sha1\"";
6482                                 print " title=\"". esc_html($author) . ", $date\"";
6483                                 print " rowspan=\"$group_size\"" if ($group_size > 1);
6484                                 print ">";
6485                                 print $cgi->a({-href => href(action=>"commit",
6486                                                              hash=>$full_rev,
6487                                                              file_name=>$file_name)},
6488                                               esc_html($short_rev));
6489                                 if ($group_size >= 2) {
6490                                         my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
6491                                         if (@author_initials) {
6492                                                 print "<br />" .
6493                                                       esc_html(join('', @author_initials));
6494                                                 #           or join('.', ...)
6495                                         }
6496                                 }
6497                                 print "</td>\n";
6498                         }
6499                         # 'previous' <sha1 of parent commit> <filename at commit>
6500                         if (exists $meta->{'previous'} &&
6501                             $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
6502                                 $meta->{'parent'} = $1;
6503                                 $meta->{'file_parent'} = unquote($2);
6504                         }
6505                         my $linenr_commit =
6506                                 exists($meta->{'parent'}) ?
6507                                 $meta->{'parent'} : $full_rev;
6508                         my $linenr_filename =
6509                                 exists($meta->{'file_parent'}) ?
6510                                 $meta->{'file_parent'} : unquote($meta->{'filename'});
6511                         my $blamed = href(action => 'blame',
6512                                           file_name => $linenr_filename,
6513                                           hash_base => $linenr_commit);
6514                         print "<td class=\"linenr\">";
6515                         print $cgi->a({ -href => "$blamed#l$orig_lineno",
6516                                         -class => "linenr" },
6517                                       esc_html($lineno));
6518                         print "</td>";
6519                         print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
6520                         print "</tr>\n";
6521                 } # end while
6522
6523         }
6524
6525         # footer
6526         print "</tbody>\n".
6527               "</table>\n"; # class="blame"
6528         print "</div>\n";   # class="blame_body"
6529         close $fd
6530                 or print "Reading blob failed\n";
6531
6532         git_footer_html();
6533 }
6534
# 'blame' action: delegates to git_blame_common() without passing
# a format argument.
sub git_blame {
	return git_blame_common();
}
6538
# 'blame_incremental' action: delegates to git_blame_common(), asking
# for the 'incremental' format.
sub git_blame_incremental {
	return git_blame_common('incremental');
}
6542
# 'blame_data' action: delegates to git_blame_common(), asking for
# the 'data' format.
sub git_blame_data {
	return git_blame_common('data');
}
6546
# 'tags' action: page with the list of tags of the current project.
# The tag table is emitted only when git_get_tags_list() returns
# at least one entry.
sub git_tags {
	my $head_hash = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('', '', $head_hash, undef, $head_hash,
	                   format_ref_views('tags'));
	git_print_header_div('summary', $project);

	my @tags = git_get_tags_list();
	git_tags_body(\@tags) if @tags;

	git_footer_html();
}
6559
# 'heads' action: page with the list of heads of the current project.
# The table is emitted only when git_get_heads_list() returns at least
# one entry; the HEAD hash is passed on to git_heads_body().
sub git_heads {
	my $head_hash = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('', '', $head_hash, undef, $head_hash,
	                   format_ref_views('heads'));
	git_print_header_div('summary', $project);

	my @heads = git_get_heads_list();
	git_heads_body(\@heads, $head_hash) if @heads;

	git_footer_html();
}
6572
# 'remotes' action.  Serves two views: when the 'hash' input parameter
# names a remote, only that remote is shown; otherwise all remotes of
# the project are listed.
#
# Errors out with 403 if the 'remote_heads' feature is off, with 500 if
# the remote data cannot be obtained, and with 404 if that data is empty.
sub git_remotes {
	die_error(403, "Remote heads view is disabled")
		unless gitweb_check_feature('remote_heads');

	my $head_hash   = git_get_head_hash($project);
	my $remote_name = $input_params{'hash'};

	my $remotes = git_get_remotes_list($remote_name);
	defined $remotes
		or die_error(500, "Unable to get remote information");

	if (!%$remotes) {
		my $message = defined $remote_name
			? "Remote $remote_name not found"
			: "No remotes found";
		die_error(404, $message);
	}

	git_header_html(undef, undef, -action_extra => $remote_name);
	git_print_page_nav('', '',  $head_hash, undef, $head_hash,
		format_ref_views($remote_name ? '' : 'remotes'));

	fill_remote_heads($remotes);
	if (!defined $remote_name) {
		# list of all the remotes
		git_print_header_div('summary', "$project remotes");
		git_remotes_body($remotes, undef, $head_hash);
	} else {
		# single remote view
		git_print_header_div('remotes', "$remote_name remote for $project");
		git_remote_block($remote_name, $remotes->{$remote_name},
		                 undef, $head_hash);
	}

	git_footer_html();
}
6605
# 'blob_plain' action: send the raw contents of a blob to the client.
#
# The optional argument is a content type; it is handed to
# blob_contenttype() together with the file name and the open pipe, and
# the result is what gets used.  The blob is taken from $hash; when
# $hash is not set it is looked up by $file_name in $hash_base (or in
# the project's HEAD if $hash_base is empty).
#
# Dies via die_error() with 404 if the file cannot be found, 400 if
# neither hash nor file name is given, and 500 if git-cat-file cannot
# be started.
sub git_blob_plain {
	my $type = shift;
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Open git-cat-file blob '$hash' failed");

	# content-type (can include charset)
	$type = blob_contenttype($fd, $file_name, $type);

	# "save as" filename, even when no $file_name is given
	my $save_as = "$hash";
	if (defined $file_name) {
		$save_as = $file_name;
	} elsif ($type =~ m/^text\//) {
		$save_as .= '.txt';
	}
	# The name is sent inside a quoted header parameter, so a literal
	# quote or backslash has to be backslash-escaped (same treatment as
	# the snapshot file name gets in git_snapshot).
	$save_as =~ s/(["\\])/\\$1/g;

	# With XSS prevention on, blobs of all types except a few known safe
	# ones are served with "Content-Disposition: attachment" to make sure
	# they don't run in our security domain.  For certain image types,
	# blob view writes an <img> tag referring to blob_plain view, and we
	# want to be sure not to break that by serving the image as an
	# attachment (though Firefox 3 doesn't seem to care).
	my $sandbox = $prevent_xss &&
		$type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

	# serve text/* as text/plain; the same goes for textual */*+xml
	# (e.g. image/svg+xml, application/xhtml+xml).  The subtype needs
	# '[a-z]+' here: a bare '[a-z]' only matched one-letter subtypes.
	if ($prevent_xss &&
	    ($type =~ m!^text/[a-z]+\b(.*)$! ||
	     ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
		# keep whatever followed the media type (e.g. charset)
		my $rest = $1;
		$rest = defined $rest ? $rest : '';
		$type = "text/plain$rest";
	}

	print $cgi->header(
		-type => $type,
		-expires => $expires,
		-content_disposition =>
			($sandbox ? 'attachment' : 'inline')
			. '; filename="' . $save_as . '"');
	# slurp mode: the blob is read and written in one piece
	local $/ = undef;
	binmode STDOUT, ':raw';
	print <$fd>;
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
6667
# 'blob' action: HTML view of a single blob.
#
# The blob is taken from $hash; when $hash is not set it is looked up by
# $file_name in $hash_base (or in the project's HEAD if $hash_base is
# empty).  Content that is neither text/* nor gif/png/jpeg and tests as
# binary is handed over to git_blob_plain().  Images are shown through an
# <img> tag pointing at the 'blob_plain' view; everything else is printed
# line by line with line-number anchors, optionally run through the
# highlighter.
sub git_blob {
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	my $have_blame = gitweb_check_feature('blame');
	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Couldn't cat $file_name, $hash");
	my $mimetype = blob_mimetype($fd, $file_name);
	# use 'blob_plain' (aka 'raw') view for files that cannot be displayed
	if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
		close $fd;
		return git_blob_plain($mimetype);
	}
	# we can have blame only for text/* mimetype
	$have_blame &&= ($mimetype =~ m!^text/!);

	# when a syntax is recognized, read from the highlighter instead
	my $highlight = gitweb_check_feature('highlight');
	my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
	$fd = run_highlighter($fd, $highlight, $syntax)
		if $syntax;

	git_header_html(undef, $expires);
	my $formats_nav = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		if (defined $file_name) {
			if ($have_blame) {
				$formats_nav .=
					$cgi->a({-href => href(action=>"blame", -replay=>1)},
					        "blame") .
					" | ";
			}
			$formats_nav .=
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history") .
				" | " .
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw") .
				" | " .
				$cgi->a({-href => href(action=>"blob",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		} else {
			$formats_nav .=
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw");
		}
		git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
		git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
	} else {
		# no usable commit: empty navigation bar, title is the blob id
		print "<div class=\"page_nav\">\n" .
		      "<br/><br/></div>\n" .
		      "<div class=\"title\">".esc_html($hash)."</div>\n";
	}
	git_print_page_path($file_name, "blob", $hash_base);
	print "<div class=\"page_body\">\n";
	if ($mimetype =~ m!^image/!) {
		print qq!<img type="!.esc_attr($mimetype).qq!"!;
		if ($file_name) {
			print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
		}
		# the URL lands in an attribute value, so it is escaped like the
		# other attributes here and like the line-number links below
		print qq! src="! .
		      esc_attr(href(action=>"blob_plain", hash=>$hash,
		                    hash_base=>$hash_base, file_name=>$file_name)) .
		      qq!" />\n!;
	} else {
		my $nr;
		while (my $line = <$fd>) {
			chomp $line;
			$nr++;
			$line = untabify($line);
			# highlighter output is sanitized, plain text is escaped
			printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
			       $nr, esc_attr(href(-replay => 1)), $nr, $nr,
			       $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
		}
	}
	close $fd
		or print "Reading blob failed.\n";
	print "</div>";
	git_footer_html();
}
6760
# 'tree' action: HTML listing of a tree object.
#
# $hash_base defaults to "HEAD".  When $hash is not set, the tree is
# looked up by $file_name in $hash_base, or $hash_base itself is used if
# there is no file name.  Rows alternate between the "dark" and "light"
# classes, and a '..' row is added first when a file name is given and a
# commit for $hash_base could be parsed.
sub git_tree {
	$hash_base = "HEAD" unless defined $hash_base;
	unless (defined $hash) {
		$hash = defined $file_name
			? git_get_hash_by_path($hash_base, $file_name, "tree")
			: $hash_base;
	}
	defined($hash)
		or die_error(404, "No such tree");

	my $show_sizes = gitweb_check_feature('show-sizes');
	my $have_blame = gitweb_check_feature('blame');

	my @entries;
	{
		# ls-tree -z output is NUL-terminated
		local $/ = "\0";
		my @ls_tree = (git_cmd(), "ls-tree", '-z',
		               ($show_sizes ? '-l' : ()), @extra_options, $hash);
		open my $fd, "-|", @ls_tree
			or die_error(500, "Open git-ls-tree failed");
		chomp(@entries = <$fd>);
		close $fd
			or die_error(404, "Reading tree failed");
	}

	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $hash_base);
	git_header_html();
	my $basedir = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		my @views_nav;
		if (defined $file_name) {
			my $history_link =
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history");
			my $head_link =
				$cgi->a({-href => href(action=>"tree",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
			push @views_nav, $history_link, $head_link;
		}
		my $snapshot_links = format_snapshot_links($hash);
		# FIXME: Should be available when we have no hash base as well.
		push @views_nav, $snapshot_links
			if defined $snapshot_links;
		git_print_page_nav('tree','', $hash_base, undef, undef,
		                   join(' | ', @views_nav));
		git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
	} else {
		# no commit to hang the view on: forget the base and show
		# an empty navigation bar with the tree id as title
		undef $hash_base;
		print "<div class=\"page_nav\">\n";
		print "<br/><br/></div>\n";
		print "<div class=\"title\">".esc_html($hash)."</div>\n";
	}
	if (defined $file_name) {
		$basedir = $file_name;
		$basedir .= '/'
			if ($basedir ne '' && substr($basedir, -1) ne '/');
		git_print_page_path($file_name, 'tree', $hash_base);
	}
	print "<div class=\"page_body\">\n";
	print "<table class=\"tree\">\n";

	# true => next row is "dark", false => next row is "light"
	my $dark_row = 1;

	# '..' (top directory) link if possible
	if (defined $hash_base &&
	    defined $file_name && $file_name =~ m![^/]+$!) {
		print '<tr class="' . ($dark_row ? 'dark' : 'light') . "\">\n";
		$dark_row ^= 1;

		# strip the last path component; an empty result means top level
		(my $up = $file_name) =~ s!/?[^/]+$!!;
		$up = undef if !$up;

		# based on git_print_tree_entry
		print '<td class="mode">' . mode_str('040000') . "</td>\n";
		print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
		print '<td class="list">';
		print $cgi->a({-href => href(action=>"tree",
		                             hash_base=>$hash_base,
		                             file_name=>$up)},
		              "..");
		print "</td>\n";
		print "<td class=\"link\"></td>\n";

		print "</tr>\n";
	}

	foreach my $entry (@entries) {
		my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

		print '<tr class="' . ($dark_row ? 'dark' : 'light') . "\">\n";
		$dark_row ^= 1;

		git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

		print "</tr>\n";
	}
	print "</table>\n" .
	      "</div>";
	git_footer_html();
}
6870
# Build the base name of a snapshot as "<project>-<version>".
#
# Parameters: project path and the hash (object id or ref name).
# The project part is the basename of the path with a trailing ".git" or
# "/.git" removed and control characters replaced by '?'.  The version
# part depends on the form of the hash:
#   - hexadecimal id:  kept as given, or replaced by the short hash when
#                      it is longer than 7 characters and is a prefix of
#                      the full hash
#   - refs/tags/X:     X
#   - anything else:   the name (without refs/heads/ or refs/remotes/)
#                      followed by '-' and the short hash
# Slashes in the version part are turned into dots.
#
# Returns the name in scalar context, and the pair (name, name) in list
# context.
sub snapshot_name {
	my ($project, $hash) = @_;

	# path/to/project.git  -> project
	# path/to/project/.git -> project
	my $name = to_utf8($project);
	$name =~ s,([^/])/*\.git$,$1,;
	$name = basename($name);
	# sanitize name
	$name =~ s/[[:cntrl:]]/?/g;

	my $ver_str;
	if ($hash =~ /^[0-9a-fA-F]+$/) {
		# shorten SHA-1 hash
		my $full_hash = git_get_full_hash($project, $hash);
		$ver_str = ($full_hash =~ /^$hash/ && length($hash) > 7)
			? git_get_short_hash($project, $hash)
			: $hash;
	} elsif ($hash =~ m!^refs/tags/(.*)$!) {
		# tags don't need shortened SHA-1 hash
		$ver_str = $1;
	} else {
		# branches and other need shortened SHA-1 hash
		my $ref_name = ($hash =~ m!^refs/(?:heads|remotes)/(.*)$!)
			? $1
			: $hash;
		$ver_str = $ref_name . '-' . git_get_short_hash($project, $hash);
	}
	# in case of hierarchical branch names
	$ver_str =~ tr!/!.!;

	# name = project-version_string
	$name = "$name-$ver_str";

	return $name unless wantarray;
	return ($name, $name);
}
6907
# 'snapshot' action: send an archive of the tree-ish $hash.
#
# The format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  The archive is produced
# by "git archive", piped through the format's compressor if it has one.
#
# Dies via die_error():
#   403  snapshots are off, or the format is disabled / not in
#        @snapshot_fmts
#   400  malformed or unknown format, or the object is a blob
#   404  the object does not exist
#   500  the archive command could not be started
sub git_snapshot {
	my $format = $input_params{'snapshot_format'};
	if (!@snapshot_fmts) {
		die_error(403, "Snapshots not allowed");
	}
	# default to first supported snapshot format
	$format ||= $snapshot_fmts[0];
	if ($format !~ m/^[a-z0-9]+$/) {
		die_error(400, "Invalid snapshot format parameter");
	} elsif (!exists($known_snapshot_formats{$format})) {
		die_error(400, "Unknown snapshot format");
	} elsif ($known_snapshot_formats{$format}{'disabled'}) {
		die_error(403, "Snapshot format not allowed");
	} elsif (!grep($_ eq $format, @snapshot_fmts)) {
		die_error(403, "Unsupported snapshot format");
	}

	my $type = git_get_type("$hash^{}");
	if (!$type) {
		die_error(404, 'Object does not exist');
	}  elsif ($type eq 'blob') {
		die_error(400, 'Object is not a tree-ish');
	}

	my ($name, $prefix) = snapshot_name($project, $hash);
	my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
	my $cmd = quote_command(
		git_cmd(), 'archive',
		"--format=$known_snapshot_formats{$format}{'format'}",
		"--prefix=$prefix/", $hash);
	if (exists $known_snapshot_formats{$format}{'compressor'}) {
		$cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
	}

	# Start the command before any header goes out, so that a failure
	# here produces a clean error page rather than an error appended to
	# an already announced "200 OK" archive response.
	open my $fd, "-|", $cmd
		or die_error(500, "Execute git-archive failed");

	# the name is sent inside a quoted header parameter
	$filename =~ s/(["\\])/\\$1/g;
	print $cgi->header(
		-type => $known_snapshot_formats{$format}{'type'},
		-content_disposition => 'inline; filename="' . $filename . '"',
		-status => '200 OK');

	# Copy the archive through in fixed-size blocks; it is binary data
	# and can be large, so it is neither split on newlines nor held in
	# memory as a whole.
	binmode STDOUT, ':raw';
	my $buffer;
	while (read($fd, $buffer, 65536)) {
		print $buffer;
	}
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
6955
# Common driver for log-like views.
#
# Parameters:
#   $fmt_name   name of the view, passed to the paging and page navigation
#   $body_subr  code reference that prints the list of commits
#   $base       revision to list from (defaults to the project's HEAD)
#   $parent     optional; when given the range "$parent..$base" is listed
#   $file_name  optional path to limit the list to
#   $file_hash  optional id of that path; if absent it is looked up in the
#               listed commits
#
# One page holds 100 commits; 101 are requested so that the presence of a
# following page can be detected.  The global $page is set to 0 if unset.
sub git_log_generic {
	my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

	my $head = git_get_head_hash($project);
	$base = $head unless defined $base;
	$page = 0     unless defined $page;
	my $refs = git_get_references();

	my $revisions = defined $parent ? "$parent..$base" : $base;
	my @path_limit = defined $file_name ? ($file_name, "--full-history") : ();
	my @commitlist =
		parse_commits($revisions, 101, (100 * $page), @path_limit);

	my $ftype;
	if (!defined $file_hash && defined $file_name) {
		# some commits could have deleted file in question,
		# and not have it in tree, but one of them has to have it
		foreach my $commit (@commitlist) {
			$file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
			last if defined $file_hash;
		}
	}
	$ftype = git_get_type($file_hash)
		if defined $file_hash;
	die_error(500, "Unknown type of object")
		if (defined $file_name && !defined $ftype);

	my %co;
	if (defined $file_name) {
		%co = parse_commit($base)
			or die_error(404, "Unknown commit object");
	}

	# the 101st commit, if present, means there is a next page
	my $has_next_page = ($#commitlist >= 100);
	my $paging_nav = format_paging_nav($fmt_name, $page, $has_next_page);
	my $next_link = $has_next_page
		? $cgi->a({-href => href(-replay=>1, page=>$page+1),
		           -accesskey => "n", -title => "Alt-n"}, "next")
		: '';

	my $patch_max = gitweb_get_feature('patches');
	if ($patch_max && !defined $file_name &&
	    ($patch_max < 0 || @commitlist <= $patch_max)) {
		$paging_nav .= " &sdot; " .
			$cgi->a({-href => href(action=>"patches", -replay=>1)},
			        "patches");
	}

	git_header_html();
	git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
	if (defined $file_name) {
		git_print_header_div('commit', esc_html($co{'title'}), $base);
		git_print_page_path($file_name, $ftype, $hash_base);
	} else {
		git_print_header_div('summary', $project);
	}

	$body_subr->(\@commitlist, 0, 99, $refs, $next_link,
	             $file_name, $file_hash, $ftype);

	git_footer_html();
}
7029
# 'log' action: git_log_generic() with git_log_body as the body printer,
# $hash as the base revision and $hash_parent as the optional parent.
sub git_log {
	return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
7034
# 'commit' action: page describing a single commit.
#
# The commit is $hash, falling back to $hash_base and then to "HEAD".
# The page shows the authorship rows, the commit, tree and parent ids
# with their links, the commit message, and the diff-tree output against
# the parent (against "--root" for a parentless commit, combined '-c'
# form for a merge).
#
# Dies via die_error() with 404 if the commit cannot be parsed or reading
# git-diff-tree fails, and with 500 if git-diff-tree cannot be started.
sub git_commit {
	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
	    or die_error(404, "Unknown commit object");

	my $parent  = $co{'parent'};
	my $parents = $co{'parents'}; # listref

	# we need to prepare $formats_nav before any parameter munging
	my $formats_nav;
	if (!defined $parent) {
		# --root commitdiff
		$formats_nav = '(initial)';
	} elsif (@$parents == 1) {
		# single parent commit
		my $parent_link =
			$cgi->a({-href => href(action=>"commit",
			                       hash=>$parent)},
			        esc_html(substr($parent, 0, 7)));
		$formats_nav = '(parent: ' . $parent_link . ')';
	} else {
		# merge commit
		my @parent_links = map {
			$cgi->a({-href => href(action=>"commit",
			                       hash=>$_)},
			        esc_html(substr($_, 0, 7)));
		} @$parents;
		$formats_nav = '(merge: ' . join(' ', @parent_links) . ')';
	}
	if (gitweb_check_feature('patches') && @$parents <= 1) {
		$formats_nav .= " | " .
			$cgi->a({-href => href(action=>"patch", -replay=>1)},
			        "patch");
	}

	# what to diff against: the only parent, "--root" when there is
	# none, or '-c' (combined diff) for a merge
	my $diff_against;
	if (@$parents <= 1) {
		$diff_against = defined $parent ? $parent : "--root";
	} else {
		$diff_against = '-c';
	}
	open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
		@diff_opts, $diff_against, $hash, "--"
		or die_error(500, "Open git-diff-tree failed");
	chomp(my @difftree = <$fd>);
	close $fd or die_error(404, "Reading git-diff-tree failed");

	# non-textual hash id's can be cached
	my $expires;
	$expires = "+1d"
		if ($hash =~ m/^[0-9a-fA-F]{40}$/);

	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $co{'id'});

	git_header_html(undef, $expires);
	git_print_page_nav('commit', '',
	                   $hash, $co{'tree'}, $hash,
	                   $formats_nav);

	# the header links to the commitdiff, or to the tree for a
	# parentless commit
	if (!defined $co{'parent'}) {
		git_print_header_div('tree', esc_html($co{'title'}) . $ref, $co{'tree'}, $hash);
	} else {
		git_print_header_div('commitdiff', esc_html($co{'title'}) . $ref, $hash);
	}

	print "<div class=\"title_text\">\n" .
	      "<table class=\"object_header\">\n";
	git_print_authorship_rows(\%co);
	print "<tr><td>commit</td><td class=\"sha1\">$co{'id'}</td></tr>\n";

	# tree row; its link cell is closed only after the snapshot links
	my $tree_id_link =
		$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash),
		         class => "list"}, $co{'tree'});
	my $tree_view_link =
		$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$hash)},
		        "tree");
	print "<tr>" .
	      "<td>tree</td>" .
	      "<td class=\"sha1\">" . $tree_id_link . "</td>" .
	      "<td class=\"link\">" . $tree_view_link;
	my $snapshot_links = format_snapshot_links($hash);
	print " | " . $snapshot_links
		if defined $snapshot_links;
	print "</td>" .
	      "</tr>\n";

	# one row per parent
	foreach my $par (@$parents) {
		my $par_id_link =
			$cgi->a({-href => href(action=>"commit", hash=>$par),
			         class => "list"}, $par);
		my $par_commit_link =
			$cgi->a({-href => href(action=>"commit", hash=>$par)}, "commit");
		my $par_diff_link =
			$cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$par)}, "diff");
		print "<tr>" .
		      "<td>parent</td>" .
		      "<td class=\"sha1\">" . $par_id_link . "</td>" .
		      "<td class=\"link\">" .
		      $par_commit_link . " | " . $par_diff_link .
		      "</td>" .
		      "</tr>\n";
	}
	print "</table>".
	      "</div>\n";

	print "<div class=\"page_body\">\n";
	git_print_log($co{'comment'});
	print "</div>\n";

	git_difftree_body(\@difftree, $hash, @$parents);

	git_footer_html();
}
7148
# Work out the type of the requested object and redirect to the action
# named after that type.
#
# The object is identified by the request globals in one of two ways:
#   - $hash, or $hash_base alone (no $file_name)
#   - $hash_base together with $file_name
#
# On success a "302 Found" redirect is printed.  Failures are reported
# through die_error(): 400 when neither combination is given, 404 when
# the object (or the path inside the base object) cannot be found, and
# 500 when git-ls-tree cannot be started.
sub git_object {
        # object is defined by:
        # - hash or hash_base alone
        # - hash_base and file_name
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                # the command is passed as a single string so that the
                # stderr redirection can be appended to it
                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the command produced no output;
                # do not chomp undef (it warns under "use warnings")
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                # strip trailing slashes from the path
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                # only the first line of the output is looked at
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        # the object type doubles as the name of the action to redirect to
        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
7195
# Show the difference between two versions of a single blob.
#
# Parameters:
#   $format - 'html' (the default) or 'plain'; any other value ends in
#             die_error(400, "Unknown blobdiff format").
#
# The blobs are selected through the request globals: $hash_base and
# $hash_parent_base are both required, together with either $file_name
# (optionally $file_parent) or a 40-hex-digit $hash.  The diff style for
# the HTML view is read from $input_params{'diff_style'} and defaults to
# 'inline'.
#
# Output is printed directly: a complete HTML page for 'html', or a
# text/plain response for 'plain'.
sub git_blobdiff {
        my $format = shift || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                # exactly one raw diff line must remain
                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request left out from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        # %diffinfo is only filled in by the new style branch above, so an
        # empty hash means that branch was not taken.  The status is given
        # as a number, like in every other die_error() call of this sub.
        if (!%diffinfo) {
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                $formats_nav .= diff_style_nav($diff_style);
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, $diff_style,
                                  [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # rewrite a/<id> and b/<id> into file names, line by line,
                # up to and including the first line starting with "+++"
                while (my $line = <$fd>) {
                        $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the remainder of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
7330
# 'plain' flavour of the blobdiff view: delegates to git_blobdiff().
sub git_blobdiff_plain {
        return git_blobdiff('plain');
}
7334
# Build the navigation fragment for switching between diff styles.
#
# Parameters:
#   $diff_style  - currently selected style; a false value means 'inline'
#   $is_combined - when true, no style navigation is produced
#
# Returns a string in which every entry is prefixed with " | ", because
# the result is meant to be appended to navigation that already exists
# (so it reads "| foo | bar" rather than "foo | bar").  The selected
# style appears as plain text, the others as links.
sub diff_style_nav {
        my ($diff_style, $is_combined) = @_;

        if ($is_combined) {
                return "";
        }
        $diff_style = 'inline' unless $diff_style;

        # style names in display order, and the label shown for each
        my @style_order = ('inline', 'sidebyside');
        my %label_for = (
                'inline'     => 'inline',
                'sidebyside' => 'side by side',
        );

        my $nav = '';
        foreach my $style (@style_order) {
                my $entry;
                if ($style eq $diff_style) {
                        $entry = $label_for{$style};
                } else {
                        $entry = $cgi->a({-href => href(-replay=>1, diff_style => $style)},
                                         $label_for{$style});
                }
                $nav .= " | " . $entry;
        }
        return $nav;
}
7355
# Show the changes introduced by a commit, or between two commits.
#
# Parameters (named, passed as a flat list):
#   -format - 'html' (the default), 'plain' or 'patch'; any other value
#             ends in die_error(400, "Unknown commitdiff format")
#   -single - only looked at for the 'patch' format without $hash_parent:
#             limit the output to one patch
#
# The commit is taken from the request globals: $hash, falling back to
# $hash_base and then "HEAD".  $hash_parent selects what to diff against;
# when it is not given, merges use '--cc', ordinary commits their parent
# and parentless commits '--root'.  The diff style for the HTML view is
# read from $input_params{'diff_style'} and defaults to 'inline'.
#
# Output is printed directly.  The 'patch' format requires the 'patches'
# feature to be enabled, otherwise die_error(403) is called.
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';
        my $diff_style = $input_params{'diff_style'} || 'inline';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                # the "patch" link is only offered for non-merge commits
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }
                $formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        # say which parent it is, if it is one of them
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$hash_parent, hash_base=>undef)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(-replay=>1,
                                                       hash=>$co{'parent'}, hash_base=>undef)},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(-replay=>1,
                                                               hash=>$_, hash_base=>undef)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                if ($hash_parent) {
                        # NOTE(review): for a merge requested without an explicit
                        # hash_parent, $hash_parent was set to '--cc' above, so
                        # the range built here is "--cc..$hash" -- confirm
                        # whether the patch view of a merge is meant to work.
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$hash_parent..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                # the log is only printed when the comment has more than one line
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                # (the list of tag references used to be fetched here as
                # well, but its result was never used)
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$filename" . '"');
        }

        # write patch
        if ($format eq 'html') {
                # without an explicit parent (or with -c / --cc) the commit's
                # own parents are passed on, otherwise the requested one
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, $diff_style,
                                  \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                # the headers are already sent, so a failure can only be
                # reported inside the body
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7583
# 'plain' flavour of the commitdiff view: delegates to git_commitdiff().
sub git_commitdiff_plain {
        return git_commitdiff(
                -format => 'plain',
        );
}
7587
7588 # format-patch-style patches
# Patch view restricted to a single patch: git_commitdiff() in 'patch'
# format with -single set.
sub git_patch {
        return git_commitdiff(
                -format => 'patch',
                -single => 1,
        );
}
7592
# Patch view without the single-patch restriction: git_commitdiff() in
# 'patch' format.
sub git_patches {
        return git_commitdiff(
                -format => 'patch',
        );
}
7596
# 'history' view: hands over to git_log_generic() with git_history_body
# as the body callback, passing the base/parent base hashes, the file
# name and the hash from the request.
sub git_history {
        return git_log_generic(
                'history', \&git_history_body,
                $hash_base, $hash_parent_base,
                $file_name, $hash,
        );
}
7602
# Entry point of the 'search' action.
#
# Checks that the requested kind of search is enabled, fills in defaults
# for the search type ('commit'), the commit to start from (the project
# head) and the page (0), and then hands over to the handler for the
# search type.  Problems are reported through die_error(): 403 for a
# disabled feature, 400 for a missing search text or an unknown search
# type, 404 for an unknown commit.
sub git_search {
        $searchtype ||= 'commit';

        # check if appropriate features are enabled
        gitweb_check_feature('search')
                or die_error(403, "Search is disabled");

        # pickaxe may take all resources of your box and run for several
        # minutes with every query, and grep search might be potentially
        # CPU-intensive, too - so each has a feature switch of its own
        my %disabled_message = (
                'pickaxe' => "Pickaxe search is disabled",
                'grep'    => "Grep search is disabled",
        );
        if (exists $disabled_message{$searchtype}) {
                gitweb_check_feature($searchtype)
                        or die_error(403, $disabled_message{$searchtype});
        }

        die_error(400, "Text field is empty")
                unless defined $searchtext;

        $hash = git_get_head_hash($project)
                unless defined $hash;

        my %co = parse_commit($hash);
        die_error(404, "Unknown commit object")
                unless %co;

        $page = 0
                unless defined $page;

        # search type => sub doing the actual work
        my %search_handler = (
                'commit'    => \&git_search_message,
                'author'    => \&git_search_message,
                'committer' => \&git_search_message,
                'pickaxe'   => \&git_search_changes,
                'grep'      => \&git_search_files,
        );
        my $handler = $search_handler{$searchtype};
        if (defined $handler) {
                $handler->(%co);
        } else {
                die_error(400, "Unknown search type");
        }
}
7647
# Print the help page describing the available search types.
#
# The entries for 'commit', 'author' and 'committer' are always printed;
# the entries for 'grep' and 'pickaxe' only when the feature of the same
# name is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('','', $hash,$hash,$hash);

        # general explanation, start of the list, and the 'commit' entry
        print <<'HELP_INTRO';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        my $grep_enabled = gitweb_check_feature('grep');
        print <<'HELP_GREP' if $grep_enabled;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP

        print <<'HELP_PEOPLE';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        my $pickaxe_enabled = gitweb_check_feature('pickaxe');
        print <<'HELP_PICKAXE' if $pickaxe_enabled;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE

        print "</dl>\n";
        git_footer_html();
}
7691
# 'shortlog' view: hands over to git_log_generic() with git_shortlog_body
# as the body callback, passing the hash and parent hash from the request.
sub git_shortlog {
        return git_log_generic(
                'shortlog', \&git_shortlog_body,
                $hash, $hash_parent,
        );
}
7696
7697 ## ......................................................................
7698 ## feeds (RSS, Atom; OPML)
7699
7700 sub git_feed {
7701         my $format = shift || 'atom';
7702         my $have_blame = gitweb_check_feature('blame');
7703
7704         # Atom: http://www.atomenabled.org/developers/syndication/
7705         # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
7706         if ($format ne 'rss' && $format ne 'atom') {
7707                 die_error(400, "Unknown web feed format");
7708         }
7709
7710         # log/feed of current (HEAD) branch, log of given branch, history of file/directory
7711         my $head = $hash || 'HEAD';
7712         my @commitlist = parse_commits($head, 150, 0, $file_name);
7713
7714         my %latest_commit;
7715         my %latest_date;
7716         my $content_type = "application/$format+xml";
7717         if (defined $cgi->http('HTTP_ACCEPT') &&
7718                  $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
7719                 # browser (feed reader) prefers text/xml
7720                 $content_type = 'text/xml';
7721         }
7722         if (defined($commitlist[0])) {
7723                 %latest_commit = %{$commitlist[0]};
7724                 my $latest_epoch = $latest_commit{'committer_epoch'};
7725                 %latest_date   = parse_date($latest_epoch, $latest_commit{'comitter_tz'});
7726                 my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
7727                 if (defined $if_modified) {
7728                         my $since;
7729                         if (eval { require HTTP::Date; 1; }) {
7730                                 $since = HTTP::Date::str2time($if_modified);
7731                         } elsif (eval { require Time::ParseDate; 1; }) {
7732                                 $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
7733                         }
7734                         if (defined $since && $latest_epoch <= $since) {
7735                                 print $cgi->header(
7736                                         -type => $content_type,
7737                                         -charset => 'utf-8',
7738                                         -last_modified => $latest_date{'rfc2822'},
7739                                         -status => '304 Not Modified');
7740                                 return;
7741                         }
7742                 }
7743                 print $cgi->header(
7744                         -type => $content_type,
7745                         -charset => 'utf-8',
7746                         -last_modified => $latest_date{'rfc2822'});
7747         } else {
7748                 print $cgi->header(
7749                         -type => $content_type,
7750                         -charset => 'utf-8');
7751         }
7752
7753         # Optimization: skip generating the body if client asks only
7754         # for Last-Modified date.
7755         return if ($cgi->request_method() eq 'HEAD');
7756
7757         # header variables
7758         my $title = "$site_name - $project/$action";
7759         my $feed_type = 'log';
7760         if (defined $hash) {
7761                 $title .= " - '$hash'";
7762                 $feed_type = 'branch log';
7763                 if (defined $file_name) {
7764                         $title .= " :: $file_name";
7765                         $feed_type = 'history';
7766                 }
7767         } elsif (defined $file_name) {
7768                 $title .= " - $file_name";
7769                 $feed_type = 'history';
7770         }
7771         $title .= " $feed_type";
7772         my $descr = git_get_project_description($project);
7773         if (defined $descr) {
7774                 $descr = esc_html($descr);
7775         } else {
7776                 $descr = "$project " .
7777                          ($format eq 'rss' ? 'RSS' : 'Atom') .
7778                          " feed";
7779         }
7780         my $owner = git_get_project_owner($project);
7781         $owner = esc_html($owner);
7782
7783         #header
7784         my $alt_url;
7785         if (defined $file_name) {
7786                 $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
7787         } elsif (defined $hash) {
7788                 $alt_url = href(-full=>1, action=>"log", hash=>$hash);
7789         } else {
7790                 $alt_url = href(-full=>1, action=>"summary");
7791         }
7792         print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
7793         if ($format eq 'rss') {
7794                 print <<XML;
7795 <rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
7796 <channel>
7797 XML
7798                 print "<title>$title</title>\n" .
7799                       "<link>$alt_url</link>\n" .
7800                       "<description>$descr</description>\n" .
7801                       "<language>en</language>\n" .
7802                       # project owner is responsible for 'editorial' content
7803                       "<managingEditor>$owner</managingEditor>\n";
7804                 if (defined $logo || defined $favicon) {
7805                         # prefer the logo to the favicon, since RSS
7806                         # doesn't allow both
7807                         my $img = esc_url($logo || $favicon);
7808                         print "<image>\n" .
7809                               "<url>$img</url>\n" .
7810                               "<title>$title</title>\n" .
7811                               "<link>$alt_url</link>\n" .
7812                               "</image>\n";
7813                 }
7814                 if (%latest_date) {
7815                         print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
7816                         print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
7817                 }
7818                 print "<generator>gitweb v.$version/$git_version</generator>\n";
7819         } elsif ($format eq 'atom') {
7820                 print <<XML;
7821 <feed xmlns="http://www.w3.org/2005/Atom">
7822 XML
7823                 print "<title>$title</title>\n" .
7824                       "<subtitle>$descr</subtitle>\n" .
7825                       '<link rel="alternate" type="text/html" href="' .
7826                       $alt_url . '" />' . "\n" .
7827                       '<link rel="self" type="' . $content_type . '" href="' .
7828                       $cgi->self_url() . '" />' . "\n" .
7829                       "<id>" . href(-full=>1) . "</id>\n" .
7830                       # use project owner for feed author
7831                       "<author><name>$owner</name></author>\n";
7832                 if (defined $favicon) {
7833                         print "<icon>" . esc_url($favicon) . "</icon>\n";
7834                 }
7835                 if (defined $logo) {
7836                         # not twice as wide as tall: 72 x 27 pixels
7837                         print "<logo>" . esc_url($logo) . "</logo>\n";
7838                 }
7839                 if (! %latest_date) {
7840                         # dummy date to keep the feed valid until commits trickle in:
7841                         print "<updated>1970-01-01T00:00:00Z</updated>\n";
7842                 } else {
7843                         print "<updated>$latest_date{'iso-8601'}</updated>\n";
7844                 }
7845                 print "<generator version='$version/$git_version'>gitweb</generator>\n";
7846         }
7847
7848         # contents
7849         for (my $i = 0; $i <= $#commitlist; $i++) {
7850                 my %co = %{$commitlist[$i]};
7851                 my $commit = $co{'id'};
7852                 # we read 150, we always show 30 and the ones more recent than 48 hours
7853                 if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
7854                         last;
7855                 }
7856                 my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});
7857
7858                 # get list of changed files
7859                 open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7860                         $co{'parent'} || "--root",
7861                         $co{'id'}, "--", (defined $file_name ? $file_name : ())
7862                         or next;
7863                 my @difftree = map { chomp; $_ } <$fd>;
7864                 close $fd
7865                         or next;
7866
7867                 # print element (entry, item)
7868                 my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
7869                 if ($format eq 'rss') {
7870                         print "<item>\n" .
7871                               "<title>" . esc_html($co{'title'}) . "</title>\n" .
7872                               "<author>" . esc_html($co{'author'}) . "</author>\n" .
7873                               "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
7874                               "<guid isPermaLink=\"true\">$co_url</guid>\n" .
7875                               "<link>$co_url</link>\n" .
7876                               "<description>" . esc_html($co{'title'}) . "</description>\n" .
7877                               "<content:encoded>" .
7878                               "<![CDATA[\n";
7879                 } elsif ($format eq 'atom') {
7880                         print "<entry>\n" .
7881                               "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
7882                               "<updated>$cd{'iso-8601'}</updated>\n" .
7883                               "<author>\n" .
7884                               "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
7885                         if ($co{'author_email'}) {
7886                                 print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
7887                         }
7888                         print "</author>\n" .
7889                               # use committer for contributor
7890                               "<contributor>\n" .
7891                               "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
7892                         if ($co{'committer_email'}) {
7893                                 print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
7894                         }
7895                         print "</contributor>\n" .
7896                               "<published>$cd{'iso-8601'}</published>\n" .
7897                               "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
7898                               "<id>$co_url</id>\n" .
7899                               "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
7900                               "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
7901                 }
7902                 my $comment = $co{'comment'};
7903                 print "<pre>\n";
7904                 foreach my $line (@$comment) {
7905                         $line = esc_html($line);
7906                         print "$line\n";
7907                 }
7908                 print "</pre><ul>\n";
7909                 foreach my $difftree_line (@difftree) {
7910                         my %difftree = parse_difftree_raw_line($difftree_line);
7911                         next if !$difftree{'from_id'};
7912
7913                         my $file = $difftree{'file'} || $difftree{'to_file'};
7914
7915                         print "<li>" .
7916                               "[" .
7917                               $cgi->a({-href => href(-full=>1, action=>"blobdiff",
7918                                                      hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
7919                                                      hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
7920                                                      file_name=>$file, file_parent=>$difftree{'from_file'}),
7921                                       -title => "diff"}, 'D');
7922                         if ($have_blame) {
7923                                 print $cgi->a({-href => href(-full=>1, action=>"blame",
7924                                                              file_name=>$file, hash_base=>$commit),
7925                                               -title => "blame"}, 'B');
7926                         }
7927                         # if this is not a feed of a file history
7928                         if (!defined $file_name || $file_name ne $file) {
7929                                 print $cgi->a({-href => href(-full=>1, action=>"history",
7930                                                              file_name=>$file, hash=>$commit),
7931                                               -title => "history"}, 'H');
7932                         }
7933                         $file = esc_path($file);
7934                         print "] ".
7935                               "$file</li>\n";
7936                 }
7937                 if ($format eq 'rss') {
7938                         print "</ul>]]>\n" .
7939                               "</content:encoded>\n" .
7940                               "</item>\n";
7941                 } elsif ($format eq 'atom') {
7942                         print "</ul>\n</div>\n" .
7943                               "</content>\n" .
7944                               "</entry>\n";
7945                 }
7946         }
7947
7948         # end of feed
7949         if ($format eq 'rss') {
7950                 print "</channel>\n</rss>\n";
7951         } elsif ($format eq 'atom') {
7952                 print "</feed>\n";
7953         }
7954 }
7955
# Action handler for the RSS feed: delegates to git_feed(), selecting
# the 'rss' output format.
sub git_rss {
        return git_feed('rss');
}
7959
# Action handler for the Atom feed: delegates to git_feed(), selecting
# the 'atom' output format.
sub git_atom {
        return git_feed('atom');
}
7963
# Print an OPML 1.0 document with one <outline type="rss"> element per
# project returned by git_get_projects_list() (restricted by
# $project_filter and $strict_export).
#
# Reports a 404 through die_error() when the project list is empty.
# Projects for which no HEAD hash can be obtained, or whose HEAD commit
# cannot be parsed, are left out of the listing.
#
# Side effect: the global $git_dir is pointed at each project in turn
# (before its HEAD commit is parsed) and is not restored afterwards.
sub git_opml {
        my @projects = git_get_projects_list($project_filter, $strict_export);
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $title = esc_html($site_name);
        # mention the subdirectory in the document title only when
        # the listing is actually filtered
        my $filter = defined $project_filter
                ? " within subdirectory " . esc_html($project_filter)
                : "";

        print qq!<?xml version="1.0" encoding="utf-8"?>\n! .
              qq!<opml version="1.0">\n! .
              qq!<head>\n! .
              qq!  <title>$title OPML Export$filter</title>\n! .
              qq!</head>\n! .
              qq!<body>\n! .
              qq!<outline text="git RSS feeds">\n!;

        PROJECT:
        for my $proj (@projects) {
                my $proj_path = $proj->{'path'};

                my $head = git_get_head_hash($proj_path);
                next PROJECT unless defined $head;

                # parse_commit() below is run with $git_dir set to this project
                $git_dir = "$projectroot/$proj_path";
                my %co = parse_commit($head);
                next PROJECT unless %co;

                # shortened, HTML-escaped path serves as both text and title
                my $path = esc_html(chop_str($proj_path, 25, 5));
                my $rss  = href(-full => 1, project => $proj_path, action => 'rss');
                my $html = href(-full => 1, project => $proj_path, action => 'summary');
                print qq!<outline type="rss" text="$path" title="$path" ! .
                      qq!xmlUrl="$rss" htmlUrl="$html"/>\n!;
        }

        print "</outline>\n" .
              "</body>\n" .
              "</opml>\n";
}