Sync with 1.7.8.6
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8';
22
23 our $t0 = [ gettimeofday() ];
24 our $number_of_git_cmds = 0;
25
26 BEGIN {
27         CGI->compile() if $ENV{'MOD_PERL'};
28 }
29
30 our $version = "++GIT_VERSION++";
31
32 our ($my_url, $my_uri, $base_url, $path_info, $home_link);
# Work out the URLs gitweb uses to refer to itself and store them in the
# package globals $my_url, $my_uri, $base_url, $path_info and $home_link.
# Reads the global $cgi object and the PATH_INFO / SCRIPT_NAME environment
# variables; takes no arguments.
sub evaluate_uri {
        our $cgi;

        our $my_url = $cgi->url();
        our $my_uri = $cgi->url(-absolute => 1);

        # Base URL for relative URLs in gitweb ($logo, $favicon, ...),
        # needed and used only for URLs with nonempty PATH_INFO
        our $base_url = $my_url;

        # When the script is used as DirectoryIndex, the URL does not contain the name
        # of the script file itself, and $cgi->url() fails to strip PATH_INFO, so we
        # have to do it ourselves. We make $path_info global because it's also used
        # later on.
        #
        # Another issue with the script being the DirectoryIndex is that the resulting
        # $my_url data is not the full script URL: this is good, because we want
        # generated links to keep implying the script name if it wasn't explicitly
        # indicated in the URL we're handling, but it means that $my_url cannot be used
        # as base URL.
        # Therefore, if we needed to strip PATH_INFO, then we know that we have
        # to build the base URL ourselves:
        our $path_info = decode_utf8($ENV{"PATH_INFO"});
        if ($path_info) {
                # PATH_INFO is handed to CGI scripts already URL-decoded, while
                # the values obtained from $cgi->url() may still contain
                # %-escapes.  Decode them first, otherwise the suffix match
                # below fails for paths containing escaped characters.
                $my_url = unescape($my_url);
                $my_uri = unescape($my_uri);
                if ($my_url =~ s,\Q$path_info\E$,, &&
                    $my_uri =~ s,\Q$path_info\E$,, &&
                    defined $ENV{'SCRIPT_NAME'}) {
                        $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
                }
        }

        # target of the home link on top of all pages
        our $home_link = $my_uri || "/";
}
67
68 # core git executable to use
69 # this can just be "git" if your webserver has a sensible PATH
70 our $GIT = "++GIT_BINDIR++/git";
71
72 # absolute fs-path which will be prepended to the project path
73 #our $projectroot = "/pub/scm";
74 our $projectroot = "++GITWEB_PROJECTROOT++";
75
76 # fs traversing limit for getting project list
77 # the number is relative to the projectroot
78 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
79
80 # string of the home link on top of all pages
81 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
82
83 # name of your site or organization to appear in page titles
84 # replace this with something more descriptive for clearer bookmarks
85 our $site_name = "++GITWEB_SITENAME++"
86                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
87
88 # html snippet to include in the <head> section of each page
89 our $site_html_head_string = "++GITWEB_SITE_HTML_HEAD_STRING++";
90 # filename of html text to include at top of each page
91 our $site_header = "++GITWEB_SITE_HEADER++";
92 # html text to include at home page
93 our $home_text = "++GITWEB_HOMETEXT++";
94 # filename of html text to include at bottom of each page
95 our $site_footer = "++GITWEB_SITE_FOOTER++";
96
97 # URI of stylesheets
98 our @stylesheets = ("++GITWEB_CSS++");
99 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
100 our $stylesheet = undef;
101 # URI of GIT logo (72x27 size)
102 our $logo = "++GITWEB_LOGO++";
103 # URI of GIT favicon, assumed to be image/png type
104 our $favicon = "++GITWEB_FAVICON++";
105 # URI of gitweb.js (JavaScript code for gitweb)
106 our $javascript = "++GITWEB_JS++";
107
108 # URI and label (title) of GIT logo link
109 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
110 #our $logo_label = "git documentation";
111 our $logo_url = "http://git-scm.com/";
112 our $logo_label = "git homepage";
113
114 # source of projects list
115 our $projects_list = "++GITWEB_LIST++";
116
117 # the width (in characters) of the projects list "Description" column
118 our $projects_list_description_width = 25;
119
120 # group projects by category on the projects list
121 # (enabled if this variable evaluates to true)
122 our $projects_list_group_categories = 0;
123
124 # default category if none specified
125 # (leave the empty string for no category)
126 our $project_list_default_category = "";
127
128 # default order of projects list
129 # valid values are none, project, descr, owner, and age
130 our $default_projects_order = "project";
131
132 # show repository only if this file exists
133 # (only effective if this variable evaluates to true)
134 our $export_ok = "++GITWEB_EXPORT_OK++";
135
136 # show repository only if this subroutine returns true
137 # when given the path to the project, for example:
138 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
139 our $export_auth_hook = undef;
140
141 # only allow viewing of repositories also shown on the overview page
142 our $strict_export = "++GITWEB_STRICT_EXPORT++";
143
144 # list of git base URLs used for URL to where fetch project from,
145 # i.e. full URL is "$git_base_url/$project"
146 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
147
148 # default blob_plain mimetype and default charset for text/plain blob
149 our $default_blob_plain_mimetype = 'text/plain';
150 our $default_text_plain_charset  = undef;
151
152 # file to use for guessing MIME types before trying /etc/mime.types
153 # (relative to the current git repository)
154 our $mimetypes_file = undef;
155
156 # assume this charset if line contains non-UTF-8 characters;
157 # it should be a valid encoding (see Encode::Supported(3pm) for the list)
158 # in which all byte sequences are valid, for example
159 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
160 # could be even 'utf-8' for the old behavior)
161 our $fallback_encoding = 'latin1';
162
163 # rename detection options for git-diff and git-diff-tree
164 # - default is '-M', with the cost proportional to
165 #   (number of removed files) * (number of new files).
166 # - more costly is '-C' (which implies '-M'), with the cost proportional to
167 #   (number of changed files + number of removed files) * (number of new files)
168 # - even more costly is '-C', '--find-copies-harder' with cost
169 #   (number of files in the original tree) * (number of new files)
170 # - one might want to include '-B' option, e.g. '-B', '-M'
171 our @diff_opts = ('-M'); # taken from git_commit
172
173 # Disables features that would allow repository owners to inject script into
174 # the gitweb domain.
175 our $prevent_xss = 0;
176
177 # Path to the highlight executable to use (must be the one from
178 # http://www.andre-simon.de due to assumptions about parameters and output).
179 # Useful if highlight is not installed on your webserver's PATH.
180 # [Default: highlight]
181 our $highlight_bin = "++HIGHLIGHT_BIN++";
182
183 # information about snapshot formats that gitweb is capable of serving
184 our %known_snapshot_formats = (
185         # name => {
186         #       'display' => display name,
187         #       'type' => mime type,
188         #       'suffix' => filename suffix,
189         #       'format' => --format for git-archive,
190         #       'compressor' => [compressor command and arguments]
191         #                       (array reference, optional)
192         #       'disabled' => boolean (optional)}
193         #
194         'tgz' => {
195                 'display' => 'tar.gz',
196                 'type' => 'application/x-gzip',
197                 'suffix' => '.tar.gz',
198                 'format' => 'tar',
199                 'compressor' => ['gzip', '-n']},
200
201         'tbz2' => {
202                 'display' => 'tar.bz2',
203                 'type' => 'application/x-bzip2',
204                 'suffix' => '.tar.bz2',
205                 'format' => 'tar',
206                 'compressor' => ['bzip2']},
207
208         'txz' => {
209                 'display' => 'tar.xz',
210                 'type' => 'application/x-xz',
211                 'suffix' => '.tar.xz',
212                 'format' => 'tar',
213                 'compressor' => ['xz'],
214                 'disabled' => 1},
215
216         'zip' => {
217                 'display' => 'zip',
218                 'type' => 'application/x-zip',
219                 'suffix' => '.zip',
220                 'format' => 'zip'},
221 );
222
223 # Aliases so we understand old gitweb.snapshot values in repository
224 # configuration.
225 our %known_snapshot_format_aliases = (
226         'gzip'  => 'tgz',
227         'bzip2' => 'tbz2',
228         'xz'    => 'txz',
229
230         # backward compatibility: legacy gitweb config support
231         'x-gzip' => undef, 'gz' => undef,
232         'x-bzip2' => undef, 'bz2' => undef,
233         'x-zip' => undef, '' => undef,
234 );
235
236 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
237 # are changed, it may be appropriate to change these values too via
238 # $GITWEB_CONFIG.
239 our %avatar_size = (
240         'default' => 16,
241         'double'  => 32
242 );
243
244 # Used to set the maximum load that we will still respond to gitweb queries.
245 # If server load exceeds this value then return "503 server busy" error.
246 # If gitweb cannot determine server load, it is taken to be 0.
247 # Leave it undefined (or set to 'undef') to turn off load checking.
248 our $maxload = 300;
249
250 # configuration for 'highlight' (http://www.andre-simon.de/)
251 # match by basename
252 our %highlight_basename = (
253         #'Program' => 'py',
254         #'Library' => 'py',
255         'SConstruct' => 'py', # SCons equivalent of Makefile
256         'Makefile' => 'make',
257 );
258 # match by extension
259 our %highlight_ext = (
260         # main extensions, defining name of syntax;
261         # see files in /usr/share/highlight/langDefs/ directory
262         map { $_ => $_ }
263                 qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
264         # alternate extensions, see /etc/highlight/filetypes.conf
265         'h' => 'c',
266         map { $_ => 'sh'  } qw(bash zsh ksh),
267         map { $_ => 'cpp' } qw(cxx c++ cc),
268         map { $_ => 'php' } qw(php3 php4 php5 phps),
269         map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
270         map { $_ => 'make'} qw(mak mk),
271         map { $_ => 'xml' } qw(xhtml html htm),
272 );
273
274 # You define site-wide feature defaults here; override them with
275 # $GITWEB_CONFIG as necessary.
276 our %feature = (
277         # feature => {
278         #       'sub' => feature-sub (subroutine),
279         #       'override' => allow-override (boolean),
280         #       'default' => [ default options...] (array reference)}
281         #
282         # if feature is overridable (it means that allow-override has true value),
283         # then feature-sub will be called with default options as parameters;
284         # return value of feature-sub indicates if to enable specified feature
285         #
286         # if there is no 'sub' key (no feature-sub), then feature cannot be
287         # overridden
288         #
289         # use gitweb_get_feature(<feature>) to retrieve the <feature> value
290         # (an array) or gitweb_check_feature(<feature>) to check if <feature>
291         # is enabled
292
293         # Enable the 'blame' blob view, showing the last commit that modified
294         # each line in the file. This can be very CPU-intensive.
295
296         # To enable system wide have in $GITWEB_CONFIG
297         # $feature{'blame'}{'default'} = [1];
298         # To have project specific config enable override in $GITWEB_CONFIG
299         # $feature{'blame'}{'override'} = 1;
300         # and in project config gitweb.blame = 0|1;
301         'blame' => {
302                 'sub' => sub { feature_bool('blame', @_) },
303                 'override' => 0,
304                 'default' => [0]},
305
306         # Enable the 'snapshot' link, providing a compressed archive of any
307         # tree. This can potentially generate high traffic if you have large
308         # project.
309
310         # Value is a list of formats defined in %known_snapshot_formats that
311         # you wish to offer.
312         # To disable system wide have in $GITWEB_CONFIG
313         # $feature{'snapshot'}{'default'} = [];
314         # To have project specific config enable override in $GITWEB_CONFIG
315         # $feature{'snapshot'}{'override'} = 1;
316         # and in project config, a comma-separated list of formats or "none"
317         # to disable.  Example: gitweb.snapshot = tbz2,zip;
318         'snapshot' => {
319                 'sub' => \&feature_snapshot,
320                 'override' => 0,
321                 'default' => ['tgz']},
322
323         # Enable text search, which will list the commits which match author,
324         # committer or commit text to a given string.  Enabled by default.
325         # Project specific override is not supported.
326         #
327         # Note that this controls all search features, which means that if
328         # it is disabled, then 'grep' and 'pickaxe' search would also be
329         # disabled.
330         'search' => {
331                 'override' => 0,
332                 'default' => [1]},
333
334         # Enable grep search, which will list the files in currently selected
335         # tree containing the given string. Enabled by default. This can be
336         # potentially CPU-intensive, of course.
337         # Note that you need to have 'search' feature enabled too.
338
339         # To enable system wide have in $GITWEB_CONFIG
340         # $feature{'grep'}{'default'} = [1];
341         # To have project specific config enable override in $GITWEB_CONFIG
342         # $feature{'grep'}{'override'} = 1;
343         # and in project config gitweb.grep = 0|1;
344         'grep' => {
345                 'sub' => sub { feature_bool('grep', @_) },
346                 'override' => 0,
347                 'default' => [1]},
348
349         # Enable the pickaxe search, which will list the commits that modified
350         # a given string in a file. This can be practical and quite faster
351         # alternative to 'blame', but still potentially CPU-intensive.
352         # Note that you need to have 'search' feature enabled too.
353
354         # To enable system wide have in $GITWEB_CONFIG
355         # $feature{'pickaxe'}{'default'} = [1];
356         # To have project specific config enable override in $GITWEB_CONFIG
357         # $feature{'pickaxe'}{'override'} = 1;
358         # and in project config gitweb.pickaxe = 0|1;
359         'pickaxe' => {
360                 'sub' => sub { feature_bool('pickaxe', @_) },
361                 'override' => 0,
362                 'default' => [1]},
363
364         # Enable showing size of blobs in a 'tree' view, in a separate
365         # column, similar to what 'ls -l' does.  This cost a bit of IO.
366
367         # To disable system wide have in $GITWEB_CONFIG
368         # $feature{'show-sizes'}{'default'} = [0];
369         # To have project specific config enable override in $GITWEB_CONFIG
370         # $feature{'show-sizes'}{'override'} = 1;
371         # and in project config gitweb.showsizes = 0|1;
372         'show-sizes' => {
373                 'sub' => sub { feature_bool('showsizes', @_) },
374                 'override' => 0,
375                 'default' => [1]},
376
377         # Make gitweb use an alternative format of the URLs which can be
378         # more readable and natural-looking: project name is embedded
379         # directly in the path and the query string contains other
380         # auxiliary information. All gitweb installations recognize
381         # URL in either format; this configures in which formats gitweb
382         # generates links.
383
384         # To enable system wide have in $GITWEB_CONFIG
385         # $feature{'pathinfo'}{'default'} = [1];
386         # Project specific override is not supported.
387
388         # Note that you will need to change the default location of CSS,
389         # favicon, logo and possibly other files to an absolute URL. Also,
390         # if gitweb.cgi serves as your indexfile, you will need to force
391         # $my_uri to contain the script name in your $GITWEB_CONFIG.
392         'pathinfo' => {
393                 'override' => 0,
394                 'default' => [0]},
395
396         # Make gitweb consider projects in project root subdirectories
397         # to be forks of existing projects. Given project $projname.git,
398         # projects matching $projname/*.git will not be shown in the main
399         # projects list, instead a '+' mark will be added to $projname
400         # there and a 'forks' view will be enabled for the project, listing
401         # all the forks. If project list is taken from a file, forks have
402         # to be listed after the main project.
403
404         # To enable system wide have in $GITWEB_CONFIG
405         # $feature{'forks'}{'default'} = [1];
406         # Project specific override is not supported.
407         'forks' => {
408                 'override' => 0,
409                 'default' => [0]},
410
411         # Insert custom links to the action bar of all project pages.
412         # This enables you mainly to link to third-party scripts integrating
413         # into gitweb; e.g. git-browser for graphical history representation
414         # or custom web-based repository administration interface.
415
416         # The 'default' value consists of a list of triplets in the form
417         # (label, link, position) where position is the label after which
418         # to insert the link and link is a format string where %n expands
419         # to the project name, %f to the project path within the filesystem,
420         # %h to the current hash (h gitweb parameter) and %b to the current
421         # hash base (hb gitweb parameter); %% expands to %.
422
423         # To enable system wide have in $GITWEB_CONFIG e.g.
424         # $feature{'actions'}{'default'} = [('graphiclog',
425         #       '/git-browser/by-commit.html?r=%n', 'summary')];
426         # Project specific override is not supported.
427         'actions' => {
428                 'override' => 0,
429                 'default' => []},
430
431         # Allow gitweb to scan project content tags of the project repository,
432         # and display the popular Web 2.0-ish "tag cloud" near the projects
433         # list.  Note that this is something COMPLETELY different from the
434         # normal Git tags.
435
436         # gitweb by itself can show existing tags, but it does not handle
437         # tagging itself; you need to do it externally, outside gitweb.
438         # The format is described in git_get_project_ctags() subroutine.
439         # You may want to install the HTML::TagCloud Perl module to get
440         # a pretty tag cloud instead of just a list of tags.
441
442         # To enable system wide have in $GITWEB_CONFIG
443         # $feature{'ctags'}{'default'} = [1];
444         # Project specific override is not supported.
445
446         # In the future whether ctags editing is enabled might depend
447         # on the value, but using 1 should always mean no editing of ctags.
448         'ctags' => {
449                 'override' => 0,
450                 'default' => [0]},
451
452         # The maximum number of patches in a patchset generated in patch
453         # view. Set this to 0 or undef to disable patch view, or to a
454         # negative number to remove any limit.
455
456         # To disable system wide have in $GITWEB_CONFIG
457         # $feature{'patches'}{'default'} = [0];
458         # To have project specific config enable override in $GITWEB_CONFIG
459         # $feature{'patches'}{'override'} = 1;
460         # and in project config gitweb.patches = 0|n;
461         # where n is the maximum number of patches allowed in a patchset.
462         'patches' => {
463                 'sub' => \&feature_patches,
464                 'override' => 0,
465                 'default' => [16]},
466
467         # Avatar support. When this feature is enabled, views such as
468         # shortlog or commit will display an avatar associated with
469         # the email of the committer(s) and/or author(s).
470
471         # Currently available providers are gravatar and picon.
472         # If an unknown provider is specified, the feature is disabled.
473
474         # Gravatar depends on Digest::MD5.
475         # Picon currently relies on the indiana.edu database.
476
477         # To enable system wide have in $GITWEB_CONFIG
478         # $feature{'avatar'}{'default'} = ['<provider>'];
479         # where <provider> is either gravatar or picon.
480         # To have project specific config enable override in $GITWEB_CONFIG
481         # $feature{'avatar'}{'override'} = 1;
482         # and in project config gitweb.avatar = <provider>;
483         'avatar' => {
484                 'sub' => \&feature_avatar,
485                 'override' => 0,
486                 'default' => ['']},
487
488         # Enable displaying how much time and how many git commands
489         # it took to generate and display page.  Disabled by default.
490         # Project specific override is not supported.
491         'timed' => {
492                 'override' => 0,
493                 'default' => [0]},
494
495         # Enable turning some links into links to actions which require
496         # JavaScript to run (like 'blame_incremental').  Not enabled by
497         # default.  Project specific override is currently not supported.
498         'javascript-actions' => {
499                 'override' => 0,
500                 'default' => [0]},
501
502         # Enable and configure ability to change common timezone for dates
503         # in gitweb output via JavaScript.  Enabled by default.
504         # Project specific override is not supported.
505         'javascript-timezone' => {
506                 'override' => 0,
507                 'default' => [
508                         'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
509                                      # or undef to turn off this feature
510                         'gitweb_tz', # name of cookie where to store selected timezone
511                         'datetime',  # CSS class used to mark up dates for manipulation
512                 ]},
513
514         # Syntax highlighting support. This is based on Daniel Svensson's
515         # and Sham Chukoury's work in gitweb-xmms2.git.
516         # It requires the 'highlight' program present in $PATH,
517         # and therefore is disabled by default.
518
519         # To enable system wide have in $GITWEB_CONFIG
520         # $feature{'highlight'}{'default'} = [1];
521
522         'highlight' => {
523                 'sub' => sub { feature_bool('highlight', @_) },
524                 'override' => 0,
525                 'default' => [0]},
526
527         # Enable displaying of remote heads in the heads list
528
529         # To enable system wide have in $GITWEB_CONFIG
530         # $feature{'remote_heads'}{'default'} = [1];
531         # To have project specific config enable override in $GITWEB_CONFIG
532         # $feature{'remote_heads'}{'override'} = 1;
533         # and in project config gitweb.remote_heads = 0|1;
534         'remote_heads' => {
535                 'sub' => sub { feature_bool('remote_heads', @_) },
536                 'override' => 0,
537                 'default' => [0]},
538 );
539
# Return the effective value (a list) of the feature called $name.
#
# Unknown features yield an empty return.  The site-wide defaults from
# %feature are returned unless the feature is marked overridable AND a
# project is selected ($git_dir is defined); in that case the feature's
# 'sub' is called with the defaults and its result is returned.  A feature
# flagged overridable but lacking a 'sub' triggers a warning and falls back
# to the defaults.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $spec     = $feature{$name};
        my $handler  = $spec->{'sub'};
        my $can_override = $spec->{'override'};
        my @defaults = @{ $spec->{'default'} };

        # project specific override is possible only if we have project
        our $git_dir; # global variable, declared later
        return @defaults
                unless $can_override && defined $git_dir;

        unless (defined $handler) {
                warn "feature $name is not overridable";
                return @defaults;
        }

        return $handler->(@defaults);
}
558
# Convenience wrapper returning only the first value of a feature, which
# is handy for features that are simple on/off switches.  It lets you write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# where you would otherwise need
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
        my @values = gitweb_get_feature(@_);
        # list slice (not $values[0]) so an empty result stays an empty list
        return (@values)[0];
}
573
574
# Feature-sub for boolean features that can be overridden per project.
#
# Parameters: $key is the name of the gitweb.* project config variable;
# the next argument is the site-wide default value.
# Returns a one-element list: the default when the project config does not
# set the variable, (1) when the config value is 'true', and (0) otherwise.
# Previously any value other than 'true' or 'false' fell off the end of the
# sub without an explicit return; that case is now an explicit (0).
sub feature_bool {
        my ($key, $default) = @_;
        my ($val) = git_get_project_config($key, '--bool');

        return ($default) unless defined $val;
        return ($val eq 'true' ? 1 : 0);
}
587
# Feature-sub for 'snapshot': pick the list of snapshot formats.
#
# Takes the default formats as arguments.  If the project config sets
# gitweb.snapshot to a true value, that value replaces the defaults:
# 'none' means no formats at all, anything else is split on commas
# and/or whitespace.
sub feature_snapshot {
        my (@fmts) = @_;

        my ($configured) = git_get_project_config('snapshot');
        return @fmts unless $configured;

        my @chosen;
        @chosen = split /\s*[,\s]\s*/, $configured
                unless $configured eq 'none';

        return @chosen;
}
599
# Feature-sub for 'patches': the project config value of gitweb.patches
# (queried with --int) wins when git_get_project_config returns anything;
# otherwise the first argument (the site-wide default) is returned.
sub feature_patches {
        my ($default) = @_;
        my @configured = git_get_project_config('patches', '--int');

        return @configured ? @configured : ($default);
}
609
# Feature-sub for 'avatar': return the project's gitweb.avatar setting if
# git_get_project_config yields one, else the defaults passed as arguments.
sub feature_avatar {
        my @configured = git_get_project_config('avatar');

        return @configured if @configured;
        return @_;
}
615
# Tell whether $dir has a usable HEAD.
# A plain -e test alone is fragile: in a repository initialized long ago
# HEAD may be a symlink, and after pack-refs and pruning that symlink can
# dangle.  So a HEAD symlink whose target starts with refs/heads/ is
# accepted even when -e fails.
sub check_head_link {
        my ($dir) = @_;
        my $head = "$dir/HEAD";

        return 1 if -e $head;
        return (-l $head && readlink($head) =~ /^refs\/heads\//);
}
625
# Decide whether the repository at $dir may be shown.  All of these must
# hold: it has a valid HEAD (check_head_link), the $export_ok marker file
# exists inside it when $export_ok is set, and $export_auth_hook approves
# of it when such a hook is set.
sub check_export_ok {
        my ($dir) = @_;

        my $head_ok = check_head_link($dir);
        return $head_ok unless $head_ok;

        if ($export_ok) {
                my $marker_present = -e "$dir/$export_ok";
                return $marker_present unless $marker_present;
        }

        return (!$export_auth_hook || $export_auth_hook->($dir));
}
632
# Normalize a list of snapshot format names.
# - alternate (legacy) names found in %known_snapshot_format_aliases are
#   translated for backward compatibility;
# - names that are unknown to %known_snapshot_formats, or whose format is
#   marked 'disabled', are dropped.
# Some legacy aliases deliberately map to undef; those (and any undefined
# input) are removed before the hash lookups so that no "uninitialized
# value" warnings are emitted.
sub filter_snapshot_fmts {
        my @fmts = grep { defined } @_;

        @fmts = map {
                exists $known_snapshot_format_aliases{$_} ?
                       $known_snapshot_format_aliases{$_} : $_} @fmts;
        @fmts = grep {
                defined $_ &&
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}} @fmts;

        return @fmts;
}
645
646 # If it is set to a code reference, that code is run once per request,
647 # which allows updating configuration that changes with each request
648 # while the rest of the config file is run only once.
649 #
650 # Otherwise, if it is false then gitweb would process config file only once;
651 # if it is true then gitweb config would be run for each request.
652 our $per_request_config = 1;
653
# Read and run the gitweb config file named by the single parameter.
#
# Returns true (1) when the file was loaded, and false when the name is
# undefined or no such file exists, so calls can be chained to use the
# first file that exists.  Dies if the file exists but is not readable, or
# if running it raises an error (e.g. a syntax error), since a half-applied
# or silently skipped configuration is not recoverable.
sub read_config_file {
        my $filename = shift;
        return unless defined $filename;
        return unless -e $filename;

        # An existing but unreadable file used to be reported as loaded.
        die "Cannot read gitweb config file '$filename'\n"
                unless -r $filename;

        # 'do FILE' looks a relative name up in @INC instead of the current
        # directory, so hand it an absolute path to make sure the file that
        # was just tested is the one that gets run.
        require File::Spec;
        my $path = File::Spec->rel2abs($filename);

        do $path;
        # die if there are errors parsing config file
        die $@ if $@;
        return 1;
}
669
670 our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM, $GITWEB_CONFIG_COMMON);
# Determine the config file locations (environment variables take
# precedence over the build-time defaults) and load them: first the common
# system-wide file, then the per-instance file or, if that one could not be
# used, the system-wide fallback.
sub evaluate_gitweb_config {
        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";
        our $GITWEB_CONFIG_COMMON = $ENV{'GITWEB_CONFIG_COMMON'} || "++GITWEB_CONFIG_COMMON++";

        # Protect against duplicated file names, so that no config file is
        # read twice.  Only one of $GITWEB_CONFIG and $GITWEB_CONFIG_SYSTEM
        # is ever used, so those two being equal to each other is harmless.
        for my $candidate (\$GITWEB_CONFIG, \$GITWEB_CONFIG_SYSTEM) {
                $$candidate = "" if ($$candidate eq $GITWEB_CONFIG_COMMON);
        }

        # Common system-wide settings for convenience.
        # They can be overridden by GITWEB_CONFIG or GITWEB_CONFIG_SYSTEM.
        read_config_file($GITWEB_CONFIG_COMMON);

        # Use the first config file that exists: the per-instance
        # GITWEB_CONFIG if present, otherwise GITWEB_CONFIG_SYSTEM.
        return if read_config_file($GITWEB_CONFIG);
        read_config_file($GITWEB_CONFIG_SYSTEM);
}
691
# Get the load average of the system, to compare against $maxload.
# Currently the only source is '/proc/loadavg'; when that file cannot be
# opened or yields no data, 0 is returned, which means no load checking.
sub get_loadavg {
        if (open my $fd, '<', '/proc/loadavg') {
                my $line = <$fd>;
                close $fd;

                # The first three columns measure CPU and IO utilization of
                # the last one, five, and 15 minute periods.  The fourth
                # column shows the number of currently running processes and
                # the total number of processes in the m/n format.  The last
                # column displays the last process ID used.
                if (defined $line) {
                        my ($one_minute) = split(/\s+/, $line);
                        return $one_minute || 0;
                }
        }
        # additional checks for load average should go here for things that don't export
        # /proc/loadavg

        return 0;
}
713
714 # version of the core git binary
715 our $git_version;
# Run "$GIT --version" and store the reported version string in the global
# $git_version ("unknown" if the output does not match the expected form).
# Counts as one git command in $number_of_git_cmds.
sub evaluate_git_version {
        our $git_version;

        my $output = qx("$GIT" --version);
        if ($output =~ m/git version (.*)$/) {
                $git_version = $1;
        } else {
                $git_version = "unknown";
        }
        $number_of_git_cmds++;
}
720
# Refuse to serve the request (via die_error with status 503) when load
# checking is enabled ($maxload defined) and the current load average is
# above $maxload.
sub check_loadavg {
        my $overloaded = defined $maxload && get_loadavg() > $maxload;
        die_error(503, "The load average on the server is too high")
                if $overloaded;
}
726
727 # ======================================================================
728 # input validation and dispatch
729
730 # input parameters can be collected from a variety of sources (presently, CGI
731 # and PATH_INFO), so we define an %input_params hash that collects them all
732 # together during validation: this allows subsequent uses (e.g. href()) to be
733 # agnostic of the parameter origin
734
our %input_params = ();

# Keys of %input_params are the long parameter names.  The table below maps
# each long name to its short CGI query key; it is stored in this direction
# (name -> CGI key) because href(), the most frequent user, converts long
# names to their CGI equivalent.
#
# XXX: Warning: If you touch this, check the search form for updating,
# too.

our @cgi_param_mapping = (
        project           => "p",
        action            => "a",
        file_name         => "f",
        file_parent       => "fp",
        hash              => "h",
        hash_parent       => "hp",
        hash_base         => "hb",
        hash_parent_base  => "hpb",
        page              => "pg",
        order             => "o",
        searchtext        => "s",
        searchtype        => "st",
        snapshot_format   => "sf",
        extra_options     => "opt",
        search_use_regexp => "sr",
        ctag              => "by_tag",
        diff_style        => "ds",
        # this must be last entry (for manipulation from JavaScript)
        javascript        => "js"
);
our %cgi_param_mapping = @cgi_param_mapping;
767
# dispatch table of every known action (name => handler); it doubles as the
# list of valid actions for input validation
our %actions = (
        "blame"             => \&git_blame,
        "blame_incremental" => \&git_blame_incremental,
        "blame_data"        => \&git_blame_data,
        "blobdiff"          => \&git_blobdiff,
        "blobdiff_plain"    => \&git_blobdiff_plain,
        "blob"              => \&git_blob,
        "blob_plain"        => \&git_blob_plain,
        "commitdiff"        => \&git_commitdiff,
        "commitdiff_plain"  => \&git_commitdiff_plain,
        "commit"            => \&git_commit,
        "forks"             => \&git_forks,
        "heads"             => \&git_heads,
        "history"           => \&git_history,
        "log"               => \&git_log,
        "patch"             => \&git_patch,
        "patches"           => \&git_patches,
        "remotes"           => \&git_remotes,
        "rss"               => \&git_rss,
        "atom"              => \&git_atom,
        "search"            => \&git_search,
        "search_help"       => \&git_search_help,
        "shortlog"          => \&git_shortlog,
        "summary"           => \&git_summary,
        "tag"               => \&git_tag,
        "tags"              => \&git_tags,
        "tree"              => \&git_tree,
        "snapshot"          => \&git_snapshot,
        "object"            => \&git_object,
        # those below don't need $project
        "opml"              => \&git_opml,
        "project_list"      => \&git_project_list,
        "project_index"     => \&git_project_index,
);
803
# extra_options ('opt') values that are accepted, each mapped to the list of
# actions that allow it
our %allowed_options = (
        "--no-merges" => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
);
809
# Populate %input_params from the CGI query string.  Every parameter is
# stored as a single decoded value, except the one whose CGI key is 'opt',
# which may be given several times and is therefore stored as an array
# reference.  Should more multi-valued parameters appear, a list of them
# would be better than singling this one out.
sub evaluate_query_params {
        our $cgi;

        foreach my $name (keys %cgi_param_mapping) {
                my $symbol = $cgi_param_mapping{$name};
                $input_params{$name} = ($symbol eq 'opt')
                        ? [ map { decode_utf8($_) } $cgi->param($symbol) ]
                        : decode_utf8($cgi->param($symbol));
        }
}
825
# Read PATH_INFO and fill in those %input_params that were not given in the
# query string.  Understood layout (after the project path):
#   [$action/][$hash_parent_base[:$file_parent]..]$hash_base[:$file_name]
# plus, for the snapshot action, $hash followed by a snapshot suffix.
# Does nothing if the project was already given as a CGI parameter; stops
# after setting the project if an action was given in the query string.
# Strips leading slashes (and the recognized prefix) from the global
# $path_info as a side effect.
sub evaluate_path_info {
        return if defined $input_params{'project'};
        return if !$path_info;
        $path_info =~ s,^/+,,;
        return if !$path_info;

        # find which part of PATH_INFO is project
        my $project = $path_info;
        $project =~ s,/+$,,;
        while ($project && !check_head_link("$projectroot/$project")) {
                $project =~ s,/*[^/]*$,,;
        }
        return unless $project;
        $input_params{'project'} = $project;

        # do not change any parameters if an action is given using the query string
        return if $input_params{'action'};
        $path_info =~ s,^\Q$project\E/*,,;

        # next, check if we have an action
        my $action = $path_info;
        $action =~ s,/.*$,,;
        if (exists $actions{$action}) {
                $path_info =~ s,^\Q$action\E/*,,;
                $input_params{'action'} = $action;
        }

        # list of actions that want hash_base instead of hash, but can have no
        # pathname (f) parameter
        my @wants_base = (
                'tree',
                'history',
        );

        # we want to catch, among others
        # [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
        my ($parentrefname, $parentpathname, $refname, $pathname) =
                ($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

        # first, analyze the 'current' part
        if (defined $pathname) {
                # we got "branch:filename" or "branch:dir/"
                # we could use git_get_type(branch:pathname), but:
                # - it needs $git_dir
                # - it does a git() call
                # - the convention of terminating directories with a slash
                #   makes it superfluous
                # - embedding the action in the PATH_INFO would make it even
                #   more superfluous
                $pathname =~ s,^/+,,;
                if (!$pathname || substr($pathname, -1) eq "/") {
                        $input_params{'action'} ||= "tree";
                        $pathname =~ s,/$,,;
                } else {
                        # the default action depends on whether we had parent info
                        # or not
                        if ($parentrefname) {
                                $input_params{'action'} ||= "blobdiff_plain";
                        } else {
                                $input_params{'action'} ||= "blob_plain";
                        }
                }
                $input_params{'hash_base'} ||= $refname;
                $input_params{'file_name'} ||= $pathname;
        } elsif (defined $refname) {
                # we got "branch". In this case we have to choose if we have to
                # set hash or hash_base.
                #
                # Most of the actions without a pathname only want hash to be
                # set, except for the ones specified in @wants_base that want
                # hash_base instead. It should also be noted that hand-crafted
                # links having 'history' as an action and no pathname or hash
                # set will fail, but that happens regardless of PATH_INFO.
                if (defined $parentrefname) {
                        # if there is parent let the default be 'shortlog' action
                        # (for http://git.example.com/repo.git/A..B links); if there
                        # is no parent, dispatch will detect type of object and set
                        # action appropriately if required (if action is not set)
                        $input_params{'action'} ||= "shortlog";
                }
                if ($input_params{'action'} &&
                    grep { $_ eq $input_params{'action'} } @wants_base) {
                        $input_params{'hash_base'} ||= $refname;
                } else {
                        $input_params{'hash'} ||= $refname;
                }
        }

        # next, handle the 'parent' part, if present
        if (defined $parentrefname) {
                # a missing pathspec defaults to the 'current' filename, allowing e.g.
                # someproject/blobdiff/oldrev..newrev:/filename
                if ($parentpathname) {
                        $parentpathname =~ s,^/+,,;
                        $parentpathname =~ s,/$,,;
                        $input_params{'file_parent'} ||= $parentpathname;
                } else {
                        $input_params{'file_parent'} ||= $input_params{'file_name'};
                }
                # we assume that hash_parent_base is wanted if a path was specified,
                # or if the action wants hash_base instead of hash
                # (the action may still be unset here, e.g. for "A..", so it is
                # checked for definedness before being compared)
                if (defined $input_params{'file_parent'} ||
                        (defined $input_params{'action'} &&
                         grep { $_ eq $input_params{'action'} } @wants_base)) {
                        $input_params{'hash_parent_base'} ||= $parentrefname;
                } else {
                        $input_params{'hash_parent'} ||= $parentrefname;
                }
        }

        # for the snapshot action, we allow URLs in the form
        # $project/snapshot/$hash.ext
        # where .ext determines the snapshot and gets removed from the
        # passed $refname to provide the $hash.
        #
        # To be able to tell that $refname includes the format extension, we
        # require the following two conditions to be satisfied:
        # - the hash input parameter MUST have been set from the $refname part
        #   of the URL (i.e. they must be equal)
        # - the snapshot format MUST NOT have been defined already (e.g. from
        #   CGI parameter sf)
        # It's also useless to try any matching unless $refname has a dot,
        # so we check for that too
        if (defined $input_params{'action'} &&
                $input_params{'action'} eq 'snapshot' &&
                defined $refname && index($refname, '.') != -1 &&
                defined $input_params{'hash'} &&
                $refname eq $input_params{'hash'} &&
                !defined $input_params{'snapshot_format'}) {
                # We loop over the known snapshot formats, checking for
                # extensions. Allowed extensions are both the defined suffix
                # (which includes the initial dot already) and the snapshot
                # format key itself, with a prepended dot.
                #
                # The loop is left early on a match, so it iterates over
                # keys() rather than each(): an abandoned each() iterator
                # would make the next request served by the same process
                # resume in the middle of the hash and miss formats.
                foreach my $fmt (keys %known_snapshot_formats) {
                        my $opt = $known_snapshot_formats{$fmt};
                        my $hash = $refname;
                        unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
                                next;
                        }
                        my $sfx = $1;
                        # a valid suffix was found, so set the snapshot format
                        # and reset the hash parameter
                        $input_params{'snapshot_format'} = $fmt;
                        $input_params{'hash'} = $hash;
                        # we also set the format suffix to the one requested
                        # in the URL: this way a request for e.g. .tgz returns
                        # a .tgz instead of a .tar.gz
                        $known_snapshot_formats{$fmt}{'suffix'} = $sfx;
                        last;
                }
        }
}
976
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp);

# Copy the collected %input_params into the per-request globals declared
# above, validating each of them; an invalid value ends the request through
# die_error() (400, or 404 for an unknown project, 403 for a too short
# search text).  Every global is (re)assigned on each call so that nothing
# leaks from a previous request when the process serves more than one.
sub evaluate_and_validate_params {
        our $action = $input_params{'action'};
        if (defined $action && !validate_action($action)) {
                die_error(400, "Invalid action parameter");
        }

        # parameters which are pathnames
        our $project = $input_params{'project'};
        if (defined $project && !validate_project($project)) {
                undef $project;
                die_error(404, "No such project");
        }

        our $file_name = $input_params{'file_name'};
        if (defined $file_name && !validate_pathname($file_name)) {
                die_error(400, "Invalid file parameter");
        }

        our $file_parent = $input_params{'file_parent'};
        if (defined $file_parent && !validate_pathname($file_parent)) {
                die_error(400, "Invalid file parent parameter");
        }

        # parameters which are refnames
        our $hash = $input_params{'hash'};
        if (defined $hash && !validate_refname($hash)) {
                die_error(400, "Invalid hash parameter");
        }

        our $hash_parent = $input_params{'hash_parent'};
        if (defined $hash_parent && !validate_refname($hash_parent)) {
                die_error(400, "Invalid hash parent parameter");
        }

        our $hash_base = $input_params{'hash_base'};
        if (defined $hash_base && !validate_refname($hash_base)) {
                die_error(400, "Invalid hash base parameter");
        }

        our @extra_options = @{$input_params{'extra_options'}};
        # @extra_options is always defined, since it can only be (currently) set from
        # CGI, and $cgi->param() returns the empty array in array context if the param
        # is not set
        foreach my $opt (@extra_options) {
                if (not exists $allowed_options{$opt}) {
                        die_error(400, "Invalid option parameter");
                }
                # an option is only valid together with an explicit action that
                # allows it; $action may be undefined at this point
                if (!defined $action ||
                    !grep { $_ eq $action } @{$allowed_options{$opt}}) {
                        die_error(400, "Invalid option parameter for this action");
                }
        }

        our $hash_parent_base = $input_params{'hash_parent_base'};
        if (defined $hash_parent_base && !validate_refname($hash_parent_base)) {
                die_error(400, "Invalid hash parent base parameter");
        }

        # other parameters
        our $page = $input_params{'page'};
        if (defined $page && $page =~ m/[^0-9]/) {
                die_error(400, "Invalid page parameter");
        }

        our $searchtype = $input_params{'searchtype'};
        if (defined $searchtype && $searchtype =~ m/[^a-z]/) {
                die_error(400, "Invalid searchtype parameter");
        }

        our $search_use_regexp = $input_params{'search_use_regexp'};

        our $searchtext = $input_params{'searchtext'};
        # reset explicitly: a bare "our $search_regexp;" would keep the value
        # computed for the previous request
        our $search_regexp = undef;
        if (defined $searchtext) {
                if (length($searchtext) < 2) {
                        die_error(403, "At least two characters are required for search parameter");
                }
                if ($search_use_regexp) {
                        $search_regexp = $searchtext;
                        # compile once just to check that the pattern is valid
                        if (!eval { qr/$search_regexp/; 1; }) {
                                (my $error = $@) =~ s/ at \S+ line \d+.*\n?//;
                                die_error(400, "Invalid search regexp '$search_regexp'",
                                          esc_html($error));
                        }
                } else {
                        $search_regexp = quotemeta $searchtext;
                }
        }
}
1088
# path to the current git repository: "$projectroot/$project";
# left as it was when no (true) $project is set
our $git_dir;
sub evaluate_git_dir {
        our $git_dir;
        if ($project) {
                $git_dir = "$projectroot/$project";
        }
}
1094
our (@snapshot_fmts, $git_avatar);

# Evaluate the features whose values are cached in globals:
# @snapshot_fmts (filtered list of snapshot formats) and $git_avatar.
sub configure_gitweb_features {
        # list of supported snapshot formats
        our @snapshot_fmts = gitweb_get_feature('snapshot');
        @snapshot_fmts = filter_snapshot_fmts(@snapshot_fmts);

        # The avatar feature must name a known provider whose dependencies
        # are available; otherwise $git_avatar is reset to the empty string.
        our ($git_avatar) = gitweb_get_feature('avatar');
        if ($git_avatar eq 'gravatar') {
                # gravatar needs Digest::MD5
                my $have_md5 = eval { require Digest::MD5; 1; };
                $git_avatar = '' unless ($have_md5);
        } elsif ($git_avatar ne 'picon') {
                # unknown provider ('picon' itself has no dependencies)
                $git_avatar = '';
        }
}
1114
# custom error handler, installed through CGI::Carp::set_message:
# a plain 'die <message>' is reported as Internal Server Error
sub handle_errors_html {
        my ($msg) = @_; # it is already HTML escaped

        # Replace this handler by a plain message first: should an error
        # occur inside die_error itself, handle_errors_html is not entered
        # again, which avoids an infinite loop.
        set_message("Error occured when inside die_error:\n$msg");

        # The subroutine set via CGI::Carp::set_message is called _after_
        # HTTP headers are already written, so die_error must neither write
        # them itself nor try to jump out (it is running as error handler).
        die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1129
# Pick a default action when none was requested, check that the action is
# known and has the project it needs, then call its handler from %actions.
sub dispatch {
        unless (defined $action) {
                if (defined $hash) {
                        # the action is the type of the requested object
                        $action = git_get_type($hash)
                                or die_error(404, "Object does not exist");
                } elsif (defined $hash_base && defined $file_name) {
                        $action = git_get_type("$hash_base:$file_name")
                                or die_error(404, "File or directory does not exist");
                } else {
                        $action = defined $project ? 'summary' : 'project_list';
                }
        }

        die_error(400, "Unknown action")
                unless defined($actions{$action});

        # only these actions can work without a project
        my $needs_project = $action !~ m/^(?:opml|project_list|project_index)$/;
        die_error(400, "Project needed")
                if $needs_project && !$project;

        $actions{$action}->();
}
1154
# Restart the per-request statistics: the start time $t0 (only when timing
# is in use, i.e. $t0 is defined) and the counter of git commands run.
sub reset_timer {
        our ($t0, $number_of_git_cmds);

        $t0 = [ gettimeofday() ]
                if defined $t0;
        $number_of_git_cmds = 0;
}
1160
our $first_request = 1;

# Serve a single request: reset statistics, (re)read configuration as
# needed, check the load, collect and validate parameters, then dispatch.
sub run_request {
        reset_timer();

        evaluate_uri();

        # the config file and the git version are read once per process
        if ($first_request) {
                evaluate_gitweb_config();
                evaluate_git_version();
        }

        # $per_request_config is either a code reference to call for each
        # request, or a true value asking to re-read the whole configuration
        # (which for the first request has just been done above)
        if (ref($per_request_config) eq 'CODE') {
                $per_request_config->();
        } elsif ($per_request_config && !$first_request) {
                evaluate_gitweb_config();
        }
        check_loadavg();

        # $projectroot and $projects_list might be set in gitweb config file
        $projects_list = $projectroot
                unless $projects_list;

        evaluate_query_params();
        evaluate_path_info();
        evaluate_and_validate_params();
        evaluate_git_dir();

        configure_gitweb_features();

        dispatch();
}
1191
# by default (plain CGI) every request is the last one of the process
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: requests are created through CGI::Fast and
# the process stops accepting requests after a fixed number of them.
sub configure_as_fcgi {
        require CGI::Fast;
        our $CGI = 'CGI::Fast';

        my $request_number = 0;
        # let each child service 100 requests; the check runs after a request
        # has been served, so the 100th call must already report "last"
        our $is_last_request = sub { ++$request_number >= 100 };
}
# Select FastCGI operation from the script name (*.fcgi) and from command
# line options:
#   --fastcgi | --fcgi | -f   run as FastCGI
#   --nproc=N | -n N          manage N processes with FCGI::ProcManager
#                             (silently ignored if the module is missing)
sub evaluate_argv {
        my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
        if ($script_name =~ /\.fcgi$/) {
                configure_as_fcgi();
        }

        return unless (@ARGV);

        # installs the hooks that run() invokes around listening/dispatching
        my $setup_proc_manager = sub {
                my ($arg, $val) = @_;
                return unless eval { require FCGI::ProcManager; 1; };
                my $proc_manager = FCGI::ProcManager->new({
                        n_processes => $val,
                });
                our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
                our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
                our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
        };

        require Getopt::Long;
        Getopt::Long::GetOptions(
                'fastcgi|fcgi|f' => \&configure_as_fcgi,
                'nproc|n=i'      => $setup_proc_manager,
        );
}
1226
# Main loop: configure from the command line, then create and serve request
# objects until the request source is exhausted or $is_last_request says so.
sub run {
        evaluate_argv();

        $first_request = 1;
        if ($pre_listen_hook) {
                $pre_listen_hook->();
        }

 REQUEST:
        while ($cgi = $CGI->new()) {
                if ($pre_dispatch_hook) {
                        $pre_dispatch_hook->();
                }

                run_request();

                if ($post_dispatch_hook) {
                        $post_dispatch_hook->();
                }
                $first_request = 0;

                if ($is_last_request->()) {
                        last REQUEST;
                }
        }

 DONE_GITWEB:
        1;
}
1251
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI) hand control back to
# the wrapper; as a pure CGI script, serving single request, just exit.
return if defined caller;
exit;
1262
1263 ## ======================================================================
1264 ## action links
1265
# Build a gitweb URL from named parameters (the long names listed in
# @cgi_param_mapping, e.g. project, action, hash, file_name).  The project
# defaults to the current $project.  When the 'pathinfo' feature (or
# -path_info) is on and a project is known, as many parameters as possible
# are encoded in the path part; the remaining ones go into the query string.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
sub href {
        my %params = @_;
        # default is to use -absolute url() i.e. $my_uri
        my $href = $params{-full} ? $my_url : $my_uri;

        # implicit -replay, must be first of implicit params
        $params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

        $params{'project'} = $project unless exists $params{'project'};

        if ($params{-replay}) {
                while (my ($name, $symbol) = each %cgi_param_mapping) {
                        if (!exists $params{$name}) {
                                $params{$name} = $input_params{$name};
                        }
                }
        }

        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if (defined $params{'project'} &&
            (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
                # try to put as many parameters as possible in PATH_INFO:
                #   - project name
                #   - action
                #   - hash_parent or hash_parent_base:/file_parent
                #   - hash or hash_base:/filename
                #   - the snapshot_format as an appropriate suffix

                # When the script is the root DirectoryIndex for the domain,
                # $href here would be something like http://gitweb.example.com/
                # Thus, we strip any trailing / from $href, to spare us double
                # slashes in the final URL
                $href =~ s,/$,,;

                # Then add the project name, if present
                $href .= "/".esc_path_info($params{'project'});
                delete $params{'project'};

                # since we destructively absorb parameters, we keep this
                # boolean that remembers if we're handling a snapshot
                # (links without an action are legal, so check definedness
                # before comparing)
                my $is_snapshot = defined $params{'action'} &&
                        $params{'action'} eq 'snapshot';

                # Summary just uses the project path URL, any other action is
                # added to the URL
                if (defined $params{'action'}) {
                        $href .= "/".esc_path_info($params{'action'})
                                unless $params{'action'} eq 'summary';
                        delete $params{'action'};
                }

                # Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
                # stripping nonexistent or useless pieces
                $href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
                        || $params{'hash_parent'} || $params{'hash'});
                if (defined $params{'hash_base'}) {
                        if (defined $params{'hash_parent_base'}) {
                                $href .= esc_path_info($params{'hash_parent_base'});
                                # skip the file_parent if it's the same as the file_name
                                if (defined $params{'file_parent'}) {
                                        if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
                                                delete $params{'file_parent'};
                                        } elsif ($params{'file_parent'} !~ /\.\./) {
                                                $href .= ":/".esc_path_info($params{'file_parent'});
                                                delete $params{'file_parent'};
                                        }
                                }
                                $href .= "..";
                                delete $params{'hash_parent'};
                                delete $params{'hash_parent_base'};
                        } elsif (defined $params{'hash_parent'}) {
                                $href .= esc_path_info($params{'hash_parent'}). "..";
                                delete $params{'hash_parent'};
                        }

                        $href .= esc_path_info($params{'hash_base'});
                        # a name containing '..' would be ambiguous in the
                        # path part, so it is left for the query string
                        if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
                                $href .= ":/".esc_path_info($params{'file_name'});
                                delete $params{'file_name'};
                        }
                        delete $params{'hash'};
                        delete $params{'hash_base'};
                } elsif (defined $params{'hash'}) {
                        $href .= esc_path_info($params{'hash'});
                        delete $params{'hash'};
                }

                # If the action was a snapshot, we can absorb the
                # snapshot_format parameter too
                if ($is_snapshot) {
                        my $fmt = $params{'snapshot_format'};
                        # snapshot_format should always be defined when href()
                        # is called, but just in case some code forgets, we
                        # fall back to the default
                        $fmt ||= $snapshot_fmts[0];
                        $href .= $known_snapshot_formats{$fmt}{'suffix'};
                        delete $params{'snapshot_format'};
                }
        }

        # now encode the parameters explicitly
        # (walking the array keeps the order of @cgi_param_mapping)
        my @result = ();
        for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
                my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
                if (defined $params{$name}) {
                        if (ref($params{$name}) eq "ARRAY") {
                                foreach my $par (@{$params{$name}}) {
                                        push @result, $symbol . "=" . esc_param($par);
                                }
                        } else {
                                push @result, $symbol . "=" . esc_param($params{$name});
                        }
                }
        }
        $href .= "?" . join(';', @result) if scalar @result;

        # final transformation: trailing spaces must be escaped (URI-encoded)
        $href =~ s/(\s+)$/CGI::escape($1)/e;

        if ($params{-anchor}) {
                $href .= "#".esc_param($params{-anchor});
        }

        return $href;
}
1395
1396
1397 ## ======================================================================
1398 ## validation, quoting/unquoting and escaping
1399
# returns the action name if it is a key of %actions, undef otherwise
sub validate_action {
        my ($input) = @_;

        return undef unless $input && exists $actions{$input};
        return $input;
}
1405
# Returns the project path if it is a valid pathname naming an existing
# directory under $projectroot that passes check_export_ok() and, with
# $strict_export, is present in the projects list; undef otherwise.
sub validate_project {
        my $input = shift;

        # test for definedness and length, not truth: "0" is a legal name
        return undef unless defined $input && length $input;

        if (!validate_pathname($input) ||
                !(-d "$projectroot/$input") ||
                !check_export_ok("$projectroot/$input") ||
                ($strict_export && !project_in_list($input))) {
                return undef;
        } else {
                return $input;
        }
}
1417
# Returns the pathname if it is acceptable, undef otherwise.  Rejected are
# undefined and empty values, paths with an empty, '.' or '..' component
# (which also covers leading, trailing and doubled slashes), and paths
# containing a NUL character.
sub validate_pathname {
        my $input = shift;

        # test for definedness and length, not truth: "0" is a legal name
        return undef unless defined $input && length $input;

        # no '.' or '..' as elements of path, i.e. no '.' nor '..'
        # at the beginning, at the end, and between slashes.
        # also this catches doubled slashes
        if ($input =~ m!(^|/)(|\.|\.\.)(/|$)!) {
                return undef;
        }
        # no null characters
        if ($input =~ m!\0!) {
                return undef;
        }
        return $input;
}
1433
# Returns the ref name if it is acceptable, undef otherwise.  A full
# 40-digit hexadecimal object name is always accepted; anything else must
# be a valid pathname and satisfy the checks below.
sub validate_refname {
        my $input = shift;

        # test for definedness and length, not truth: "0" is a legal name
        return undef unless defined $input && length $input;

        # textual hashes are O.K.
        if ($input =~ m/^[0-9a-fA-F]{40}$/) {
                return $input;
        }
        # it must be correct pathname
        $input = validate_pathname($input)
                or return undef;
        # restrictions on ref name according to git-check-ref-format
        if ($input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!) {
                return undef;
        }
        return $input;
}
1450
# Turn a sequence of octets into Perl's internal character string.
# Input that already is a character string, or that decodes as UTF-8,
# is returned as such; anything else is decoded using $fallback_encoding.
# (gitweb writes out in utf-8 thanks to "binmode STDOUT, ':utf8'" at
# beginning.)
sub to_utf8 {
        my ($str) = @_;
        defined $str
                or return undef;

        return $str
                if utf8::is_utf8($str) || utf8::decode($str);
        return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
}
1464
# Escape a value for use in a query string.  The slash is kept as is even
# though that's not correct: quoted slashes look too horrible in bookmarks.
# Spaces become '+'.
sub esc_param {
        my ($str) = @_;
        defined $str
                or return undef;

        $str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
        $str =~ tr/ /+/;
        return $str;
}
1474
# Quote a string for use in the path_info fragment of an URL.  The rules
# are slightly different from those for query parameters: path_info does
# not treat '+' as space (specially), so both '+' and space are left
# alone, but '?' must be escaped.
# Returns undef for an undefined argument.
sub esc_path_info {
        my ($fragment) = @_;

        defined $fragment or return undef;

        $fragment =~ s{([^A-Za-z0-9\-_.~();\/;:@&= +]+)}{CGI::escape($1)}eg;

        return $fragment;
}
1485
# Quote unsafe characters in a whole URL.  Because the argument is a
# complete URL, the characters that structure it (such as '/', '?', ':',
# '&' and '=') cannot be quoted and are left alone; spaces become '+'.
# Returns undef for an undefined argument.
sub esc_url {
        my ($url) = @_;

        defined $url or return undef;

        $url =~ s{([^A-Za-z0-9\-_.~();\/;?:@&= ]+)}{CGI::escape($1)}eg;
        $url =~ tr/ /+/;

        return $url;
}
1494
# Quote unsafe characters for use in an HTML attribute value.
# This simply hands all of its arguments to esc_html(): for XHTML
# conformance escaping '"' to '&quot;' is not enough.
sub esc_attr {
        my @args = @_;

        return esc_html(@args);
}
1501
# Escape a string for output as HTML text.
# The string is first converted with to_utf8() and then run through
# $cgi->escapeHTML().  With the option -nbsp => 1 every space is turned
# into '&nbsp;'.  Finally each control character except TAB is replaced by
# its quot_cec() representation.
# Returns undef for an undefined string.
sub esc_html {
        my ($text, %opts) = @_;

        return undef unless defined $text;

        my $html = to_utf8($text);
        $html = $cgi->escapeHTML($html);
        $html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $html =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;

        return $html;
}
1517
# Escape a filename for output as HTML text.
# Works like esc_html() (to_utf8(), $cgi->escapeHTML(), optional
# -nbsp => 1 turning spaces into '&nbsp;'), except that every control
# character, TAB included, is replaced by its quot_cec() representation.
# Returns undef for an undefined filename.
sub esc_path {
        my ($name, %opts) = @_;

        return undef unless defined $name;

        my $html = to_utf8($name);
        $html = $cgi->escapeHTML($html);
        $html =~ s/ /&nbsp;/g if $opts{'-nbsp'};
        $html =~ s|([[:cntrl:]])|quot_cec($1)|eg;

        return $html;
}
1533
# Sanitize a string for use in XHTML served as application/xhtml+xml
# (valid XML 1.0): the string is converted with to_utf8() and every
# control character other than TAB, LF and CR is replaced by its
# quot_cec() representation.  No HTML escaping is done here.
# Returns undef for an undefined string.
sub sanitize {
        my ($text) = @_;

        return undef unless defined $text;

        my $clean = to_utf8($text);
        $clean =~ s|([[:cntrl:]])|($1 =~ /[\t\n\r]/ ? $1 : quot_cec($1))|eg;

        return $clean;
}
1544
# Make a control character "printable", using character escape codes (CEC).
#
# Parameters:
#   $cntrl            - the (single) character to represent
#   -nohtml => BOOL   - when true, return the bare escape code; otherwise
#                       the code is wrapped in <span class="cntrl">...</span>
#
# Characters with a well-known C-style escape are shown as that escape
# ('\t', '\n', ...); every other character is shown as a backslash
# followed by its code in hexadecimal, zero-padded to at least two digits
# (e.g. '\01', '\7f').
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # '%02x' rather than '%2x': the latter pads with a space, which
        # rendered e.g. chr(1) as '\ 1'
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1569
# Alternative to quot_cec(): represent a control character by a numeric
# character reference to its Unicode "control picture", i.e. its Unicode
# "printable representation" (PR).
#
# Parameters:
#   $cntrl            - the (single) character to represent
#   -nohtml => BOOL   - when true, return the bare character reference;
#                       otherwise it is wrapped in <span class="cntrl">
#
# The pictures for the C0 controls are at U+2400 + code.  DELETE (0x7f)
# does not follow that rule, its picture is U+2421, so it is special-cased.
# Other characters keep the plain "0x2400 + code" arithmetic.
sub quot_upr {
        my $cntrl = shift;
        my %opts = @_;

        my $code = ord($cntrl);
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1583
# git may return quoted and escaped filenames

# Helper for unquote(): translate what followed a backslash into the
# character it stands for.  One to three octal digits give the character
# with that code, a known C escape letter gives its control character, and
# anything else is a quoted ordinary character that stands for itself.
sub unq {
        my ($escaped) = @_;
        my %es = ( # character escape codes, aka escape sequences
                't' => "\t",   # tab            (HT, TAB)
                'n' => "\n",   # newline        (NL)
                'r' => "\r",   # return         (CR)
                'f' => "\f",   # form feed      (FF)
                'b' => "\b",   # backspace      (BS)
                'a' => "\a",   # alarm (bell)   (BEL)
                'e' => "\e",   # escape         (ESC)
                'v' => "\013", # vertical tab   (VT)
        );

        # octal char sequence
        return chr(oct($escaped)) if $escaped =~ m/^[0-7]{1,3}$/;

        # C escape sequence, or else a quoted ordinary character
        return exists $es{$escaped} ? $es{$escaped} : $escaped;
}

# Undo the quoting of a filename: when the name is enclosed in double
# quotes, the quotes are dropped and every backslash escape inside is
# expanded with unq().  Names without enclosing quotes are returned as is.
sub unquote {
        my ($name) = @_;

        # only names wrapped in double quotes need unquoting
        return $name unless $name =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}
1619
# escape tabs (convert tabs to spaces)
# Each tab is replaced, from left to right, by as many spaces as are needed
# to reach the next multiple of 8 columns; positions are counted on the
# line as expanded so far.
sub untabify {
        my ($line) = @_;

        my $tab_at;
        while (($tab_at = index($line, "\t")) >= 0) {
                # a tab always advances by 1 to 8 columns
                my $padding = ' ' x (8 - ($tab_at % 8));
                substr($line, $tab_at, 1, $padding);
        }

        return $line;
}
1633
# Count the entries of the list returned by git_get_projects_list() whose
# 'path' equals $project.  The result is 0 (false) when the list is empty
# or holds no such entry.
sub project_in_list {
        my ($project) = @_;

        my @projects = git_get_projects_list();
        my $matches = grep { $_->{'path'} eq $project } @projects;

        return $matches;
}
1639
1640 ## ----------------------------------------------------------------------
1641 ## HTML aware string manipulation
1642
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
# Parameters:
#   $str     - string to shorten (converted with to_utf8() first, so that
#              we don't cut in the middle of a utf8 multibyte char)
#   $len     - number of characters to keep
#   $add_len - how many extra word characters may be kept to avoid cutting
#              a word (a false value, including 0, selects the default 10)
#   $where   - which part is replaced by the filler:
#              'left' | 'center' | 'right' (default 'right')
#
# Returns the possibly shortened string.  Whenever the string cannot be
# split as requested (e.g. it contains a newline, which '.' does not
# match, or in 'center' mode too little is left for the right-hand part)
# the whole string is returned instead of a result built from stale
# capture variables.
sub chop_str {
        my $str = shift;
        my $len = shift;
        my $add_len = shift || 10;
        my $where = shift || 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # when chopping in the middle, distribute $len into left and right part
        # return early if chopping wouldn't make string shorter
        if ($where eq 'center') {
                return $str if ($len + 5 >= length($str)); # filler is length 5
                $len = int($len/2);
        } else {
                return $str if ($len + 4 >= length($str)); # filler is length 4
        }

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        if ($where eq 'left') {
                return $str unless $str =~ m/^(.*?)($begre)$/;
                my ($lead, $body) = ($1, $2);
                if (length($lead) > 4) {
                        $lead = " ...";
                }
                return "$lead$body";

        } elsif ($where eq 'center') {
                return $str unless $str =~ m/^($endre)(.*)$/;
                my ($left, $rest) = ($1, $2);
                # a failed match would leave $1 and $2 holding $left and
                # $rest from the match above, so it must not go unnoticed
                return $str unless $rest =~ m/^(.*?)($begre)$/;
                my ($mid, $right) = ($1, $2);
                if (length($mid) > 5) {
                        $mid = " ... ";
                }
                return "$left$mid$right";

        } else {
                return $str unless $str =~ m/^($endre)(.*)$/;
                my ($body, $tail) = ($1, $2);
                if (length($tail) > 4) {
                        $tail = "... ";
                }
                return "$body$tail";
        }
}
1702
# Takes the same arguments as chop_str and returns the chopped string
# HTML-escaped with esc_html().  If chopping changed the string, the result
# is additionally wrapped in a <span> whose title attribute holds the whole
# string, with control characters replaced by '?'.
sub chop_and_escape_str {
        my ($full) = @_;

        my $short = chop_str(@_);
        $full = to_utf8($full);

        # nothing was chopped off, so no tooltip is needed
        return esc_html($short) if $short eq $full;

        (my $title = $full) =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$title}, esc_html($short));
}
1718
1719 ## ----------------------------------------------------------------------
1720 ## functions returning short strings
1721
# CSS class for given age value (in seconds):
# "noage" when the age is undefined, "age0" below two hours,
# "age1" below two days, and "age2" for anything older.
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1736
# convert age in seconds to "nn units ago" string
# The largest unit of which the age spans more than two is used (years,
# months, weeks, days, hours, min, sec) and the count is truncated to an
# integer; an age of at most two seconds gives " right now".
sub age_string {
        my ($age) = @_;

        return int($age/60/60/24/365) . " years ago"
                if $age > 60*60*24*365*2;
        return int($age/60/60/24/(365/12)) . " months ago"
                if $age > 60*60*24*(365/12)*2;
        return int($age/60/60/24/7) . " weeks ago"
                if $age > 60*60*24*7*2;
        return int($age/60/60/24) . " days ago"
                if $age > 60*60*24*2;
        return int($age/60/60) . " hours ago"
                if $age > 60*60*2;
        return int($age/60) . " min ago"
                if $age > 60*2;
        return int($age) . " sec ago"
                if $age > 2;

        return " right now";
}
1768
# file type bits used in addition to the S_IF* constants from Fcntl
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# submodule/subproject, a commit object reference
# True when the file type bits of $mode (a number, not an octal string)
# are exactly S_IFGITLINK.
sub S_ISGITLINK {
        my ($mode) = @_;

        my $type_bits = $mode & S_IFMT();
        return $type_bits == S_IFGITLINK;
}
1780
# convert file mode in octal to symbolic file mode string
# The argument is a string of octal digits.  The result is a fixed string
# per file type (submodule, directory, symlink); for regular files there
# are two, chosen by the owner-executable bit; everything else gives
# '----------'.
sub mode_str {
        my ($octal) = @_;
        my $mode = oct $octal;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT());
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1802
# convert file mode in octal to file type string
# An argument that is not made up of octal digits only is returned
# unchanged; otherwise the result is one of "submodule", "directory",
# "symlink", "file" or "unknown".
sub file_type {
        my ($mode) = @_;

        # not an octal mode: hand it back as it is
        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT());
        return "symlink"   if S_ISLNK($mode);
        return "file"      if S_ISREG($mode);
        return "unknown";
}
1825
# convert file mode in octal to file type description string
# An argument that is not made up of octal digits only is returned
# unchanged; otherwise the result is one of "submodule", "directory",
# "symlink", "executable" (regular file with the owner-executable bit),
# "file" or "unknown".
sub file_type_long {
        my ($mode) = @_;

        # not an octal mode: hand it back as it is
        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT());
        return "symlink"   if S_ISLNK($mode);
        return "unknown"   unless S_ISREG($mode);

        return ($mode & S_IXUSR) ? "executable" : "file";
}
1852
1853
1854 ## ----------------------------------------------------------------------
1855 ## functions returning short HTML fragments, or transforming HTML fragments
1856 ## which don't belong to other sections
1857
# format line of commit message.
# The line is escaped with esc_html() (spaces become '&nbsp;'), and then
# every word made of 8 to 40 hexadecimal digits is turned into a link to
# the "object" action for that hash.
sub format_log_line_html {
        my ($line) = @_;

        my $html = esc_html($line, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                my $sha = $1;
                $cgi->a({-href => href(action=>"object", hash=>$sha),
                         -class => "text"}, $sha);
        }eg;

        return $html;
}
1870
# format marker of refs pointing to given object
#
# Parameters:
#   $refs - hash reference mapping object id to an array reference of ref
#           names (e.g. "tags/v2.6.11", "heads/next"; a trailing "^{}"
#           marks an indirect ref).  It is only read, never modified.
#   $id   - id of the object to format the markers for
#
# Returns an HTML fragment (' <span class="refs">...</span>'), or the
# empty string when no ref points to the object.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $full_ref (@{$refs->{$id}}) {
                        # Work on a copy: the loop variable is an alias for
                        # the element of the caller's array, and stripping
                        # the "^{}" suffix from it directly would make the
                        # ref look like a direct one on the next call.
                        my $ref = $full_ref;

                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my ($type, $name);
                        my $indirect = ($ref =~ s/\^\{\}$//);
                        # e.g. tags/v2.6.11 or heads/next
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                $type = $1;
                                $name = $2;
                        } else {
                                $type = "ref";
                                $name = $ref;
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, $name);

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1930
# format, perhaps shortened and with markers, title line
# Produces a link to $href with class "list subject", followed by $extra
# (if any).  When $short is shorter than $long, the link text is $short
# and the whole subject, with control characters replaced by '?', goes
# into the title attribute; otherwise the link text is $long.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my %attr = (-href => $href, -class => "list subject");
        my $text = $long;

        if (length($short) < length($long)) {
                $long =~ s/[[:cntrl:]]/?/g;
                $attr{-title} = to_utf8($long);
                $text = $short;
        }

        return $cgi->a(\%attr, esc_html($text)) . $extra;
}
1946
# Rather than recomputing the url for an email multiple times, we cache it
# after the first hit. This gives a visible benefit in views where the avatar
# for the same email is used repeatedly (e.g. shortlog).
# The cache is shared by all avatar engines (currently gravatar only), which
# are free to use it as preferred. Since only one avatar engine is used for any
# given page, there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased and split at '@' into user and domain; the
# resulting url is kept in %avatar_cache under the lowercased email.
sub picon_url {
        my $email = lc shift;

        return $avatar_cache{$email} if $avatar_cache{$email};

        my ($user, $domain) = split('@', $email);
        my $url = "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                  "$domain/$user/" .
                  "users+domains+unknown/up/single";
        $avatar_cache{$email} = $url;

        return $avatar_cache{$email};
}
1968
# Compute the gravatar url for a given email, if it's not in the cache already.
# Gravatar stores only the part of the URL before the size, since that's the
# one computationally more expensive. This also allows reuse of the cache for
# different sizes (for this particular engine).
# The email is lowercased before it is hashed and used as the cache key;
# $size is appended to the cached prefix on every call.
sub gravatar_url {
        my ($address, $size) = @_;
        my $email = lc $address;

        unless ($avatar_cache{$email}) {
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" .
                        Digest::MD5::md5_hex($email) . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1981
# Insert an avatar for the given $email at the given $size if the feature
# is enabled.
# Options: -size selects an entry of %avatar_size (falling back to
# 'default'); -pad_before / -pad_after put a '&nbsp;' before / after the
# image.  Returns the <img> element, or the empty string when the
# configured provider ($git_avatar) yields no url.
sub git_get_avatar {
        my ($email, %opts) = @_;

        my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
        my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

        $opts{-size} ||= 'default';
        my $size = $avatar_size{$opts{-size}} || $avatar_size{'default'};

        # Other providers can be added by extending the if chain, defining $url
        # as needed. If no variant puts something in $url, we assume avatars
        # are completely disabled/unavailable.
        my $url = "";
        if ($git_avatar eq 'gravatar') {
                $url = gravatar_url($email, $size);
        } elsif ($git_avatar eq 'picon') {
                $url = picon_url($email);
        }
        return "" unless $url;

        my $img = "<img width=\"$size\" " .
                  "class=\"avatar\" " .
                  "src=\"" . esc_url($url) . "\" " .
                  "alt=\"\" " .
                  "/>";
        return $pre_white . $img . $post_white;
}
2010
# Wrap $displaytext in a link that searches for commits by $author.
# $searchtype ('author' or 'committer') selects the kind of search and the
# verb used in the link title.  When the 'search' feature is not enabled,
# $displaytext is returned as it is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;

        my $have_search = gitweb_check_feature('search');
        return $displaytext unless $have_search;

        my $performed = $searchtype eq 'author'    ? "authored"
                      : $searchtype eq 'committer' ? "committed"
                      :                              "";

        my %link_attr = (
                -href => href(action=>"search", hash=>$hash,
                              searchtext=>$author,
                              searchtype=>$searchtype),
                class => "list",
                title => "Search for commits $performed by $author",
        );

        return $cgi->a(\%link_attr, $displaytext);
}
2033
# format the author name of the given commit with the given tag
# the author name is chopped and escaped according to the other
# optional parameters (see chop_str).
# The element gets class "author" and holds the avatar (padded after)
# followed by the name, both passed through format_search_author().
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
        my $avatar    = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $content   = format_search_author($co->{'author_name'}, "author",
                                             $avatar . $name_html);

        return "<$tag class=\"author\">" . $content . "</$tag>";
}
2047
# format git diff header line, i.e. "diff --(git|combined|cc) ..."
# Everything after the "diff <type> " prefix is replaced by the escaped
# file name(s) taken from $from and $to, each one linked when that side
# has a 'href'.  A combined diff ($diffinfo->{'nparents'} is true) shows
# only the $to name; an ordinary diff shows "a/<from> b/<to>".
# The result is wrapped in <div class="diff header">.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                  esc_path($to->{'file'}))
                        : esc_path($to->{'file'}); # file was deleted (no href)
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $from->{'href'}
                        ? $cgi->a({-href => $from->{'href'}, -class => "path"},
                                  'a/' . esc_path($from->{'file'}))
                        : 'a/' . esc_path($from->{'file'}); # file was added (no href)
                $line .= ' ';
                $line .= $to->{'href'}
                        ? $cgi->a({-href => $to->{'href'}, -class => "path"},
                                  'b/' . esc_path($to->{'file'}))
                        : 'b/' . esc_path($to->{'file'}); # file was deleted
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2083
# format extended diff header line, before patch itself
#
# Parameters:
#   $line     - one extended header line as output by git
#   $diffinfo - parsed diff info; 'nparents', 'from_id' and 'to_id' are used
#   $from/$to - hash references with 'file' and (optionally) 'href' for the
#               two sides; for a combined diff $from->{'href'} and
#               $diffinfo->{'from_id'} are indexed per parent
#
# Returns the line with paths and hashes turned into links where a 'href'
# is available, a file type note appended after a trailing mode, and
# "<br/>\n" at the end.
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        # (without a href the escaped name is shown as plain text, so that
        # the path removed by the substitution is not lost)
        if ($line =~ s!^((copy|rename) from ).*$!$1!) {
                if ($from->{'href'}) {
                        $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                         esc_path($from->{'file'}));
                } elsif (defined $from->{'file'}) {
                        $line .= esc_path($from->{'file'});
                }
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1!) {
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                         esc_path($to->{'file'}));
                } elsif (defined $to->{'file'}) {
                        $line .= esc_path($to->{'file'});
                }
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                $line = 'index ';
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                # the ids are data, not patterns: match them literally
                $line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2149
# format from-file/to-file diff header
# Takes the "--- ..." and "+++ ..." lines of a patch and returns them as
# <div class="diff from_file"> / <div class="diff to_file"> elements.
# For an ordinary diff the names after "a/" and "b/" are replaced by the
# escaped names from $from and $to, linked when a 'href' is present.
# For a combined diff one from-file line is produced per parent, made of a
# numbered link to the blobdiff against that parent and a link to the file
# in that parent, or "--- /dev/null" when the parent has no 'href'.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my @divs;

        #assert($from_line =~ m/^---/) if DEBUG;
        if (! $diffinfo->{'nparents'}) {
                # ordinary (single parent) diff
                my $line = $from_line;
                # no extra formatting for "^--- /dev/null"
                if ($line =~ m!^--- "?a/!) {
                        $line = '--- a/' .
                                ($from->{'href'}
                                 ? $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                           esc_path($from->{'file'}))
                                 : esc_path($from->{'file'}));
                }
                push @divs, qq!<div class="diff from_file">$line</div>\n!;

        } else {
                # combined diff (merge commit)
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $line = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                my $nr = $i + 1;
                                my $diff_link =
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . $nr},
                                                $nr);
                                my $file_link =
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                                $line = '--- ' . $diff_link . '/' . $file_link;
                        }
                        push @divs, qq!<div class="diff from_file">$line</div>\n!;
                }
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        my $line = $to_line;
        # no extra formatting for "^+++ /dev/null"
        if ($line =~ m!^\+\+\+ "?b/!) {
                $line = '+++ b/' .
                        ($to->{'href'}
                         ? $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                   esc_path($to->{'file'}))
                         : esc_path($to->{'file'}));
        }
        push @divs, qq!<div class="diff to_file">$line</div>\n!;

        return join('', @divs);
}
2215
# create note for patch simplified by combined diff
# Returns a "diff --cc <file>" header div followed by a
# <div class="diff nodifferences"> saying "Simple merge".  The file name is
# a link to its blob unless is_deleted() says the file was deleted.
sub format_diff_cc_simplified {
        my ($diffinfo, @parents) = @_;

        my $name_html;
        if (is_deleted($diffinfo)) {
                $name_html = esc_path($diffinfo->{'to_file'});
        } else {
                $name_html = $cgi->a({-href => href(action=>"blob",
                                                    hash_base=>$hash,
                                                    hash=>$diffinfo->{'to_id'},
                                                    file_name=>$diffinfo->{'to_file'}),
                                      -class => "path"},
                                     esc_path($diffinfo->{'to_file'}));
        }

        return "<div class=\"diff header\">" .
               "diff --cc " .
               $name_html .
               "</div>\n" . # class="diff header"
               "<div class=\"diff nodifferences\">" .
               "Simple merge" .
               "</div>\n"; # class="diff nodifferences"
}
2240
# Return the CSS class for a line of patch body: "chunk_header",
# "incomplete" (line starting with a backslash), "ctx", "add" or "rem";
# the empty string when nothing matches.
# An ordinary diff has one sign column; when $from->{'href'} is an array
# reference (combined diff) there are as many sign columns as it has
# elements.
sub diff_line_class {
        my ($line, $from, $to) = @_;

        my $num_sign = ($from && $to && ref($from->{'href'}) eq "ARRAY")
                ? scalar @{$from->{'href'}}
                : 1;

        return "chunk_header" if $line =~ m/^\@\@{$num_sign} /;
        return "incomplete"   if $line =~ m/^\\/;
        # context must be tested before add/rem, or we would have to use
        # more complicated regexps for those two
        return "ctx"          if $line =~ m/^ {$num_sign}/;
        return "add"          if $line =~ m/^[+ ]{$num_sign}/;
        return "rem"          if $line =~ m/^[- ]{$num_sign}/;

        # fallback
        return "";
}
2269
# Format a chunk header line of a unified diff as HTML.
#
# Assumes that $from and $to are defined and correctly filled, and that
# $line really is a chunk header ("@@ -a,b +c,d @@ section").
# The "-a,b" and "+c,d" ranges become links to "<href>#l<start>" when the
# corresponding $from->{'href'} / $to->{'href'} is set; the trailing
# section text is escaped with esc_html().
# Returns the HTML string.
sub format_unidiff_chunk_header {
	my ($line, $from, $to) = @_;

	# the line counts are captured by the pattern but not needed here
	my ($from_text, $from_start, undef, $to_text, $to_start, undef, $section) =
		$line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;

	my $from_href = $from->{'href'};
	if ($from_href) {
		$from_text = $cgi->a({-href  => "${from_href}#l${from_start}",
		                      -class => "list"}, $from_text);
	}
	my $to_href = $to->{'href'};
	if ($to_href) {
		$to_text = $cgi->a({-href  => "${to_href}#l${to_start}",
		                    -class => "list"}, $to_text);
	}

	return '<span class="chunk_info">@@ ' . $from_text . ' ' . $to_text . ' @@</span>' .
	       '<span class="section">' . esc_html($section, -nbsp=>1) . '</span>';
}
2293
# Format a chunk header line of a combined diff as HTML.
#
# Assumes that $from and $to are defined and correctly filled, and that
# $line is a combined diff chunk header ("@@@ -a,b -c,d +e,f @@@ section").
# All ranges but the last are paired, by position, with the entries of
# $from->{'href'}; the last range is paired with $to->{'href'}.  A range
# whose href is set becomes a link to "<href>#l<start>".
# Returns the HTML string.
sub format_cc_diff_chunk_header {
	my ($line, $from, $to) = @_;

	my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;

	# split "-a,b -c,d +e,f" into range texts and their starting lines;
	# the starting line is what follows the sign, up to the comma
	my @range_text = split(' ', $ranges);
	my @range_start;
	foreach my $range (@range_text) {
		my ($start) = split(',', substr($range, 1));
		push @range_start, $start;
	}

	# the last range describes the result, the others the parents
	my $to_text  = pop @range_text;
	my $to_start = pop @range_start;

	my $html = "<span class=\"chunk_info\">$prefix ";
	foreach my $idx (0 .. $#range_text) {
		my $parent_href = $from->{'href'}[$idx];
		$html .= $parent_href
			? $cgi->a({-href  => "${parent_href}#l$range_start[$idx]",
			           -class => "list"}, $range_text[$idx])
			: $range_text[$idx];
		$html .= " ";
	}

	my $to_href = $to->{'href'};
	$html .= $to_href
		? $cgi->a({-href  => "${to_href}#l${to_start}",
		           -class => "list"}, $to_text)
		: $to_text;

	$html .= " $prefix</span>" .
	         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
	return $html;
}
2332
# Process one patch (diff) line; not to be used for diff headers.
#
# Parameters:
#   $line      - raw patch line
#   $from, $to - optional hashrefs passed on to the classifier and to the
#                chunk header formatters
# Returns a two-element list: the class from diff_line_class() and the
# HTML-formatted (but not wrapped) line.
sub process_diff_line {
	my ($line, $from, $to) = @_;

	# classification is done on the line as received
	my $diff_class = diff_line_class($line, $from, $to);

	chomp $line;
	$line = untabify($line);

	# chunk headers get links only when both sides are known
	if ($from && $to) {
		if ($line =~ m/^\@{2} /) {
			my $header = format_unidiff_chunk_header($line, $from, $to);
			return $diff_class, $header;
		}
		if ($line =~ m/^\@{3}/) {
			my $header = format_cc_diff_chunk_header($line, $from, $to);
			return $diff_class, $header;
		}
	}

	return $diff_class, esc_html($line, -nbsp=>1);
}
2355
# Generate snapshot link(s) for the tree/commit given by $hash.
#
# Depending on how many formats are in @snapshot_fmts, returns
#   - undef, when there are none,
#   - a single "snapshot" link whose tooltip names the format, i.e.
#     "_snapshot_", when there is exactly one,
#   - a parenthesized list of links bearing the format names, e.g.
#     "snapshot (_tar.gz_ _zip_)", when there are several.
sub format_snapshot_links {
	my ($hash) = @_;

	return undef unless @snapshot_fmts;

	if (@snapshot_fmts == 1) {
		my $fmt = $snapshot_fmts[0];
		return
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				),
				-title => "in format: $known_snapshot_formats{$fmt}{'display'}"
			}, "snapshot");
	}

	# more than one format: one link per format, labelled with its
	# display name
	my @links;
	foreach my $fmt (@snapshot_fmts) {
		push @links,
			$cgi->a({
				-href => href(
					action=>"snapshot",
					hash=>$hash,
					snapshot_format=>$fmt
				)
			}, $known_snapshot_formats{$fmt}{'display'});
	}
	return "snapshot (" . join(' ', @links) . ")";
}
2390
2391 ## ......................................................................
2392 ## functions returning values to be passed, perhaps after some
2393 ## transformation, to other functions; e.g. returning arguments to href()
2394
# Describe the feed link for the current view.
#
# Parameter: feed format name, defaulting to 'Atom'.
# Returns a hash (as a list) to be passed to href() to generate a gitweb
# URL, with keys 'action' (lowercased format), 'hash', 'file_name', and
# '-title' holding the description of the link.  Returns nothing when no
# project is selected or when the current action has no specific feed.
sub get_feed_info {
	my ($format) = @_;
	$format ||= 'Atom';

	# feed links are possible only for project views
	return unless (defined $project);
	# some views should link to OPML, or to generic project feed,
	# or don't have specific feed yet (so they should use generic)
	return if (!$action || $action =~ /^(?:tags|heads|forks|tag|search)$/x);

	# branch refs use the 'refs/heads/' prefix (fullname) to differentiate
	# them from tag links; $hash_base is consulted before $hash
	my $branch;
	foreach my $ref ($hash_base, $hash) {
		next unless defined $ref;
		if ($ref =~ m!^refs/heads/(.*)$!) {
			$branch = $1;
			last;
		}
	}

	# find log type for feed description (title)
	my $title;
	if (defined $file_name) {
		$title = "history of $file_name"
		       . ($action eq 'tree' ? "/" : "")
		       . (defined $branch ? " on '$branch'" : "");
	} elsif (defined $branch) {
		$title = "log of $branch";
	} else {
		$title = 'log';
	}

	my %res = (action => lc($format));
	$res{-title} = $title;
	$res{'hash'} = (defined $branch ? "refs/heads/$branch" : undef);
	$res{'file_name'} = $file_name;

	return %res;
}
2430
2431 ## ----------------------------------------------------------------------
2432 ## git utility subroutines, invoking git commands
2433
# Return, as a list, the path to the core git executable ($GIT) and the
# --git-dir parameter built from the current $git_dir.
# Every call is counted in $number_of_git_cmds.
sub git_cmd {
	$number_of_git_cmds++;
	return ($GIT, "--git-dir=$git_dir");
}
2439
# Quote the given arguments for passing them to the shell:
#   quote_command("command", "arg 1", "arg with ' and ! characters")
#   => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
# Each argument is wrapped in single quotes; every ' and ! inside it is
# taken out of the quotes and backslash-escaped.  The quoted arguments are
# joined with single spaces and returned as one string.
# Try to avoid using this function wherever possible.
sub quote_command {
	my @quoted;
	foreach my $arg (@_) {
		# work on a copy, so the caller's values are left untouched
		(my $escaped = $arg) =~ s/(['!])/'\\$1'/g;
		push @quoted, "'$escaped'";
	}
	return join(' ', @quoted);
}
2448
# Get the HEAD ref of the given project as a hash.
# Shorthand for git_get_full_hash($project, 'HEAD').
sub git_get_head_hash {
	my ($project) = @_;
	return git_get_full_hash($project, 'HEAD');
}
2453
# Resolve a revision to a hash; all arguments are handed to
# git_get_hash() unchanged, with no extra options added.
sub git_get_full_hash {
	my @args = @_;
	return git_get_hash(@args);
}
2457
# Resolve a revision to a shortened hash: the arguments are handed to
# git_get_hash() with '--short=7' appended to them.
sub git_get_short_hash {
	my @args = @_;
	return git_get_hash(@args, '--short=7');
}
2461
# Resolve $hash in the given project using
# "git rev-parse --verify -q @options $hash".
#
# Parameters:
#   $project - project path, relative to $projectroot
#   $hash    - revision to resolve
#   @options - extra options for rev-parse
# Returns the first line of output without its line terminator, or undef
# when the command could not be started or printed nothing.
# $git_dir is pointed at the project for the duration of the call; the
# previous value is put back afterwards only if it was defined.
sub git_get_hash {
	my ($project, $hash, @options) = @_;

	my $saved_git_dir = $git_dir;
	$git_dir = "$projectroot/$project";

	# git_cmd() must be called after $git_dir is set, as it reads it
	my @rev_parse = (git_cmd(), 'rev-parse',
	                 '--verify', '-q', @options, $hash);

	my $resolved;
	if (open(my $fd, '-|', @rev_parse)) {
		$resolved = <$fd>;
		chomp $resolved if defined $resolved;
		close $fd;
	}

	$git_dir = $saved_git_dir if defined $saved_git_dir;
	return $resolved;
}
2478
# Get the type of the given object, as printed by "git cat-file -t".
# Returns nothing when the command cannot be started or when closing
# the pipe reports failure.
sub git_get_type {
	my ($hash) = @_;

	my $fd;
	unless (open($fd, "-|", git_cmd(), "cat-file", '-t', $hash)) {
		return;
	}
	my $type = <$fd>;
	return unless close $fd;

	chomp $type;
	return $type;
}
2489
# Repository configuration cache, filled by git_get_project_config():
# $config_file names the config file the values in %config were read for
# (empty string: nothing read yet).
our $config_file = q{};
our %config;
2493
# Store $value under $key in the hash referenced by $hash, keeping
# earlier values: multiple values for a single key are stored as an
# anonymous array reference, while a single value is stored directly in
# the hash, not as [ <value> ].
sub hash_set_multi {
	my ($hash, $key, $value) = @_;

	if (exists $hash->{$key}) {
		if (ref $hash->{$key}) {
			# third and later values: extend the list
			push @{$hash->{$key}}, $value;
		} else {
			# second value: promote the scalar to a list
			$hash->{$key} = [ $hash->{$key}, $value ];
		}
	} else {
		$hash->{$key} = $value;
	}
}
2507
# Return hash of git project configuration, as printed by
# "git config -z -l" for the current $git_dir.
#
# Parameter:
#   $section_regexp - optional regexp source; when given, only keys that
#                     start with a matching section name followed by a dot
#                     are kept, e.g. 'gitweb'
# Returns the configuration as a hash (key => value); keys that occur
# more than once hold an array reference (see hash_set_multi()).
# Returns nothing when the git command cannot be started.
sub git_parse_project_config {
	my $section_regexp = shift;
	my %config;

	# Compile the section filter once per call.  The /o modifier must not
	# be used here: it would freeze the pattern at the value seen by the
	# very first call, so later calls asking for another section would
	# silently filter with the stale one.
	my $section_re = defined $section_regexp
		? qr/^(?:$section_regexp)\./
		: undef;

	# 'git config -z' terminates each entry with NUL
	local $/ = "\0";

	open my $fh, "-|", git_cmd(), "config", '-z', '-l'
		or return;

	while (my $keyval = <$fh>) {
		chomp $keyval;
		# key and value are separated by the first newline
		my ($key, $value) = split(/\n/, $keyval, 2);

		hash_set_multi(\%config, $key, $value)
			if (!defined $section_re || $key =~ $section_re);
	}
	close $fh;

	return %config;
}
2530
# Convert config value to a boolean (true or false Perl value).
# No value (undef), a non-zero number, 'true' and 'yes' (in any case)
# are true; everything else is treated as false, never as an error.
# Surrounding whitespace is ignored.
sub config_to_bool {
	my ($val) = @_;

	# section.key
	return 1 unless defined $val;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	# section.key = 1
	return $val if ($val =~ /^\d+$/ && $val);
	# section.key = true
	return $val =~ /^(?:true|yes)$/i;
}
2546
# Convert config value to a simple decimal number.
# An optional value suffix of 'k', 'm', or 'g' (in either case) causes
# the value to be multiplied by 1024, 1048576, or 1073741824.
# A value without such a suffix is returned as is, with surrounding
# whitespace removed.
sub config_to_int {
	my ($val) = @_;

	# strip leading and trailing whitespace
	$val =~ s/^\s+//;
	$val =~ s/\s+$//;

	my %multiplier_for = (
		'k' =>       1024,
		'm' =>    1048576,
		'g' => 1073741824,
	);

	if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
		return $num * $multiplier_for{lc($unit)};
	}
	return $val;
}
2566
# Convert config value to an array reference, if needed:
# a reference is returned unchanged, a defined plain value is wrapped
# into a one-element array, and undef gives an empty array.
sub config_to_multi {
	my ($val) = @_;

	return $val     if ref($val);
	return [ $val ] if defined($val);
	return [];
}
2573
# Look up the gitweb.<key> configuration variable of the current project.
#
# Parameters:
#   $key  - variable name, with or without the leading "gitweb."
#   $type - optional 'bool' or 'int' (a leading "--" is accepted);
#           any other type is ignored
# Returns nothing when $git_dir is not set, when the key is empty or
# contains non-word characters, or when the variable is not set.
# Otherwise returns the value: 'true'/'false' for type 'bool', the result
# of config_to_int() for type 'int', and the stored value as is when no
# type is given.
# The parsed configuration is cached in %config and re-read whenever
# $git_dir no longer matches $config_file.
sub git_get_project_config {
	my ($key, $type) = @_;

	return unless defined $git_dir;

	# key sanity check
	return unless ($key);
	# only subsection, if exists, is case sensitive,
	# and not lowercased by 'git config -z -l'
	if ($key =~ /^([^.]*)\.(.*)\.([^.]*)$/) {
		$key = join(".", lc($1), $2, lc($3));
	} else {
		$key = lc($key);
	}
	$key =~ s/^gitweb\.//;
	return if ($key =~ m/\W/);

	# type sanity check
	if (defined $type) {
		$type =~ s/^--//;
		undef $type
			if ($type ne 'bool' && $type ne 'int');
	}

	# get config, unless what is cached belongs to this repository
	my $wanted_file = "$git_dir/config";
	unless (defined $config_file && $config_file eq $wanted_file) {
		%config = git_parse_project_config('gitweb');
		$config_file = $wanted_file;
	}

	# check if config variable (key) exists
	my $full_key = "gitweb.$key";
	return unless exists $config{$full_key};
	my $raw = $config{$full_key};

	# ensure given type
	return $raw unless defined $type;
	if ($type eq 'bool') {
		# backward compatibility: 'git config --bool' returns true/false
		return config_to_bool($raw) ? 'true' : 'false';
	}
	# the only type left after the sanity check is 'int'
	return config_to_int($raw);
}
2619
# Get hash of given path at given ref, using "git ls-tree".
#
# Parameters:
#   $base - tree-ish to look in
#   $path - path of the entry; trailing slashes are ignored
#   $type - optional object type the entry must have (compared with the
#           type column printed by ls-tree)
# Returns the object id of the entry, or undef when no path is given,
# when there is no such entry, when ls-tree output cannot be parsed, when
# the pipe reports failure on close, or when the type does not match.
# Calls die_error() if the git command cannot be started.
sub git_get_hash_by_path {
	my ($base, $path, $type) = @_;

	# test for presence, not truth: "0" is a perfectly valid file name
	return undef unless (defined $path && length $path);

	$path =~ s,/+$,,;

	open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
		or die_error(500, "Open git-ls-tree failed");
	my $line = <$fd>;
	close $fd or return undef;

	if (!defined $line) {
		# there is no tree or hash given by $path at $base
		return undef;
	}

	#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
	# use the captures only if the match succeeded; after a failed match
	# the capture variables would still hold values from an earlier one
	my ($entry_type, $entry_hash) =
		($line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/);
	if (!defined $entry_hash) {
		# unrecognized ls-tree output
		return undef;
	}

	if (defined $type && $type ne $entry_type) {
		# type doesn't match
		return undef;
	}
	return $entry_hash;
}
2646
# Get path of entry with given hash at given tree-ish (ref);
# used to get 'from' filename for combined diff (merge commit) for renames.
#
# Parameters:
#   $base - tree-ish whose entries are listed recursively
#   $hash - object id to look for
# Returns the path of the first listed entry with that object id;
# returns nothing when either argument is missing, and undef when the git
# command cannot be started or no entry matches.
sub git_get_path_by_hash {
	my $base = shift || return;
	my $hash = shift || return;

	# 'git ls-tree -z' terminates each entry with NUL
	local $/ = "\0";

	open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
		or return undef;
	while (my $line = <$fd>) {
		chomp $line;

		#'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423	gitweb'
		#'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f	gitweb/README'
		# The pattern is anchored to the mode and type columns so that it
		# cannot match inside a path, $hash is quoted so that it is always
		# compared literally, and /s lets the path contain newlines
		# (entries are NUL-terminated, so a newline is ordinary data).
		if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)\z/s) {
			my $path = $1;
			close $fd;
			return $path;
		}
	}
	close $fd;
	return undef;
}
2670
2671 ## ......................................................................
2672 ## git utility functions, directly accessing git repository
2673
# Get the value of a config variable either from the file named as the
# variable itself in the repository ($GIT_DIR/$name file), or, when that
# file cannot be opened, from the gitweb.$name configuration variable in
# the repository config file.
#
# Parameters:
#   $path - project path, relative to $projectroot
#   $name - name of the file / configuration variable
# Returns the first line of the file without its line terminator (undef
# for an empty file), or whatever git_get_project_config($name) returns.
# Sets $git_dir to the repository of the project.
sub git_get_file_or_project_config {
	my ($path, $name) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	if (!open($fd, '<', "$git_dir/$name")) {
		return git_get_project_config($name);
	}
	my $first_line = <$fd>;
	close $fd;

	chomp $first_line if defined $first_line;
	return $first_line;
}
2690
# Get the description of the project at $path: the 'description' value
# as found by git_get_file_or_project_config().
sub git_get_project_description {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'description');
}
2695
# Get the category of the project at $path: the 'category' value
# as found by git_get_file_or_project_config().
sub git_get_project_category {
	my ($path) = @_;
	return git_get_file_or_project_config($path, 'category');
}
2700
2701
# Read content tags ('ctags') of a project.
#
# supported formats:
# * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
#   - if its contents is a number, use it as tag weight,
#   - otherwise add a tag with weight 1
# * $GIT_DIR/ctags file, each line is a tag (with weight 1)
#   the same value multiple times increases tag weight
# * `gitweb.ctag' multi-valued repo config variable
#
# The first of these sources that can be opened is used.
# Parameter: project path, relative to $projectroot.
# Returns a hash reference mapping tag name to weight.
# Sets $git_dir to the repository of the project.
sub git_get_project_ctags {
	my $project = shift;
	my $ctags = {};

	$git_dir = "$projectroot/$project";
	if (opendir my $dh, "$git_dir/ctags") {
		my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
		foreach my $tagfile (@files) {
			open my $ct, '<', $tagfile
				or next;
			my $val = <$ct>;
			close $ct;
			# an empty tag file yields no line at all
			chomp $val if defined $val;

			# tag name is the file name without its directory
			(my $ctag = $tagfile) =~ s#.*/##;
			if (defined $val && $val =~ /^\d+$/) {
				$ctags->{$ctag} = $val;
			} else {
				# empty or non-numeric contents: default weight
				$ctags->{$ctag} = 1;
			}
		}
		closedir $dh;

	} elsif (open my $fh, '<', "$git_dir/ctags") {
		while (my $line = <$fh>) {
			chomp $line;
			$ctags->{$line}++ if $line;
		}
		close $fh;

	} else {
		my $taglist = config_to_multi(git_get_project_config('ctag'));
		foreach my $tag (@$taglist) {
			$ctags->{$tag}++;
		}
	}

	return $ctags;
}
2748
# Return hash reference, where keys are content tags ('ctags'),
# and values are sum of weights of given tag in every project.
# Parameter: reference to a list of project hashes; the 'ctags' field of
# each is read.
sub git_gather_all_ctags {
	my ($projects) = @_;
	my %total_weight;

	foreach my $pr (@$projects) {
		$total_weight{$_} += $pr->{'ctags'}->{$_}
			foreach keys %{$pr->{'ctags'}};
	}

	return \%total_weight;
}
2763
# Prepare a tag cloud from content tags.
#
# Parameter: hash reference mapping tag name to weight.
# Tags differing only in case are merged; their weights are summed and
# the spelling with the largest single weight is the one displayed.
# The tag equal to $input_params{'ctag'} is wrapped in a "match" span.
# Returns an HTML::TagCloud object when that module can be loaded,
# otherwise a hash reference mapping lowercased tag to
# { count => <summed weight>, ctag => <HTML link> }.
sub git_populate_project_tagcloud {
	my $ctags = shift;

	# First, merge different-cased tags; tags vote on casing
	my %merged;
	foreach my $name (keys %$ctags) {
		my $weight = $ctags->{$name};
		my $entry  = ($merged{lc $name} ||= {});
		$entry->{count} += $weight;
		if (!$entry->{topcount} || $entry->{topcount} < $weight) {
			$entry->{topcount} = $weight;
			$entry->{topname}  = $name;
		}
	}

	my $matched = $input_params{'ctag'};
	# wrap the title of the currently selected tag
	my $mark_match = sub {
		my ($ctag, $title) = @_;
		return $title unless (defined $matched && $matched eq $ctag);
		return qq(<span class="match">$title</span>);
	};

	if (eval { require HTML::TagCloud; 1; }) {
		my $cloud = HTML::TagCloud->new;
		foreach my $ctag (sort keys %merged) {
			# Pad the title with spaces so that the cloud looks
			# less crammed.
			my $title = esc_html($merged{$ctag}->{topname});
			$title =~ s/ /&nbsp;/g;
			$title =~ s/^/&nbsp;/g;
			$title =~ s/$/&nbsp;/g;
			$title = $mark_match->($ctag, $title);
			$cloud->add($title, href(project=>undef, ctag=>$ctag),
			            $merged{$ctag}->{count});
		}
		return $cloud;
	}

	# HTML::TagCloud is not available: plain data for the fallback display
	my $cloud = {};
	foreach my $ctag (keys %merged) {
		my $title = esc_html($merged{$ctag}->{topname}, -nbsp=>1);
		$title = $mark_match->($ctag, $title);
		my $link = $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
		$cloud->{$ctag}{count} = $merged{$ctag}->{count};
		$cloud->{$ctag}{ctag}  = $link;
	}
	return $cloud;
}
2809
# Render a tag cloud prepared by git_populate_project_tagcloud().
#
# Parameters:
#   $cloud - HTML::TagCloud object, or the fallback hash reference mapping
#            tag to { count => ..., ctag => <HTML link> }
#   $count - maximum number of tags to show; all tags when undefined
# Returns HTML.  For an HTML::TagCloud object this is whatever its
# html_and_css($count) returns.  For the fallback structure it is a
# "htmltagcloud" div (centered when no project is selected) listing the
# links of the $count tags with the highest counts, most used first.
sub git_show_project_tagcloud {
	my ($cloud, $count) = @_;
	# global variable (current project, if any)
	our $project;

	if (ref $cloud eq 'HTML::TagCloud') {
		return $cloud->html_and_css($count);
	}

	# The limit has to keep the most used tags, so sort by descending
	# count; ties are ordered by name to keep the output stable.
	my @tags = sort {
		$cloud->{$b}->{'count'} <=> $cloud->{$a}->{'count'}
			or $a cmp $b
	} keys %$cloud;
	$count = scalar @tags unless defined $count;

	return
		'<div id="htmltagcloud"'.($project ? '' : ' align="center"').'>' .
		join (', ', map {
			$cloud->{$_}->{'ctag'}
		} splice(@tags, 0, $count)) .
		'</div>';
}
2824
# Get the list of URLs of the project at $path (relative to $projectroot).
#
# The URLs are the lines of the $GIT_DIR/cloneurl file; when that file
# cannot be opened, the values of the 'url' project configuration
# variable are used instead.
# Returns the list in list context, a reference to it in scalar context.
# Sets $git_dir to the repository of the project.
sub git_get_project_url_list {
	my ($path) = @_;

	$git_dir = "$projectroot/$path";

	my $fd;
	unless (open($fd, '<', "$git_dir/cloneurl")) {
		# no cloneurl file: fall back to repository configuration
		my $configured = config_to_multi(git_get_project_config('url'));
		return wantarray ? @$configured : $configured;
	}

	my @git_project_url_list;
	while (my $url = <$fd>) {
		chomp $url;
		push @git_project_url_list, $url;
	}
	close $fd;

	return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2838
# Get the list of projects, from $projects_list.
#
# Parameter: optional $filter, a path prefix (a trailing ".git" is
# removed) limiting the result to projects below it.
# When $projects_list is a directory it is searched for repositories
# accepted by check_export_ok(); when it is a file, the projects (and
# their owners) are read from it.
# Returns a list of hash references with the key 'path' and, when read
# from a file, 'owner'.  Returns nothing if the file cannot be opened.
sub git_get_projects_list {
	my ($filter) = @_;
	$filter ||= '';
	my @list;

	$filter =~ s/\.git$//;

	if (-d $projects_list) {
		# search in directory
		my $dir = $projects_list;
		# remove the trailing "/"
		$dir =~ s!/+$!!;
		# length and depth of the prefix are taken before the filter
		# is appended, so that paths stay relative to $projects_list
		my $pfxlen = length("$dir");
		my $pfxdepth = ($dir =~ tr!/!!);
		# when filtering, search only given subdirectory
		if ($filter) {
			$dir .= "/$filter";
			$dir =~ s!/+$!!;
		}

		my $collect_repository = sub {
			# global variables
			our $project_maxdepth;
			our $projectroot;
			# skip project-list toplevel, if we get it.
			return if (m!^[/.]$!);
			# only directories can be git repositories
			return unless (-d $_);
			# don't traverse too deep (Find is super slow on os x)
			# $project_maxdepth excludes depth of $projectroot
			my $depth = ($File::Find::name =~ tr!/!!) - $pfxdepth;
			if ($depth > $project_maxdepth) {
				$File::Find::prune = 1;
				return;
			}

			my $path = substr($File::Find::name, $pfxlen + 1);
			# we check related file in $projectroot
			if (check_export_ok("$projectroot/$path")) {
				push @list, { path => $path };
				# do not look for repositories inside a repository
				$File::Find::prune = 1;
			}
		};

		File::Find::find({
			follow_fast => 1, # follow symbolic links
			follow_skip => 2, # ignore duplicates
			dangling_symlinks => 0, # ignore dangling symlinks, silently
			wanted => $collect_repository,
		}, "$dir");

	} elsif (-f $projects_list) {
		# read from file(url-encoded):
		# 'git%2Fgit.git Linus+Torvalds'
		# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
		# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
		open my $fd, '<', $projects_list or return;
		while (my $line = <$fd>) {
			chomp $line;
			my ($path, $owner) = split ' ', $line;
			$path = unescape($path);
			$owner = unescape($owner);
			next if (!defined $path);
			# if $filter is provided, check if $path begins with $filter
			next if ($filter && $path !~ m!^\Q$filter\E/!);
			next unless check_export_ok("$projectroot/$path");

			push @list, {
				path => $path,
				owner => to_utf8($owner),
			};
		}
		close $fd;
	}
	return @list;
}
2917
# Remove forks from a list of projects.
#
# Parameter: reference to a list of project hashes (the 'path' field is
# read).
# A project is a fork when its path lies below the directory named after
# another project with the trailing '.git' removed (forks of 'repo.git'
# are in the 'repo/' directory), provided that directory exists under
# $projectroot.
# Returns the list of projects that are not forks.  As a side effect it
# sets the 'forks' field of every project that might have forks to the
# list of its forks (possibly empty).
#
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
sub filter_forks_from_projects_list {
	my ($projects) = @_;

	my %trie; # prefix tree of directories (path components)
	# generate trie out of those directories that might contain forks
	foreach my $pr (@$projects) {
		my $fork_dir = $pr->{'path'};
		$fork_dir =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
		next if ($fork_dir =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
		next unless ($fork_dir);      # skip '.git' repository: tests, git-instaweb
		next unless (-d "$projectroot/$fork_dir"); # containing directory exists
		$pr->{'forks'} = [];          # there can be 0 or more forks of project

		# add to trie: follow existing nodes, create the missing ones
		my $node = \%trie;
		foreach my $component (split('/', $fork_dir)) {
			$node->{$component} = {} unless exists $node->{$component};
			$node = $node->{$component};
		}
		# create end marker, store $pr as a data
		$node->{''} = $pr unless exists $node->{''};
	}

	# filter out forks, by finding shortest prefix match for paths
	my @filtered;
	foreach my $pr (@$projects) {
		# trie lookup
		my $node = \%trie;
		my $forked_from;
		foreach my $component (split('/', $pr->{'path'})) {
			if (exists $node->{''}) {
				# found [shortest] prefix, is a fork
				$forked_from = $node->{''};
				last;
			}
			# not in trie, cannot have prefix, not a fork
			last unless exists $node->{$component};
			# If the dir is there, we just walk one step down the trie.
			$node = $node->{$component};
		}

		if ($forked_from) {
			# a fork is recorded with its parent and left out of the result
			push @{$forked_from->{'forks'}}, $pr;
		} else {
			# no match, or we ran out of path components
			push @filtered, $pr;
		}
	}

	return @filtered;
}
2977
# Select projects by content tag and/or by search pattern.
#
# Parameters:
#   $projlist - reference to a list of project hashes
#   %opts     - 'tagfilter':     keep projects having this content tag
#                                (compared case-insensitively)
#               'search_regexp': keep projects whose 'path' or
#                                'descr_long' matches this pattern
# When both are given, a project has to satisfy both; when neither is
# given, all projects are returned.
# Returns the list of selected project hashes.
#
# note: fill_project_list_info must be run first,
# for 'descr_long' and 'ctags' to be filled
sub search_projects_list {
	my ($projlist, %opts) = @_;
	my $tagfilter = $opts{'tagfilter'};
	my $search_re = $opts{'search_regexp'};

	return @$projlist
		unless ($tagfilter || $search_re);

	# true if the project carries the requested tag
	my $has_tag = sub {
		my ($pr) = @_;
		return 0 unless ref($pr->{'ctags'}) eq 'HASH';
		foreach my $tag (keys %{$pr->{'ctags'}}) {
			return 1 if (lc($tag) eq lc($tagfilter));
		}
		return 0;
	};
	# true if path or long description matches the search pattern
	my $matches_search = sub {
		my ($pr) = @_;
		return $pr->{'path'} =~ /$search_re/ ||
		       $pr->{'descr_long'} =~ /$search_re/;
	};

	my @projects = grep {
		(!$tagfilter || $has_tag->($_)) &&
		(!$search_re || $matches_search->($_))
	} @$projlist;

	return @projects;
}
3009
# Cache of project owners read from the $projects_list file:
# hash reference mapping project path to owner, undef until first filled.
our $gitweb_project_owner = undef;

# Fill $gitweb_project_owner from the $projects_list file, if that is a
# plain file.  Does nothing when the cache is already filled; the cache
# stays empty when $projects_list is not a file or cannot be opened.
sub git_get_project_list_from_file {

	return if (defined $gitweb_project_owner);

	$gitweb_project_owner = {};
	# read from file (url-encoded):
	# 'git%2Fgit.git Linus+Torvalds'
	# 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
	# 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
	if (-f $projects_list) {
		# the file can exist and still be unreadable
		open(my $fd, '<', $projects_list)
			or return;
		while (my $line = <$fd>) {
			chomp $line;
			my ($pr, $ow) = split ' ', $line;
			# a blank line names no project; git_get_projects_list()
			# skips such lines as well
			next unless defined $pr;
			$pr = unescape($pr);
			$ow = unescape($ow);
			$gitweb_project_owner->{$pr} = to_utf8($ow);
		}
		close $fd;
	}
}
3032
# Return the owner of the given project, or undef for a false project name.
# Sources are tried in this order until one yields a defined value:
#   1. the cache filled by git_get_project_list_from_file()
#   2. the 'owner' key of the project configuration
#   3. get_file_owner() on the repository directory
# Side effect: sets the global $git_dir to "$projectroot/$project".
sub git_get_project_owner {
        my $project = shift;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # make sure the projects list cache has been loaded
        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if exists $gitweb_project_owner->{$project};
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
3056
# Return (age in seconds, age_string of that age) for the first line printed
# by 'git for-each-ref' over refs/heads sorted by descending committer date.
# Returns (undef, undef) when that line is missing or carries no timestamp,
# and an empty list when the command cannot be started or closed cleanly.
# Side effect: sets the global $git_dir to "$projectroot/$path".
sub git_get_last_activity {
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        open(my $fd, "-|", git_cmd(), 'for-each-ref',
             '--format=%(committer)',
             '--sort=-committerdate',
             '--count=1',
             'refs/heads') or return;
        my $most_recent = <$fd>;
        close $fd or return;

        # the line has to end in "<epoch> <timezone>"
        return (undef, undef)
                unless defined $most_recent &&
                       $most_recent =~ / (\d+) [-+][01]\d\d\d$/;

        my $age = time - $1;
        return ($age, age_string($age));
}
3077
# Return the remotes listed by 'git remote -v' as a hash (a hash reference in
# scalar context) keyed by remote name.  Each value is a hash holding an
# undefined 'heads' entry plus one entry per kind printed in parentheses by
# git (mapped to the corresponding URL).  When $wanted is given, only
# that remote is reported.  Returns nothing if the command cannot be run.
#
# Implementation note: when a single remote is wanted, we cannot use 'git
# remote show -n' because that command always works (assuming it's a remote URL
# if it's not defined), and we cannot use 'git remote show' because that would
# try to make a network roundtrip. So the only way to find if that particular
# remote is defined is to walk the list provided by 'git remote -v' and stop if
# and when we find what we want.
sub git_get_remotes_list {
        my $wanted = shift;
        my %remotes = ();

        # 'open my $fd' makes $fd a true value even when open() fails,
        # so the result of open() itself has to be checked
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # "<name>\t<url> (<kind>)": cut everything after the name;
                # lines of any other shape are skipped so that $1 and $2
                # are never taken from an earlier match
                next unless $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
                my ($url, $key) = ($1, $2);
                next if $wanted and not $remote eq $wanted;

                # 'heads' exists but stays undefined until it is filled in
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3102
# Takes a hash of remotes as first parameter and fills it by adding the
# available remote heads for each of the indicated remotes.
#
# For every remote, 'heads' is set to a reference to the array of head
# entries (as returned by git_get_heads_list) whose name starts with
# "<remote>/"; that prefix is removed from the entry's 'name' in place.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q...\E: the remote name is literal text, not a pattern
                # (think of names containing '.' or '+')
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3115
# Return a reference to a hash mapping object id to a reference to the array
# of ref names (without the leading "refs/") printed for it by
# 'git show-ref --dereference'.  With $type given, only "refs/$type" is asked
# for.  Returns nothing if the command cannot be run or closed cleanly.
sub git_get_references {
        my $type = shift || "";
        my %refs;
        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();
        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                # the list for this object id springs into existence on first use
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
3138
# Return the tag-based name that 'git name-rev --tags' prints for $hash
# (the part after "tags/"), or undef when $hash is false, when the command
# prints nothing, or when its output does not have that form.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # the command printed nothing at all
        return undef unless defined $name_rev;

        # \Q...\E: $hash is compared literally, so that revisions spelled
        # with characters such as '^' or '.' are matched as well
        if ($name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
3154
3155 ## ----------------------------------------------------------------------
3156 ## parse to hash functions
3157
# Break an epoch timestamp down into a hash of date parts and formatted
# dates.
#
# Parameters:
#   $epoch - seconds since the epoch
#   $tz    - timezone as "+hhmm" or "-hhmm"; defaults to "-0000"
# Returns a hash with:
#   hour, minute, mday, day, month, rfc2822, mday-time, iso-8601
#       - computed with gmtime($epoch)
#   hour_local, minute_local, iso-tz
#       - computed after shifting $epoch by the $tz offset
#   tz_local
#       - $tz as given
# A $tz that does not have the "+hhmm" / "-hhmm" form applies no offset.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        my ($tz_sign, $tz_hour, $tz_min) =
                ($tz =~ m/^([-+])(\d\d)(\d\d)$/);
        # a malformed timezone leaves all three undefined; use a zero offset
        # explicitly rather than computing with undefined values
        ($tz_sign, $tz_hour, $tz_min) = ('+', 0, 0)
                unless defined $tz_sign;
        $tz_sign = ($tz_sign eq '-' ? -1 : +1);
        my $local = $epoch + $tz_sign*((($tz_hour*60) + $tz_min)*60);
        ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3191
# Parse the output of 'git cat-file tag' for $tag_id into a hash with the
# keys id, object, type, name, author, author_epoch, author_tz, author_name,
# author_email (only when the tagger has the "name <email>" form) and comment
# (reference to the array of remaining lines).
# Returns nothing if the command cannot be run or closed cleanly, or if no
# "tag" header was found.
sub parse_tag {
        my $tag_id = shift;
        my %tag;
        my @comment;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
        $tag{'id'} = $tag_id;
 HEADER:
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                        next HEADER;
                }
                if ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                        next HEADER;
                }
                if (my ($who, $when, $zone) = $line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{qw(author author_epoch author_tz)} = ($who, $when, $zone);
                        if ($who =~ m/^([^<]+) <([^>]*)>/) {
                                $tag{'author_name'}  = $1;
                                $tag{'author_email'} = $2;
                        } else {
                                $tag{'author_name'} = $who;
                        }
                        next HEADER;
                }
                if ($line =~ m/--BEGIN/) {
                        # this line already belongs to the comment
                        push @comment, $line;
                        last HEADER;
                }
                # an empty line ends the headers
                last HEADER if $line eq "";
        }
        # everything that is left is the comment
        push @comment, <$fd>;
        $tag{'comment'} = \@comment;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
3232
# Parse one record of 'git rev-list --header' output into a commit hash.
#
# Parameters:
#   $commit_text - text of the record; its last line is discarded
#   $withparents - when defined, parents are taken only from the first line
#                  of the record (the ids following the commit id);
#                  otherwise "parent" header lines are collected as well
# Returns a hash with the keys id, tree, parents, parent, author*,
# committer*, title, title_short, comment, age, age_string, age_string_date
# and age_string_age; returns nothing when the record is empty, does not
# start with an object id, or has no "tree" header.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # header lines; the loop stops at the first false (e.g. empty) line,
        # which is consumed
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        # the title is the first non-empty line of the message
        foreach my $line (@commit_lines) {
                # work on a copy: the loop variable aliases the element of
                # @commit_lines, and the shortening below must not leak into
                # the comment stored further down
                (my $title = $line) =~ s/^    //;
                next if $title eq "";

                $co{'title'} = chop_str($title, 80, 5);
                # remove leading stuff of merges to make the interesting part visible
                if (length($title) > 50) {
                        $title =~ s/^Automatic //;
                        $title =~ s/^merge (of|with) /Merge ... /i;
                        if (length($title) > 50) {
                                $title =~ s/(http|rsync):\/\///;
                        }
                        if (length($title) > 50) {
                                $title =~ s/(master|www|rsync)\.//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/kernel.org:?//;
                        }
                        if (length($title) > 50) {
                                $title =~ s/\/pub\/scm//;
                        }
                }
                $co{'title_short'} = chop_str($title, 50, 5);
                last;
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # commits older than two weeks show the date first, others the age
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3330
# Return the commit hash produced by parse_commit_text() for the single
# commit $commit_id, read from 'git rev-list --parents --header
# --max-count=1'.  The hash is empty when git prints nothing or the record
# cannot be parsed.  Calls die_error() if the command cannot be started.
sub parse_commit {
        my ($commit_id) = @_;
        my %co;

        # records are NUL-terminated
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--",
                or die_error(500, "Open git-rev-list failed");
        # read exactly one record in scalar context: in list context an empty
        # output would vanish from the argument list below and the trailing 1
        # would be taken for the commit text
        my $commit_text = <$fd>;
        close $fd;

        %co = parse_commit_text($commit_text, 1)
                if defined $commit_text;

        return %co;
}
3349
# Return the commits listed by 'git rev-list --header' starting at
# $commit_id, each parsed by parse_commit_text() into a hash reference.
#
# Parameters:
#   $commit_id - revision to start from
#   $maxcount  - value for --max-count (1 when false)
#   $skip      - value for --skip (0 when false)
#   $filename  - when true, passed as path limiter after "--"
#   @args      - extra arguments placed right after --header
# Returns the list of hash references (an array reference in scalar context).
# Calls die_error() if the command cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount ||= 1;
        $skip ||= 0;

        # records are NUL-terminated
        local $/ = "\0";

        my @path_limit = $filename ? ($filename) : ();
        open my $fd, "-|", git_cmd(), "rev-list",
                "--header",
                @args,
                "--max-count=$maxcount",
                "--skip=$skip",
                @extra_options,
                $commit_id,
                "--",
                @path_limit
                or die_error(500, "Open git-rev-list failed");

        my @cos;
        while (my $record = <$fd>) {
                # a record that does not parse contributes an empty hash
                push @cos, +{ parse_commit_text($record) };
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3377
# parse line of git-diff-tree "raw" output
#
# Three shapes of line are recognized:
#   - ordinary diff line:  from_mode, to_mode, from_id, to_id, status,
#     similarity, from_file, to_file (plus file unless renamed or copied)
#   - combined diff line:  nparents, from_mode and from_id (array
#     references), to_mode, to_id, status (array reference), to_file
#   - bare object id:      commit
# Returns the resulting hash (a hash reference in scalar context), which is
# empty for any other line.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{qw(from_mode to_mode from_id to_id status similarity)} =
                        ($1, $2, $3, $4, $5, $6);
                my $names = $7;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        # two tab-separated names: source and destination
                        ($res{'from_file'}, $res{'to_file'}) =
                                map { unquote($_) } split("\t", $names);
                } else {
                        $res{'from_file'} = $res{'to_file'} = $res{'file'} = unquote($names);
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
                my ($colons, $modes, $ids, $statuses, $name) = ($1, $2, $3, $4, $5);
                # the last mode and the last id describe the result
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);
                $res{'nparents'}  = length($colons);
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $statuses) ];
                $res{'to_file'}   = unquote($name);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3416
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # pre-parsed (or generated by hand) info is handed back untouched
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3429
# parse line of git-ls-tree output
#
# Parameters:
#   $line - one entry of git-ls-tree output
#   %opts - '-l' => true if the entry carries a size column
#           '-z' => true if the name is to be taken verbatim
#                   (otherwise it is passed through unquote)
# Returns a hash (a hash reference in scalar context) with the keys mode,
# type, hash, name and, with '-l', size.
sub parse_ls_tree_line {
        my ($line, %opts) = @_;
        my %res;
        my $name;

        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s;

                @res{qw(mode type hash size)} = ($1, $2, $3, $4);
                $name = $5;
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s;

                @res{qw(mode type hash)} = ($1, $2, $3);
                $name = $4;
        }
        $res{'name'} = $opts{'-z'} ? $name : unquote($name);

        return wantarray ? %res : \%res;
}
3465
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# Parameters:
#   $diffinfo - parsed diff-tree line (hash reference)
#   $from     - hash reference, filled with 'file' and 'href' of the source
#               side (array references, one element per parent, for a
#               combined diff)
#   $to       - hash reference, filled with 'file' and 'href' of the result
#   @parents  - parent ids, used for a combined diff
# An 'href' is left out (or undefined, per parent) when the file was added
# on that side, respectively deleted in the result.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the name in the result
                        my $from_file = $diffinfo->{'from_file'}[$i];
                        $from_file = $diffinfo->{'to_file'}
                                unless defined $from_file;
                        $from->{'file'}[$i] = $from_file;

                        if ($diffinfo->{'status'}[$i] eq "A") { # new (added) file
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        } else {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (is_deleted($diffinfo)) { # file does not exist in result
                delete $to->{'href'};
        } else {
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        }
}
3511
3512 ## ......................................................................
3513 ## parse to array of hashes functions
3514
# Return the refs below "refs/<class>" for each of @classes ('heads' when
# none is given), as printed by 'git for-each-ref' sorted by descending
# committer date.
#
# Parameters:
#   $limit   - when true, at most $limit + 1 refs are asked for
#   @classes - ref namespaces below "refs/"
# Returns a list (an array reference in scalar context) of hash references
# with the keys fullname, name, id, title, epoch and age; returns nothing if
# the command cannot be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @count = $limit ? ('--count='.($limit+1)) : ();
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # "<id> <refname> <subject>" NUL "<committer> <epoch> <tz>"
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($hash, $fullname, $title) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $name = $fullname) =~ s!^refs/(?:head|remote)s/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'name'     => $name,
                        'id'       => $hash,
                        'title'    => $title || '(no commit message)',
                        'epoch'    => $epoch,
                );
                $ref_item{'age'} = "unknown";
                $ref_item{'age'} = age_string(time - $epoch)
                        if $epoch;

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3553
# Return the refs below refs/tags as printed by 'git for-each-ref' sorted by
# descending creator date.
#
# Parameters:
#   $limit - when true, at most $limit + 1 refs are asked for
# Returns a list (an array reference in scalar context) of hash references
# with the keys fullname, type, id, name, reftype and refid, plus subject for
# objects of type "tag" and epoch and age for types "tag" and "commit";
# returns nothing if the command cannot be started.
sub git_get_tags_list {
        my $limit = shift;
        my @count = $limit ? ('--count='.($limit+1)) : ();
        my $format = '%(objectname) %(objecttype) %(refname) '.
                     '%(*objectname) %(*objecttype) %(subject)%00%(creator)';
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count, '--sort=-creatordate',
                "--format=$format",
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $fullname, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                my ($creator, $epoch, $tz) =
                        ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $name = $fullname) =~ s!^refs/tags/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'type'     => $type,
                        'id'       => $id,
                        'name'     => $name,
                );
                if ($type eq "tag") {
                        # a tag object refers to another object
                        @ref_item{qw(subject reftype refid)} = ($title, $reftype, $refid);
                } else {
                        # anything else refers to itself
                        @ref_item{qw(reftype refid)} = ($type, $id);
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        $ref_item{'age'} = "unknown";
                        $ref_item{'age'} = age_string(time - $epoch)
                                if $epoch;
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3602
3603 ## ----------------------------------------------------------------------
3604 ## filesystem-related functions
3605
# Return the owner of $path: the GECOS field of the user owning it, cut at
# the first ',' or ';' and passed through to_utf8.
# Returns undef when $path cannot be stat'ed or the user has no GECOS field.
sub get_file_owner {
        my $path = shift;

        my $st_uid = (stat($path))[4];
        # stat() failed: without this check the undefined uid would be
        # looked up as uid 0 and that user reported as the owner
        return undef unless defined $st_uid;

        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3618
# Print the contents of $filename, every line passed through to_utf8.
# The file is expected to exist; if it cannot be opened nothing is printed.
sub insert_file {
        my $filename = shift;

        # do not read from (and close) a handle that was never opened
        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3627
3628 ## ......................................................................
3629 ## mimetype related functions
3630
# Look up the MIME type for the extension of $filename in the map file
# $mimemap, whose lines have the form "<mimetype> <ext> <ext> ..." ('#' in
# the first column starts a comment line).  When an extension is listed
# more than once, the last line wins.
# Returns undef when the map file is not readable, when $filename has no
# extension, or when the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        # without an extension there is nothing to look up; checking the
        # match also keeps $1 of an unrelated earlier match out of the lookup
        my ($wanted_ext) = $filename =~ /\.([^.]*)$/
                or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        while (<$mh>) {
                next if m/^#/; # skip comments
                my ($mimetype, @exts) = split(/\s+/);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        return $mimemap{$wanted_ext};
}
3650
# Guess the MIME type of $filename from its extension: $mimetypes_file is
# consulted first (when set), then /etc/mime.types.
# Returns undef when $filename contains no dot.
sub mimetype_guess {
        my $filename = shift;
        $filename =~ /\./ or return undef;

        my $mime;
        if ($mimetypes_file) {
                # a relative path is relative to the project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');
        return $mime;
}
3667
# Return the MIME type for a blob.
#
# Parameters:
#   $fd       - filehandle the blob can be read from
#   $filename - name of the blob, may be false
# The type guessed from $filename by mimetype_guess wins; without $fd,
# $default_blob_plain_mimetype is returned; otherwise the content is tested
# with -T and, for content that is not text, a few image extensions are
# recognized.
sub blob_mimetype {
        my ($fd, $filename) = @_;

        if ($filename) {
                my $mime = mimetype_guess($filename);
                return $mime if $mime;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;
        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3694
# Return the content type for a blob: $type if true, else the result of
# blob_mimetype($fd, $file_name).  For 'text/plain' the charset
# $default_text_plain_charset is appended when it is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name)
                unless $type;

        return $type
                unless $type eq 'text/plain' && defined $default_text_plain_charset;

        return $type . "; charset=$default_text_plain_charset";
}
3705
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Parameters:
#   $highlight - true if highlighting is wanted
#   $mimetype  - not used
#   $file_name - name of the file; a trailing '.in' is ignored
# The basename is looked up in %highlight_basename first, then its extension
# in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # capture through the match result: after a failed match $1 would
        # still hold whatever an earlier, unrelated match had left in it
        my ($ext) = $basename =~ /\.([^.]*)$/;
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3722
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# Parameters:
#   $fd        - filehandle of the blob; closed when highlighting is done
#   $highlight - true if highlighting is wanted
#   $syntax    - syntax name handed to the highlighter
# The blob named by the global $hash is piped from 'git cat-file blob'
# into $highlight_bin.  Calls die_error() if the pipeline cannot be opened.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight && defined $syntax);

        close $fd;
        my $blob_cmd = quote_command(git_cmd(), "cat-file", "blob", $hash);
        my $highlight_cmd = quote_command($highlight_bin).
                            " --replace-tabs=8 --fragment --syntax $syntax";
        open $fd, "$blob_cmd | $highlight_cmd |"
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3736
3737 ## ======================================================================
3738 ## functions printing HTML: header, footer, error page
3739
# Build the page title from the globals $site_name, $project, $action and
# $file_name: "<site> - <project>/<action> - <file>".  Each part is added
# only if it and all parts before it are defined; for the "tree" action the
# file part is made to end in "/".
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                $title .= "/"
                                        if $action eq "tree" && $file_name !~ m|/$|;
                        }
                }
        }

        return $title;
}
3757
# Return the content type to send an HTML page with:
# 'application/xhtml+xml' or 'text/html'.
sub get_content_type_html {
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');
        my $wants_xhtml =
                defined $accept &&
                $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/ &&
                $cgi->Accept('application/xhtml+xml') != 0;

        return $wants_xhtml ? 'application/xhtml+xml' : 'text/html';
}
3771
# Print the <link rel="alternate"> elements for the page header.
# With a project selected these are, for each of RSS and Atom, one link to
# the feed and one link to the same feed without merges; the link parameters
# come from get_feed_info().  Without a project, links to the projects index
# and to the OPML list of feeds are printed.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my $title = esc_attr("$project - $href_params{'-title'} - $format feed");

                        # every link gets its own copy of the parameters, so
                        # that the '--no-merges' option of one link cannot
                        # leak into the plain link of the next format
                        my %plain     = (%href_params, 'action' => $type);
                        my %no_merges = (%plain, 'extra_options' => '--no-merges');

                        foreach my $link ([ $title,               \%plain     ],
                                          [ "$title (no merges)", \%no_merges ]) {
                                my ($link_title, $params) = @$link;
                                # the URL ends up inside an attribute value,
                                # so it is escaped like the title
                                my $url = href(%$params);
                                my $link_href = esc_attr($url);
                                print "<link ".
                                      "rel=\"alternate\" ".
                                      "title=\"$link_title\" ".
                                      "href=\"$link_href\" ".
                                      "type=\"application/$type+xml\" ".
                                      "/>\n";
                        }
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name),
                       esc_attr(href(project=>undef, action=>"project_index")));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name),
                       esc_attr(href(project=>undef, action=>"opml")));
        }
}
3816
# Print the <link> elements of the HTML <head>: stylesheets, feed links
# (only when $status is '200 OK') and the favicon.
sub print_header_links {
        my $status = shift;

        # a $stylesheet defined in an (old) config file wins over
        # @stylesheets, for backwards compatibility; empty entries of
        # @stylesheets are skipped
        my @css_urls = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $css_url (@css_urls) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($css_url).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }

        print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n)
                if defined $favicon;
}
3836
# Print the breadcrumb trail of the page header:
#   home / project / action / extra
# The project part is printed only when $project is defined.  When the
# -action_extra option is given, the action becomes a link and the extra
# text is appended after it as is.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $extra = $opts{-action_extra};

        my $trail = $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                $trail .= $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        my $action_print = defined $extra
                                ? $cgi->a({-href => href(action=>$action)}, $action)
                                : $action;
                        $trail .= " / $action_print";
                }
                if (defined $extra) {
                        $trail .= " / $extra";
                }
                $trail .= "\n";
        }
        print $trail;
}
3857
# Print the search form of the page header.
#
# The form searches from $hash_base, falling back to $hash and then to
# "HEAD".  With the 'pathinfo' feature enabled the project is made part of
# the form's action URL; otherwise it is sent as the hidden 'p' parameter.
# Side effect: an undefined $searchtext is set to the empty string.
sub print_search_form {
        if (!defined $searchtext) {
                $searchtext = "";
        }
        my $search_hash;
        if (defined $hash_base) {
                $search_hash = $hash_base;
        } elsif (defined $hash) {
                $search_hash = $hash;
        } else {
                $search_hash = "HEAD";
        }
        my $action = $my_uri;
        my $use_pathinfo = gitweb_check_feature('pathinfo');
        if ($use_pathinfo) {
                $action .= "/".esc_url($project);
        }
        # start_form(), not the deprecated startform() alias: the alias was
        # removed from CGI.pm in version 4.04, and the form is closed with
        # end_form() below anyway
        print $cgi->start_form(-method => "get", -action => $action) .
              "<div class=\"search\">\n" .
              (!$use_pathinfo &&
              $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
              $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
              $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
              $cgi->popup_menu(-name => 'st', -default => 'commit',
                               -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
              $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
              " search:\n",
              $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
              "<span title=\"Extended regular expression\">" .
              $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
                             -checked => $search_use_regexp) .
              "</span>" .
              "</div>" .
              $cgi->end_form() . "\n";
}
3893
# Print the HTTP header (unless the -no_http_header option is set) and the
# top of the HTML page: XML prolog, <head>, site header file, logo,
# breadcrumbs and, for a project with the 'search' feature, the search form.
#
# Parameters: HTTP status (defaults to "200 OK"), expiry passed to the
# HTTP header, then options; the options are also handed on to
# print_nav_breadcrumbs().
sub git_header_html {
        my $status = shift || "200 OK";
        my $expires = shift;
        my %opts = @_;

        my $title = get_page_title();
        my $content_type = get_content_type_html();
        if (!$opts{'-no_http_header'}) {
                print $cgi->header(-type=>$content_type, -charset => 'utf-8',
                                   -status=> $status, -expires => $expires);
        }

        my $mod_perl_version = '';
        if ($ENV{'MOD_PERL'}) {
                $mod_perl_version = " $ENV{'MOD_PERL'}";
        }
        print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
        # relative stylesheet, favicon etc. URLs would be resolved against
        # the path_info part of the URL unless a base URL is given
        print "<base href=\"".esc_url($base_url)."\" />\n"
                if $ENV{'PATH_INFO'};
        print_header_links($status);

        print to_utf8($site_html_head_string)
                if defined $site_html_head_string;

        print "</head>\n" .
              "<body>\n";

        insert_file($site_header)
                if (defined $site_header && -f $site_header);

        print "<div class=\"page_header\">\n";
        if (defined $logo) {
                my $logo_img = $cgi->img({-src => esc_url($logo),
                                          -width => 72, -height => 27,
                                          -alt => "git",
                                          -class => "logo"});
                print $cgi->a({-href => esc_url($logo_url),
                               -title => $logo_label},
                              $logo_img);
        }
        print_nav_breadcrumbs(%opts);
        print "</div>\n";

        my $search_enabled = gitweb_check_feature('search');
        print_search_form()
                if (defined $project && $search_enabled);
}
3952
# Print the bottom of the HTML page: the footer with feed links (per
# project RSS/Atom, or site-wide OPML/TXT), the optional page generation
# statistics ('timed' feature), the site footer file, the JavaScript
# includes and the closing </body></html> tags.
sub git_footer_html {
        my $feed_class = 'rss_logo';

        print "<div class=\"page_footer\">\n";
        if (!defined $project) {
                print $cgi->a({-href => href(project=>undef, action=>"opml"),
                              -class => $feed_class}, "OPML") . " ";
                print $cgi->a({-href => href(project=>undef, action=>"project_index"),
                              -class => $feed_class}, "TXT") . "\n";
        } else {
                my $descr = git_get_project_description($project);
                print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
                        if defined $descr;

                my %href_params = get_feed_info();
                # no feed information at all: mark the links as generic
                $feed_class .= ' generic'
                        unless %href_params;
                $href_params{'-title'} ||= 'log';

                foreach my $format (qw(RSS Atom)) {
                        $href_params{'action'} = lc($format);
                        my $feed_link = $cgi->a({-href => href(%href_params),
                                                -title => "$href_params{'-title'} $format feed",
                                                -class => $feed_class}, $format);
                        print $feed_link."\n";
                }
        }
        print "</div>\n"; # class="page_footer"

        if (defined $t0 && gitweb_check_feature('timed')) {
                print "<div id=\"generating_info\">\n";
                print join('',
                           'This page took ',
                           '<span id="generating_time" class="time_span">',
                           tv_interval($t0, [ gettimeofday() ]),
                           ' seconds </span>',
                           ' and ',
                           '<span id="generating_cmd">',
                           $number_of_git_cmds,
                           '</span> git commands ',
                           " to generate.\n");
                print "</div>\n"; # id="generating_info"
        }

        insert_file($site_footer)
                if (defined $site_footer && -f $site_footer);

        print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
        if (defined $action && $action eq 'blame_incremental') {
                my $blame_data_url = href(action=>"blame_data", -replay=>1);
                my $base_url_js = href();
                print qq!<script type="text/javascript">\n!.
                      qq!startBlame("!. $blame_data_url .qq!",\n!.
                      qq!           "!. $base_url_js .qq!");\n!.
                      qq!</script>\n!;
        } else {
                my ($jstimezone, $tz_cookie, $datetime_class) =
                        gitweb_get_feature('javascript-timezone');

                # statements of the window.onload handler
                my @onload;
                push @onload, qq!       fixLinks();\n!
                        if gitweb_check_feature('javascript-actions');
                if ($jstimezone && $tz_cookie && $datetime_class) {
                        push @onload,
                             qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!, # in days
                             qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
                }

                print qq!<script type="text/javascript">\n!.
                      qq!window.onload = function () {\n!.
                      join('', @onload).
                      qq!};\n!.
                      qq!</script>\n!;
        }

        print "</body>\n" .
              "</html>";
}
4029
# die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
# Example: die_error(404, 'Hash not found')
# By convention, use the following status codes (as defined in RFC 2616):
# 400: Invalid or missing CGI parameters, or
#      requested object exists but has wrong type.
# 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
#      this server or project.
# 404: Requested object/revision/project doesn't exist.
# 500: The server isn't configured properly, or
#      an internal error occurred (e.g. failed assertions caused by bugs), or
#      an unknown error occurred (e.g. the git binary died unexpectedly).
# 503: The server is currently unavailable (because it is overloaded,
#      or down for maintenance).  Generally, this is a temporary state.
#
# Prints a complete error page (header, message, optional details, footer)
# and then jumps to DONE_GITWEB, unless the -error_handler option is set.
# The error message is HTML-escaped; the detailed description is printed
# as is.  A status code that is not listed above is sent to the client as
# '500 Internal Server Error'; the page body still shows the code given.
sub die_error {
        my $status = shift || 500;
        my $error = esc_html(shift) || "Internal Server Error";
        my $extra = shift;
        my %opts = @_;

        my %http_responses = (
                400 => '400 Bad Request',
                403 => '403 Forbidden',
                404 => '404 Not Found',
                500 => '500 Internal Server Error',
                503 => '503 Service Unavailable',
        );
        # An unlisted status must not reach git_header_html() as undef:
        # it would default to "200 OK" there and the error page would be
        # served as a success.
        my $http_status = $http_responses{$status} || $http_responses{500};
        git_header_html($http_status, undef, %opts);
        print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
        if (defined $extra) {
                print "<hr />\n" .
                      "$extra\n";
        }
        print "</div>\n";

        git_footer_html();
        goto DONE_GITWEB
                unless ($opts{'-error_handler'});
}
4073
4074 ## ----------------------------------------------------------------------
4075 ## functions printing or outputting HTML: navigation
4076
# Print the page navigation bar: links to the summary, shortlog, log,
# commit, commitdiff and tree views plus the entries configured through
# the 'actions' feature, followed by the $extra line (pager or formats).
#
# $current is printed as plain text instead of a link, $suppress (if set)
# is left out, $head is the commit the commit-related links point at, and
# $treehead / $treebase give hash and hash_base of the tree link.
sub git_print_page_nav {
        my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
        $extra = '' if !defined $extra; # pager or formats

        my @navs = qw(summary shortlog log commit commitdiff tree);
        @navs = grep { $_ ne $suppress } @navs
                if $suppress;

        # href() parameters of every built-in view
        my %arg;
        foreach my $view (@navs) {
                $arg{$view} = { action => $view };
        }
        if (defined $head) {
                my @views_with_head = qw(commit commitdiff);
                if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x) {
                        push @views_with_head, qw(shortlog log);
                }
                foreach my $view (@views_with_head) {
                        $arg{$view}{'hash'} = $head;
                }
        }

        if (defined $treehead) {
                $arg{'tree'}{'hash'} = $treehead;
        }
        if (defined $treebase) {
                $arg{'tree'}{'hash_base'} = $treebase;
        }

        # the 'actions' feature is a flat list of (label, link, position)
        # triples; %-escapes in the link are expanded from %repl
        my @actions = gitweb_get_feature('actions');
        my %repl = (
                '%' => '%',
                'n' => $project,         # project name
                'f' => $git_dir,         # project path within filesystem
                'h' => $treehead || '',  # current hash ('h' parameter)
                'b' => $treebase || '',  # hash base ('hb' parameter)
        );
        while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
                # insert the label after every entry named $pos
                my @with_label;
                foreach my $view (@navs) {
                        push @with_label, $view;
                        push @with_label, $label if $view eq $pos;
                }
                @navs = @with_label;
                # munch munch
                $link =~ s/%([%nfhb])/$repl{$1}/g;
                $arg{$label}{'_href'} = $link;
        }

        my @items;
        foreach my $view (@navs) {
                if ($view eq $current) {
                        push @items, $view;
                        next;
                }
                my $url = $arg{$view}{_href} ? $arg{$view}{_href} : href(%{$arg{$view}});
                push @items, scalar $cgi->a({-href => $url}, "$view");
        }

        print "<div class=\"page_nav\">\n" . join(" | ", @items);
        print "<br/>\n$extra<br/>\n" .
              "</div>\n";
}
4126
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes): entries are joined with " | ", the current view is plain text
# instead of a link, and the remotes view is listed only if the
# 'remote_heads' feature is enabled
sub format_ref_views {
        my ($current) = @_;

        my @ref_views = ('tags', 'heads');
        if (gitweb_check_feature('remote_heads')) {
                push @ref_views, 'remotes';
        }

        my @entries;
        foreach my $view (@ref_views) {
                if ($view eq $current) {
                        push @entries, $view;
                } else {
                        push @entries, scalar $cgi->a({-href => href(action=>$view)}, $view);
                }
        }
        return join(" | ", @entries);
}
4139
# Return the "first . prev . next" pager as an HTML string.
#
# "first" and "prev" are links only when $page is greater than 0, "next" is
# a link only when $has_next_link is true.  All links replay the current
# request with a different 'page' parameter.  $action is accepted but not
# used.
sub format_paging_nav {
        my ($action, $page, $has_next_link) = @_;

        my ($first, $prev) = ("first", "prev");
        if ($page > 0) {
                $first = $cgi->a({-href => href(-replay=>1, page=>undef)}, "first");
                $prev  = $cgi->a({-href => href(-replay=>1, page=>$page-1),
                                  -accesskey => "p", -title => "Alt-p"}, "prev");
        }

        my $next = "next";
        if ($has_next_link) {
                $next = $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }

        return join(" &sdot; ", $first, $prev, $next);
}
4165
4166 ## ......................................................................
4167 ## functions printing or outputting HTML: div
4168
# Print a <div class="header"> holding a single link to the $action view.
# $hash and $hash_base are added to the link when they are true; the link
# text is $title, or $action when $title is false.
sub git_print_header_div {
        my ($action, $title, $hash, $hash_base) = @_;

        my %args = ('action' => $action);
        if ($hash) {
                $args{'hash'} = $hash;
        }
        if ($hash_base) {
                $args{'hash_base'} = $hash_base;
        }

        my $label = $title ? $title : $action;
        my $link = $cgi->a({-href => href(%args), -class => "title"}, $label);

        print "<div class=\"header\">\n" .
              $link .
              "\n</div>\n";
}
4182
# Return one table row of class "metadata_url" with $name in the first and
# $url in the second cell; both values are inserted as is.
sub format_repo_url {
        my ($name, $url) = @_;

        my $cells = "<td>$name</td>" . "<td>$url</td>";
        return "<tr class=\"metadata_url\">" . $cells . "</tr>\n";
}
4187
# Group output by placing it in a DIV element and adding a header.
#
# Arguments, in this order:
#  * optionally a hash reference: options for start_div()
#  * optionally an array reference: arguments for git_print_header_div()
#  * the content, handled according to what ref() says about it:
#      'CODE'   - called with all the remaining parameters
#      'SCALAR' - dereferenced and printed after html escaping
#      'GLOB' or 'IO::Handle' - read with <...> and printed
#      not a reference, but defined - printed as-is
#    anything else prints no content
sub git_print_section {
        my ($div_args, $header_args);
        $div_args    = shift if ref($_[0]) eq 'HASH';
        $header_args = shift if ref($_[0]) eq 'ARRAY';
        my $content = shift;

        print $cgi->start_div($div_args);
        git_print_header_div(@$header_args);

        my $kind = ref($content);
        if ($kind eq 'CODE') {
                $content->(@_);
        } elsif ($kind eq 'SCALAR') {
                print esc_html($$content);
        } elsif ($kind eq 'GLOB' or $kind eq 'IO::Handle') {
                print <$content>;
        } elsif (!$kind && defined($content)) {
                print $content;
        }

        print $cgi->end_div;
}
4225
# Return the HTML for a timestamp: the 'rfc2822' entry of the date hash
# (wrapped in a <span> of the class given by the third value of the
# 'javascript-timezone' feature, when that is set), followed by the local
# time in parentheses.  A local hour below 6 is marked with class "atnight".
sub format_timestamp_html {
        my $date = shift;

        my $strtime = $date->{'rfc2822'};
        my (undef, undef, $datetime_class) =
                gitweb_get_feature('javascript-timezone');
        $strtime = qq!<span class="$datetime_class">$strtime</span>!
                if $datetime_class;

        my $at_night = $date->{'hour_local'} < 6;
        my $localtime_format = $at_night
                ? '(<span class="atnight">%02d:%02d</span> %s)'
                : '(%02d:%02d %s)';
        my $localtime = sprintf($localtime_format,
                                $date->{'hour_local'}, $date->{'minute_local'}, $date->{'tz_local'});

        return $strtime . ' ' . $localtime;
}
4246
# Outputs the author name and date in long form: one element of class
# "author_date" holding the author (as an author-search link), the
# timestamp in brackets and the avatar.
# The element is a <div> unless another tag is given with the -tag option.
sub git_print_authorship {
        my ($co, %opts) = @_;
        my $tag = $opts{-tag} || 'div';
        my $author = $co->{'author_name'};

        my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});

        my $who    = format_search_author($author, "author", esc_html($author));
        my $when   = format_timestamp_html(\%ad);
        my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

        print "<$tag class=\"author_date\">" .
              $who .
              " [".$when."]".
              $avatar .
              "</$tag>\n";
}
4261
# Outputs table rows containing the full author or committer information,
# in the format expected for 'commit' view (& similar).
# Parameters are a commit hash reference, followed by the list of people
# to output information for. If the list is empty it defaults to both
# author and committer.
# Two rows are printed per person: name, email and (spanning both rows)
# the avatar in the first, the timestamp in the second.
sub git_print_authorship_rows {
        my ($co, @people) = @_;
        @people = ('author', 'committer') unless @people;

        foreach my $who (@people) {
                my $name  = $co->{"${who}_name"};
                my $email = $co->{"${who}_email"};
                my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

                my $name_link  = format_search_author($name, $who,
                                                      esc_html($name));
                my $email_link = format_search_author($email, $who,
                                                      esc_html("<" . $email . ">"));
                my $avatar     = git_get_avatar($email, -size => 'double');
                my $timestamp  = format_timestamp_html(\%wd);

                print "<tr><td>$who</td><td>" .
                      $name_link . " " .
                      $email_link .
                      "</td><td rowspan=\"2\">" .
                      $avatar .
                      "</td></tr>\n" .
                      "<tr>" .
                      "<td></td><td>" .
                      $timestamp .
                      "</td>" .
                      "</tr>\n";
        }
}
4289
# Print the <div class="page_path"> line: a link to the tree root followed
# by one 'tree' link per directory of $name and, last, the basename.
#
# Parameters:
#   $name - path to print; nothing but the root link is printed if undefined
#   $type - 'blob' makes the basename a 'blob_plain' link, 'tree' makes it
#           a 'tree' link followed by " / "; otherwise it is plain text
#   $hb   - hash base used by all the links
sub git_print_page_path {
        my $name = shift;
        my $type = shift;
        my $hb = shift;


        print "<div class=\"page_path\">";
        print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
                      -title => 'tree root'}, to_utf8("[$project]"));
        print " / ";
        if (defined $name) {
                my @dirname = split '/', $name;
                my $basename = pop @dirname;
                my $fullname = '';

                foreach my $dir (@dirname) {
                        $fullname .= ($fullname ? '/' : '') . $dir;
                        print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
                                                     hash_base=>$hb),
                                      -title => $fullname}, esc_path($dir));
                        print " / ";
                }
                # the links below point at $name, the path that was passed
                # in, and not at the global $file_name, so that link target,
                # title and link text always describe the same path
                if (defined $type && $type eq 'blob') {
                        print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                } elsif (defined $type && $type eq 'tree') {
                        print $cgi->a({-href => href(action=>"tree", file_name=>$name,
                                                     hash_base=>$hb),
                                      -title => $name}, esc_path($basename));
                        print " / ";
                } else {
                        print esc_path($basename);
                }
        }
        print "<br/></div>\n";
}
4327
# Print a commit message as HTML, every line followed by "<br/>".
#
# $log is a reference to the array of message lines; it is modified in
# place (the title, if requested, and leading empty lines are removed).
# Runs of empty lines are printed as a single empty line, and empty lines
# directly after a signoff-like line (Signed-off-by, Acked-by, Cc) are not
# printed at all.
# Options:
#   -remove_title     => drop the first line of the message
#   -remove_signoff   => do not print signoff-like lines
#   -final_empty_line => end with an empty line unless the last line
#                        printed was already empty
sub git_print_log {
        my $log = shift;
        my %opts = @_;

        if ($opts{'-remove_title'}) {
                # remove title, i.e. first line of log
                shift @$log;
        }
        # remove leading empty lines
        while (defined $log->[0] && $log->[0] eq "") {
                shift @$log;
        }

        # print log
        my $signoff = 0; # only signoff / empty lines seen since last signoff
        my $empty = 0;   # last line printed was an empty one
        foreach my $line (@$log) {
                if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
                        $signoff = 1;
                        $empty = 0;
                        if (! $opts{'-remove_signoff'}) {
                                print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
                        }
                        next;
                }

                if ($line eq "") {
                        # print only one empty line
                        # do not print empty line after signoff
                        next if ($empty || $signoff);
                        $empty = 1;
                } else {
                        $empty = 0;
                        # $signoff is cleared only here, by ordinary text:
                        # clearing it before the test above would make the
                        # "after signoff" rule a no-op
                        $signoff = 0;
                }

                print format_log_line_html($line) . "<br/>\n";
        }

        if ($opts{'-final_empty_line'}) {
                # end with single empty line
                print "<br/>\n" unless $empty;
        }
}
4376
# return link target (what link points to): the whole output of
# "git cat-file blob <hash>", unmodified.
# Returns nothing if the command cannot be started or if closing the pipe
# reports a failure.
sub git_get_link_target {
        my $hash = shift;

        # read link
        open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
                or return;
        # slurp the whole output in one read
        my $link_target = do { local $/ = undef; <$fd> };
        close $fd
                or return;

        return $link_target;
}
4394
# given link target, and the directory (basedir) the link is in,
# return target of link relative to top directory (top tree);
# return undef if it is not possible (including absolute links).
#
# An undefined or empty basedir means the top (root) tree.  Empty path
# components and '.' are dropped, '..' removes the preceding component;
# a '..' with nothing left to remove means the link leads outside the
# repository.  Components are compared as strings, so a file or directory
# named "0" is kept like any other.
sub normalize_link_target {
        my ($link_target, $basedir) = @_;

        # absolute symlinks (beginning with '/') cannot be normalized
        return if (substr($link_target, 0, 1) eq '/');

        # normalize link target to path from top (root) tree (dir)
        my $path;
        if (defined $basedir && $basedir ne '') {
                $path = $basedir . '/' . $link_target;
        } else {
                # we are in top (root) tree (dir)
                $path = $link_target;
        }

        # remove //, /./, and /../
        my @path_parts;
        foreach my $part (split('/', $path)) {
                # discard '.' and ''; a plain truth test must not be used
                # here, because it would also discard the valid name "0"
                next if ($part eq '' || $part eq '.');
                # handle '..'
                if ($part eq '..') {
                        # link leads outside repository (outside top dir)
                        return unless @path_parts;
                        pop @path_parts;
                } else {
                        push @path_parts, $part;
                }
        }

        return join('/', @path_parts);
}
4434
# print tree entry (row of git_tree), but without encompassing <tr> element
#
# The cells of a row are: mode, size (only if the entry has a 'size' key),
# name and action links.
#   blob  - name links to the 'blob' view (for symbolic links followed by
#           " -> target"); actions are blob, blame (if $have_blame),
#           history (if $hash_base is defined) and raw
#   tree  - name links to the 'tree' view; actions are tree and history
#           (if $hash_base is defined)
#   other - (this includes 'commit' objects, i.e. submodules) plain name;
#           the only action is history (if $hash_base is defined)
# $basedir is prepended to the entry name as is to form the file name.
sub git_print_tree_entry {
        my ($t, $basedir, $hash_base, $have_blame) = @_;

        my %base_key = ();
        $base_key{'hash_base'} = $hash_base if defined $hash_base;

        print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
        print "<td class=\"size\">$t->{'size'}</td>\n"
                if exists $t->{'size'};

        my $type = $t->{'type'};
        if ($type eq "blob") {
                my $path = "$basedir$t->{'name'}";
                my $blob_url = href(action=>"blob", hash=>$t->{'hash'},
                                    file_name=>$path, %base_key);

                print "<td class=\"list\">" .
                        $cgi->a({-href => $blob_url, -class => "list"},
                                esc_path($t->{'name'}));
                if (S_ISLNK(oct $t->{'mode'})) {
                        my $link_target = git_get_link_target($t->{'hash'});
                        if ($link_target) {
                                my $norm_target = normalize_link_target($link_target, $basedir);
                                my $target_html = esc_path($link_target);
                                # link only to targets inside the repository
                                if (defined $norm_target) {
                                        $target_html =
                                                $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
                                                                       file_name=>$norm_target),
                                                         -title => $norm_target}, $target_html);
                                }
                                print " -> " . $target_html;
                        }
                }
                print "</td>\n";

                my @links = (scalar $cgi->a({-href => $blob_url}, "blob"));
                if ($have_blame) {
                        push @links, scalar
                                $cgi->a({-href => href(action=>"blame", hash=>$t->{'hash'},
                                                       file_name=>$path, %base_key)},
                                        "blame");
                }
                if (defined $hash_base) {
                        push @links, scalar
                                $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                       hash=>$t->{'hash'}, file_name=>$path)},
                                        "history");
                }
                push @links, scalar
                        $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
                                               file_name=>$path)},
                                "raw");
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } elsif ($type eq "tree") {
                my $path = "$basedir$t->{'name'}";
                my $tree_url = href(action=>"tree", hash=>$t->{'hash'},
                                    file_name=>$path,
                                    %base_key);

                print "<td class=\"list\">" .
                      $cgi->a({-href => $tree_url}, esc_path($t->{'name'})) .
                      "</td>\n";

                my @links = (scalar $cgi->a({-href => $tree_url}, "tree"));
                if (defined $hash_base) {
                        push @links, scalar
                                $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
                                                       file_name=>$path)},
                                        "history");
                }
                print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

        } else {
                # unknown object: we can only present history for it
                # (this includes 'commit' object, i.e. submodule support)
                print "<td class=\"list\">" .
                      esc_path($t->{'name'}) .
                      "</td>\n";

                my $history = '';
                if (defined $hash_base) {
                        $history = $cgi->a({-href => href(action=>"history",
                                                          hash_base=>$hash_base,
                                                          file_name=>"$basedir$t->{'name'}")},
                                           "history");
                }
                print "<td class=\"link\">" . $history . "</td>\n";
        }
}
4527
4528 ## ......................................................................
4529 ## functions printing large fragments of HTML
4530
# Fill in the pre-image file names of a merge (combined) diff entry.
#
# $diff    - hashref describing one combined diff raw line; its 'nparents',
#            'status' and 'from_id' entries are read
# @parents - parent ids, indexed the same way as $diff->{'status'}
#
# Sets $diff->{'from_file'} to an arrayref with one slot per parent: the
# result of git_get_path_by_hash() where the status for that parent is
# 'R' or 'C', undef otherwise.  Returns $diff.
sub fill_from_file_info {
        my ($diff, @parents) = @_;

        my $nparents = $diff->{'nparents'};
        my @from_files;

        $diff->{'from_file'} = \@from_files;
        # touch the last slot so that the list has one entry per parent
        $from_files[$nparents - 1] = undef;

        foreach my $idx (0 .. $nparents - 1) {
                my $status = $diff->{'status'}[$idx];
                next unless ($status eq 'R' || $status eq 'C');

                # only for these statuses is the pre-image name looked up
                $from_files[$idx] =
                        git_get_path_by_hash($parents[$idx], $diff->{'from_id'}[$idx]);
        }

        return $diff;
}
4547
# Does the given raw difftree line describe a file deletion?
#
# $diffinfo - hashref of parsed raw diff format; only 'to_id' is read
#
# A deletion is recognised by an all-zero post-image object id.  Both the
# 40 hex digit (SHA-1) and the 64 hex digit (SHA-256) forms of the null id
# are accepted.  Returns true for a deletion, false otherwise.
sub is_deleted {
        my $diffinfo = shift;

        my $to_id = $diffinfo->{'to_id'};

        return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4554
# does patch correspond to [previous] difftree raw line
# $diffinfo  - hashref of parsed raw diff format
# $patchinfo - hashref of parsed patch diff format
#              (the same keys as in $diffinfo)
#
# Returns true when both arguments are defined and their 'to_file' entries
# are equal as strings, false otherwise.
#
# A missing (undefined) 'to_file' is compared as the empty string: the
# outcome is the same as a plain 'eq' would give, but without triggering
# an "uninitialized value" warning when the patch header could not be
# parsed and the caller passes { 'to_file' => undef }.
sub is_patch_split {
        my ($diffinfo, $patchinfo) = @_;

        return '' unless defined $diffinfo && defined $patchinfo;

        my $raw_name   = $diffinfo->{'to_file'};
        my $patch_name = $patchinfo->{'to_file'};
        $raw_name   = '' unless defined $raw_name;
        $patch_name = '' unless defined $patch_name;

        return $raw_name eq $patch_name;
}
4565
4566
# Print the list of changed files ("difftree") as an HTML table.
#
# $difftree - arrayref of raw difftree lines; each one is parsed with
#             parsed_difftree_line()
# $hash     - id used as hash_base for links to the result (post-image) side
# @parents  - parent ids; the first one is used as hash_base for links to
#             the pre-image side of an ordinary diff, and more than one
#             parent selects the "combined" table layout
#
# Reads the global $action ('commitdiff' adds links to the patches on the
# same page) and uses the global $cgi to generate links.  Output goes to
# the currently selected filehandle; nothing useful is returned.
sub git_difftree_body {
        my ($difftree, $hash, @parents) = @_;
        my ($parent) = $parents[0];
        my $have_blame = gitweb_check_feature('blame');
        print "<div class=\"list_head\">\n";
        # the summary line is shown only for longer lists (more than 11 entries)
        if ($#{$difftree} > 10) {
                print(($#{$difftree} + 1) . " files changed:\n");
        }
        print "</div>\n";

        print "<table class=\"" .
              (@parents > 1 ? "combined " : "") .
              "diff_tree\">\n";

        # header only for combined diff in 'commitdiff' view
        my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
        if ($has_header) {
                # table header
                print "<thead><tr>\n" .
                       "<th></th><th></th>\n"; # filename, patchN link
                for (my $i = 0; $i < @parents; $i++) {
                        my $par = $parents[$i];
                        print "<th>" .
                              $cgi->a({-href => href(action=>"commitdiff",
                                                     hash=>$hash, hash_parent=>$par),
                                       -title => 'commitdiff to parent number ' .
                                                  ($i+1) . ': ' . substr($par,0,7)},
                                      $i+1) .
                              "&nbsp;</th>\n";
                }
                print "</tr></thead>\n<tbody>\n";
        }

        my $alternate = 1;
        # number of the patch a row links to; patches are numbered from 1
        my $patchno = 0;
        foreach my $line (@{$difftree}) {
                my $diff = parsed_difftree_line($line);

                if ($alternate) {
                        print "<tr class=\"dark\">\n";
                } else {
                        print "<tr class=\"light\">\n";
                }
                $alternate ^= 1;

                if (exists $diff->{'nparents'}) { # combined diff

                        fill_from_file_info($diff, @parents)
                                unless exists $diff->{'from_file'};

                        if (!is_deleted($diff)) {
                                # file exists in the result (child) commit
                                print "<td>" .
                                      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash),
                                              -class => "list"}, esc_path($diff->{'to_file'})) .
                                      "</td>\n";
                        } else {
                                print "<td>" .
                                      esc_path($diff->{'to_file'}) .
                                      "</td>\n";
                        }

                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print "<td class=\"link\">" .
                                      $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | " .
                                      "</td>\n";
                        }

                        # one cell per parent; the flags collected here decide
                        # which links go into the last cell of the row
                        my $has_history = 0;
                        my $not_deleted = 0;
                        for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
                                my $hash_parent = $parents[$i];
                                my $from_hash = $diff->{'from_id'}[$i];
                                my $from_path = $diff->{'from_file'}[$i];
                                my $status = $diff->{'status'}[$i];

                                $has_history ||= ($status ne 'A');
                                $not_deleted ||= ($status ne 'D');

                                if ($status eq 'A') {
                                        print "<td  class=\"link\" align=\"right\"> | </td>\n";
                                } elsif ($status eq 'D') {
                                        print "<td class=\"link\">" .
                                              $cgi->a({-href => href(action=>"blob",
                                                                     hash_base=>$hash,
                                                                     hash=>$from_hash,
                                                                     file_name=>$from_path)},
                                                      "blob" . ($i+1)) .
                                              " | </td>\n";
                                } else {
                                        if ($diff->{'to_id'} eq $from_hash) {
                                                print "<td class=\"link nochange\">";
                                        } else {
                                                print "<td class=\"link\">";
                                        }
                                        print $cgi->a({-href => href(action=>"blobdiff",
                                                                     hash=>$diff->{'to_id'},
                                                                     hash_parent=>$from_hash,
                                                                     hash_base=>$hash,
                                                                     hash_parent_base=>$hash_parent,
                                                                     file_name=>$diff->{'to_file'},
                                                                     file_parent=>$from_path)},
                                                      "diff" . ($i+1)) .
                                              " | </td>\n";
                                }
                        }

                        print "<td class=\"link\">";
                        if ($not_deleted) {
                                print $cgi->a({-href => href(action=>"blob",
                                                             hash=>$diff->{'to_id'},
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "blob");
                                print " | " if ($has_history);
                        }
                        if ($has_history) {
                                print $cgi->a({-href => href(action=>"history",
                                                             file_name=>$diff->{'to_file'},
                                                             hash_base=>$hash)},
                                              "history");
                        }
                        print "</td>\n";

                        print "</tr>\n";
                        next; # instead of 'else' clause, to avoid extra indent
                }
                # else ordinary diff

                # an all-zero mode leaves the corresponding variables undefined
                my ($to_mode_oct, $to_mode_str, $to_file_type);
                my ($from_mode_oct, $from_mode_str, $from_file_type);
                if ($diff->{'to_mode'} ne ('0' x 6)) {
                        $to_mode_oct = oct $diff->{'to_mode'};
                        if (S_ISREG($to_mode_oct)) { # only for regular file
                                $to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
                        }
                        $to_file_type = file_type($diff->{'to_mode'});
                }
                if ($diff->{'from_mode'} ne ('0' x 6)) {
                        $from_mode_oct = oct $diff->{'from_mode'};
                        if (S_ISREG($from_mode_oct)) { # only for regular file
                                $from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
                        }
                        $from_file_type = file_type($diff->{'from_mode'});
                }

                if ($diff->{'status'} eq "A") { # created
                        my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
                        $mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
                        $mode_chng   .= "]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                      "blob");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "D") { # deleted
                        # the file exists only in the parent, hence hash_base=>$parent
                        my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'}),
                                       -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chng</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
                                                     hash_base=>$parent, file_name=>$diff->{'file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
                        my $mode_chnge = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                $mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
                                if ($from_file_type ne $to_file_type) {
                                        $mode_chnge .= " from $from_file_type to $to_file_type";
                                }
                                if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
                                        if ($from_mode_str && $to_mode_str) {
                                                $mode_chnge .= " mode: $from_mode_str->$to_mode_str";
                                        } elsif ($to_mode_str) {
                                                $mode_chnge .= " mode: $to_mode_str";
                                        }
                                }
                                $mode_chnge .= "]</span>\n";
                        }
                        print "<td>";
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'}),
                                      -class => "list"}, esc_path($diff->{'file'}));
                        print "</td>\n";
                        print "<td>$mode_chnge</td>\n";
                        print "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only mode changed)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'file'})},
                                              "diff") .
                                      " | ";
                        }
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'file'})},
                                       "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                     file_name=>$diff->{'file'})},
                                      "history");
                        print "</td>\n";

                } elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
                        my %status_name = ('R' => 'moved', 'C' => 'copied');
                        my $nstatus = $status_name{$diff->{'status'}};
                        my $mode_chng = "";
                        if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
                                # mode also for directories, so we cannot use $to_mode_str
                                $mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
                        }
                        print "<td>" .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
                                                     hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
                                      -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
                              "<td><span class=\"file_status $nstatus\">[$nstatus from " .
                              $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
                                                     hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
                                      -class => "list"}, esc_path($diff->{'from_file'})) .
                              " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
                              "<td class=\"link\">";
                        if ($action eq 'commitdiff') {
                                # link to patch
                                $patchno++;
                                print $cgi->a({-href => href(-anchor=>"patch$patchno")},
                                              "patch") .
                                      " | ";
                        } elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
                                # "commit" view and modified file (not only pure rename or copy)
                                print $cgi->a({-href => href(action=>"blobdiff",
                                                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
                                                             hash_base=>$hash, hash_parent_base=>$parent,
                                                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
                                              "diff") .
                                      " | ";
                        }
                        # 'to_id' and 'to_file' name the post-image, so the link
                        # has to be based on $hash, the same as the file name,
                        # "blame" and "history" links of this row
                        print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
                                                     hash_base=>$hash, file_name=>$diff->{'to_file'})},
                                      "blob") . " | ";
                        if ($have_blame) {
                                print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
                                                             file_name=>$diff->{'to_file'})},
                                              "blame") . " | ";
                        }
                        print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
                                                    file_name=>$diff->{'to_file'})},
                                      "history");
                        print "</td>\n";

                } # we should not encounter Unmerged (U) or Unknown (X) status
                print "</tr>\n";
        }
        print "</tbody>" if $has_header;
        print "</table>\n";
}
4874
# Print one chunk of a diff in side-by-side layout.
#
# Takes a list of [ $class, $line ] pairs, where $line is the already
# formatted HTML of a diff line and $class is one of 'chunk_header',
# 'ctx', 'rem', 'add' or 'incomplete'.  Chunk headers are printed as they
# are; runs of context lines are printed in both the "old" and the "new"
# column; runs of removed and/or added lines are printed as a "rem", "add"
# or "chg" block.  Prints to the currently selected filehandle.
sub print_sidebyside_diff_chunk {
        my @entries = @_;

        return unless @entries;

        # an 'incomplete' entry belongs to whatever kind of line precedes
        # it (removed, added or context), so it takes over that class
        foreach my $idx (1 .. $#entries) {
                next unless $entries[$idx][0] eq 'incomplete';
                $entries[$idx][0] = $entries[$idx - 1][0];
        }

        # one column ("old" or "new") of a block
        my $column = sub {
                my ($side, @content) = @_;
                return join '', "<div class=\"$side\">", @content, '</div>';
        };
        # whole block of the given kind, made of already rendered columns
        my $block = sub {
                my ($kind, @columns) = @_;
                return join '', "<div class=\"chunk_block $kind\">", @columns, '</div>';
        };

        my (@context, @removed, @added);

        # the trailing empty pair is a guardian: it flushes what is still
        # accumulated and then terminates the loop
        foreach my $entry (@entries, ["", ""]) {
                my ($class, $line) = @$entry;

                # chunk headers go straight to output
                if ($class && $class eq 'chunk_header') {
                        print $line;
                        next;
                }

                my $ends_context = (!$class || $class eq 'rem' || $class eq 'add');
                my $ends_change  = (!$class || $class eq 'ctx');

                # context lines are shown on both sides
                if (@context && $ends_context) {
                        my $html = $block->('ctx',
                                            $column->('old', @context),
                                            $column->('new', @context));
                        print $html;
                        @context = ();
                }

                # pure removal, pure addition, or (assumed) change
                if ((@removed || @added) && $ends_change) {
                        my $kind = !@added   ? 'rem'
                                 : !@removed ? 'add'
                                 :             'chg';
                        my @columns;
                        push @columns, $column->('old', @removed) if @removed;
                        push @columns, $column->('new', @added)   if @added;

                        my $html = $block->($kind, @columns);
                        print $html;
                        @removed = ();
                        @added   = ();
                }

                # guardian value (or an empty line) ends the processing
                last unless $line;

                # accumulate the line according to its class
                if ($class eq 'rem') {
                        push @removed, $line;
                } elsif ($class eq 'add') {
                        push @added, $line;
                } elsif ($class eq 'ctx') {
                        push @context, $line;
                }
        }
}
4963
4964 sub git_patchset_body {
4965         my ($fd, $diff_style, $difftree, $hash, @hash_parents) = @_;
4966         my ($hash_parent) = $hash_parents[0];
4967
4968         my $is_combined = (@hash_parents > 1);
4969         my $patch_idx = 0;
4970         my $patch_number = 0;
4971         my $patch_line;
4972         my $diffinfo;
4973         my $to_name;
4974         my (%from, %to);
4975         my @chunk; # for side-by-side diff
4976
4977         print "<div class=\"patchset\">\n";
4978
4979         # skip to first patch
4980         while ($patch_line = <$fd>) {
4981                 chomp $patch_line;
4982
4983                 last if ($patch_line =~ m/^diff /);
4984         }
4985
4986  PATCH:
4987         while ($patch_line) {
4988
4989                 # parse "git diff" header line
4990                 if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
4991                         # $1 is from_name, which we do not use
4992                         $to_name = unquote($2);
4993                         $to_name =~ s!^b/!!;
4994                 } elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
4995                         # $1 is 'cc' or 'combined', which we do not use
4996                         $to_name = unquote($2);
4997                 } else {
4998                         $to_name = undef;
4999                 }
5000
5001                 # check if current patch belong to current raw line
5002                 # and parse raw git-diff line if needed
5003                 if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
5004                         # this is continuation of a split patch
5005                         print "<div class=\"patch cont\">\n";
5006                 } else {
5007                         # advance raw git-diff output if needed
5008                         $patch_idx++ if defined $diffinfo;
5009
5010                         # read and prepare patch information
5011                         $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5012
5013                         # compact combined diff output can have some patches skipped
5014                         # find which patch (using pathname of result) we are at now;
5015                         if ($is_combined) {
5016                                 while ($to_name ne $diffinfo->{'to_file'}) {
5017                                         print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5018                                               format_diff_cc_simplified($diffinfo, @hash_parents) .
5019                                               "</div>\n";  # class="patch"
5020
5021                                         $patch_idx++;
5022                                         $patch_number++;
5023
5024                                         last if $patch_idx > $#$difftree;
5025                                         $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5026                                 }
5027                         }
5028
5029                         # modifies %from, %to hashes
5030                         parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);
5031
5032                         # this is first patch for raw difftree line with $patch_idx index
5033                         # we index @$difftree array from 0, but number patches from 1
5034                         print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
5035                 }
5036
5037                 # git diff header
5038                 #assert($patch_line =~ m/^diff /) if DEBUG;
5039                 #assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
5040                 $patch_number++;
5041                 # print "git diff" header
5042                 print format_git_diff_header_line($patch_line, $diffinfo,
5043                                                   \%from, \%to);
5044
5045                 # print extended diff header
5046                 print "<div class=\"diff extended_header\">\n";
5047         EXTENDED_HEADER:
5048                 while ($patch_line = <$fd>) {
5049                         chomp $patch_line;
5050
5051                         last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);
5052
5053                         print format_extended_diff_header_line($patch_line, $diffinfo,
5054                                                                \%from, \%to);
5055                 }
5056                 print "</div>\n"; # class="diff extended_header"
5057
5058                 # from-file/to-file diff header
5059                 if (! $patch_line) {
5060                         print "</div>\n"; # class="patch"
5061                         last PATCH;
5062                 }
5063                 next PATCH if ($patch_line =~ m/^diff /);
5064                 #assert($patch_line =~ m/^---/) if DEBUG;
5065
5066                 my $last_patch_line = $patch_line;
5067                 $patch_line = <$fd>;
5068                 chomp $patch_line;
5069                 #assert($patch_line =~ m/^\+\+\+/) if DEBUG;
5070
5071                 print format_diff_from_to_header($last_patch_line, $patch_line,
5072                                                  $diffinfo, \%from, \%to,
5073                                                  @hash_parents);
5074
5075                 # the patch itself
5076         LINE:
5077                 while ($patch_line = <$fd>) {
5078                         chomp $patch_line;
5079
5080                         next PATCH if ($patch_line =~ m/^diff /);
5081
5082                         my ($class, $line) = process_diff_line($patch_line, \%from, \%to);
5083                         my $diff_classes = "diff";
5084                         $diff_classes .= " $class" if ($class);
5085                         $line = "<div class=\"$diff_classes\">$line</div>\n";
5086
5087                         if ($diff_style eq 'sidebyside' && !$is_combined) {
5088                                 if ($class eq 'chunk_header') {
5089                                         print_sidebyside_diff_chunk(@chunk);
5090                                         @chunk = ( [ $class, $line ] );
5091                                 } else {
5092                                         push @chunk, [ $class, $line ];
5093                                 }
5094                         } else {
5095                                 # default 'inline' style and unknown styles
5096                                 print $line;
5097                         }
5098                 }
5099
5100         } continue {
5101                 if (@chunk) {
5102                         print_sidebyside_diff_chunk(@chunk);
5103                         @chunk = ();
5104                 }
5105                 print "</div>\n"; # class="patch"
5106         }
5107
5108         # for compact combined (--cc) format, with chunk and patch simplification
5109         # the patchset might be empty, but there might be unprocessed raw lines
5110         for (++$patch_idx if $patch_number > 0;
5111              $patch_idx < @$difftree;
5112              ++$patch_idx) {
5113                 # read and prepare patch information
5114                 $diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
5115
5116                 # generate anchor for "patch" links in difftree / whatchanged part
5117                 print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
5118                       format_diff_cc_simplified($diffinfo, @hash_parents) .
5119                       "</div>\n";  # class="patch"
5120
5121                 $patch_number++;
5122         }
5123
5124         if ($patch_number == 0) {
5125                 if (@hash_parents > 1) {
5126                         print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
5127                 } else {
5128                         print "<div class=\"diff nodifferences\">No differences found</div>\n";
5129                 }
5130         }
5131
5132         print "</div>\n"; # class="patchset"
5133 }
5134
5135 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
5136
# Completes the project records referenced from $projlist with the data
# shown in the projects list and returns the completed records:
#  - age, age_string: always, from git_get_last_activity()
#  - descr, descr_long, owner: only when not already defined
#  - ctags: only when the 'ctags' feature is enabled
#  - category: only when grouping by category is on and it is not yet defined
# Projects for which git_get_last_activity() returns nothing are left out
# of the returned list.
# NOTE: the records are updated in place, but $projlist itself keeps all
# of its entries
sub fill_project_list_info {
	my $projlist = shift;
	my $show_ctags = gitweb_check_feature('ctags');
	my @filled;

	foreach my $pr (@$projlist) {
		my $path = $pr->{'path'};

		# no activity information => the project is not listed at all
		my @activity = git_get_last_activity($path);
		next unless @activity;
		@{$pr}{'age', 'age_string'} = @activity;

		unless (defined $pr->{'descr'}) {
			# keep the full description next to the shortened one
			my $descr = to_utf8(git_get_project_description($path) || "");
			$pr->{'descr_long'} = $descr;
			$pr->{'descr'} = chop_str($descr, $projects_list_description_width, 5);
		}

		unless (defined $pr->{'owner'}) {
			$pr->{'owner'} = git_get_project_owner("$path") || "";
		}

		$pr->{'ctags'} = git_get_project_ctags($path)
			if $show_ctags;

		if ($projects_list_group_categories && !defined $pr->{'category'}) {
			$pr->{'category'} = to_utf8(git_get_project_category($path) ||
			                            $project_list_default_category);
		}

		push @filled, $pr;
	}

	return @filled;
}
5176
# Returns the projects from the array referenced by $projlist ordered
# according to $order, which is one of 'project', 'descr', 'owner' (string
# comparison) or 'age' (numeric comparison).  For any other $order the
# projects are returned in their original sequence.
sub sort_projects_list {
	my ($projlist, $order) = @_;

	# sort order name => project field to compare, and how to compare it
	my %order_info = (
		project => { key => 'path', type => 'str' },
		descr => { key => 'descr_long', type => 'str' },
		owner => { key => 'owner', type => 'str' },
		age => { key => 'age', type => 'num' }
	);

	my $oi = $order_info{$order};
	return @$projlist unless defined $oi;

	my $field = $oi->{'key'};
	my @sorted = ($oi->{'type'} eq 'str')
		? sort { $a->{$field} cmp $b->{$field} } @$projlist
		: sort { $a->{$field} <=> $b->{$field} } @$projlist;

	return @sorted;
}
5197
# Groups entries $from..$to of the array referenced by $projlist by their
# 'category' field.  $from defaults to 0; $to defaults to (and is capped
# at) the last index of the list.
# Returns category name => reference to the array of projects in it, as a
# hash in list context and as a hash reference in scalar context.
sub build_projlist_by_category {
	my ($projlist, $from, $to) = @_;

	my $last = $#$projlist;
	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	my %categories;
	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];
		push @{ $categories{ $pr->{'category'} } }, $pr;
	}

	return %categories if wantarray;
	return \%categories;
}
5214
# print the 'sort by' <th> element built by format_sort_th(); takes the
# same arguments and passes them on unchanged
sub print_sort_th {
	my @th = format_sort_th(@_);
	print @th;
}
5220
# Returns the <th> element for one sortable column.
#  $name   - name of the sort order this column stands for
#  $order  - sort order currently in effect
#  $header - column title, inserted as-is; defaults to ucfirst($name)
# The title is plain text when the column is the current sort order, and
# otherwise a link replaying the current request with order=$name.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header ||= ucfirst($name);

	# already sorted by this column: nothing to click on
	return "<th>$header</th>\n" if ($order eq $name);

	my $link = $cgi->a({-href => href(-replay=>1, order=>$name),
	                    -class => "header"}, $header);
	return "<th>" . $link . "</th>\n";
}
5237
# Prints one table row for each of the entries $from..$to of the array
# referenced by $projlist ($from defaults to 0, $to to the last index and
# is capped there).  Rows alternate between the "dark" and "light" classes,
# starting with "dark".  When $check_forks is true each row starts with an
# additional cell holding the forks marker.
sub git_project_list_rows {
	my ($projlist, $from, $to, $check_forks) = @_;

	my $last = $#$projlist;
	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	my @row_class = ("dark", "light");
	my $row = 0;

	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];
		my $path = $pr->{'path'};
		# URL of the given action for this project
		my $action_href = sub { href(project=>$path, action=>$_[0]) };

		print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";

		if ($check_forks) {
			print "<td>";
			my $forks = $pr->{'forks'};
			if ($forks) {
				my $nforks = scalar @$forks;
				if ($nforks <= 0) {
					# nothing to link to, the marker only carries the title
					print $cgi->span({-title => "$nforks forks"}, "+");
				} else {
					print $cgi->a({-href => $action_href->("forks"),
					               -title => "$nforks forks"}, "+");
				}
			}
			print "</td>\n";
		}

		# project name, description and owner
		print "<td>" . $cgi->a({-href => $action_href->("summary"),
		                        -class => "list"}, esc_html($path)) . "</td>\n" .
		      "<td>" . $cgi->a({-href => $action_href->("summary"),
		                        -class => "list", -title => $pr->{'descr_long'}},
		                        esc_html($pr->{'descr'})) . "</td>\n" .
		      "<td><i>" . chop_and_escape_str($pr->{'owner'}, 15) . "</i></td>\n";

		# action links; "forks" only for projects that have a forks entry
		my @links;
		foreach my $action (qw(summary shortlog log tree)) {
			push @links, $cgi->a({-href => $action_href->($action)}, $action);
		}
		if ($pr->{'forks'}) {
			push @links, $cgi->a({-href => $action_href->("forks")}, "forks");
		}

		my $age_text = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
		print "<td class=\"". age_class($pr->{'age'}) . "\">" . $age_text . "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
}
5286
# Prints the projects list table (preceded by the tag cloud when the
# 'ctags' feature is enabled) for the array referenced by $projlist.
#  $order     - sort order name; falls back to $default_projects_order
#  $from, $to - window of the filtered list to show; defaults to all of it
#  $extra     - HTML for an additional final row, printed as-is
#  $no_header - when true, the row with the column headers is left out
# Prints a "No such projects found" notice instead of the table when the
# window is empty.
sub git_project_list_body {
	# actually uses global variable $project
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
	my @projects = @$projlist;

	my $check_forks = gitweb_check_feature('forks');
	my $show_ctags  = gitweb_check_feature('ctags');
	my $tagfilter = $show_ctags ? $input_params{'ctag'} : undef;
	# no forks handling while a tag filter or a search is active
	$check_forks = undef
		if ($tagfilter || $search_regexp);

	# filtering out forks before filling info allows to do less work
	@projects = filter_forks_from_projects_list(\@projects)
		if ($check_forks);
	@projects = fill_project_list_info(\@projects);
	# searching projects require filling to be run before it
	@projects = search_projects_list(\@projects,
	                                 'search_regexp' => $search_regexp,
	                                 'tagfilter'  => $tagfilter)
		if ($tagfilter || $search_regexp);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects if (!defined $to || $#projects < $to);

	# short circuit
	if ($from > $to) {
		print "<center>\n".
		      "<b>No such projects found</b><br />\n".
		      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
		      "</center>\n<br />\n";
		return;
	}

	@projects = sort_projects_list(\@projects, $order);

	if ($show_ctags) {
		my $ctags = git_gather_all_ctags(\@projects);
		my $cloud = git_populate_project_tagcloud($ctags);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	unless ($no_header) {
		print "<tr>\n";
		if ($check_forks) {
			print "<th></th>\n";
		}
		print_sort_th('project', $order, 'Project');
		print_sort_th('descr', $order, 'Description');
		print_sort_th('owner', $order, 'Owner');
		print_sort_th('age', $order, 'Last Change');
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}

	if ($projects_list_group_categories) {
		# only display categories with projects in the $from-$to window
		@projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
		# @projects now holds just the window, indexed from 0 again, so
		# $from and $to must not be applied to it a second time: group
		# the whole (already windowed) list
		my %categories = build_projlist_by_category(\@projects);
		foreach my $cat (sort keys %categories) {
			unless ($cat eq "") {
				print "<tr>\n";
				if ($check_forks) {
					print "<td></td>\n";
				}
				print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
				print "</tr>\n";
			}

			git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
		}
	} else {
		git_project_list_rows(\@projects, $from, $to, $check_forks);
	}

	if (defined $extra) {
		print "<tr>\n";
		if ($check_forks) {
			print "<td></td>\n";
		}
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5373
# Prints the full log entries (header line, commit/commitdiff/tree links,
# authorship and commit message) for entries $from..$to of the array
# referenced by $commitlist; empty entries are skipped.
#  $from, $to - window to show; default to the whole list, $to is capped
#               at the last index
#  $refs      - passed to format_ref_marker() for each commit
#  $extra     - if true, HTML printed as-is in a "page_nav" div at the end
sub git_log_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# start at $from, like git_shortlog_body and git_history_body do
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
5412
# Prints the "shortlog" table: one row (date, author, subject, links) for
# each of the entries $from..$to of the array referenced by $commitlist.
#  $from, $to - window to show; default to the whole list, $to is capped
#               at the last index
#  $refs      - passed to format_ref_marker() for each commit
#  $extra     - if defined, HTML printed as-is in an additional final row
sub git_shortlog_body {
	# uses global variable $project
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	my $last = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	# rows alternate between the two classes, starting with "dark"
	my @row_class = ("dark", "light");
	my $row = 0;

	print "<table class=\"shortlog\">\n";
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";

		# git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 10) . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my @links = (
			$cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
			$cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree"),
		);
		# snapshot links are shown only when there are any
		my $snapshot_links = format_snapshot_links($commit);
		push @links, $snapshot_links if (defined $snapshot_links);

		print "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5456
# Prints the "history" table for one file or directory: one row (date,
# author, subject, links) for each non-empty entry $from..$to of the array
# referenced by $commitlist.
#  $from, $to - window to show; default to the whole list, $to is capped
#               at the last index
#  $refs      - passed to format_ref_marker() for each commit
#  $extra     - if defined, HTML printed as-is in an additional final row
#  $file_name - path whose history is shown
#  $file_hash - hash of the current version, used for "diff to current"
#  $ftype     - used both as the action and as the label of the first link
# Uses the global variable $hash_base for the "diff to current" link.
sub git_history_body {
	# Warning: assumes constant type (blob or tree) during history
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	my $last = $#{$commitlist};
	$from = 0 unless defined $from;
	$to = $last if (!defined $to || $to > $last);

	# rows alternate between the two classes, starting with "dark";
	# skipped entries do not take part in the alternation
	my @row_class = ("dark", "light");
	my $row = 0;

	print "<table class=\"history\">\n";
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
	# shortlog:   format_author_html('td', \%co, 10)
		      format_author_html('td', \%co, 15, 3) . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my @links = (
			$cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype),
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
		);

		if ($ftype eq 'blob') {
			# offer a diff only when both blobs are known and they differ
			my $blob_current = $file_hash;
			my $blob_parent  = git_get_hash_by_path($commit, $file_name);
			my $differs = defined $blob_current && defined $blob_parent &&
			              $blob_current ne $blob_parent;
			if ($differs) {
				push @links,
					$cgi->a({-href => href(action=>"blobdiff",
					                       hash=>$blob_current, hash_parent=>$blob_parent,
					                       hash_base=>$hash_base, hash_parent_base=>$commit,
					                       file_name=>$file_name)},
					        "diff to current");
			}
		}

		print "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5516
# Prints the "tags" table: one row (age, name, subject, link to the tag
# object, links for the tagged object) for each of the entries $from..$to
# of the array referenced by $taglist.
#  $from, $to - window to show; default to the whole list, $to is capped
#               at the last index
#  $extra     - if defined, HTML printed as-is in an additional final row
sub git_tags_body {
	# uses global variable $project
	my ($taglist, $from, $to, $extra) = @_;

	my $last = $#{$taglist};
	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	# rows alternate between the two classes, starting with "dark"
	my @row_class = ("dark", "light");
	my $row = 0;

	print "<table class=\"tags\">\n";
	foreach my $idx ($from .. $to) {
		my %tag = %{ $taglist->[$idx] };
		my $reftype = $tag{'reftype'};

		# the subject is optional; shorten it only if there is one
		my $comment = $tag{'subject'};
		my $comment_short;
		$comment_short = chop_str($comment, 30, 5) if (defined $comment);

		print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";

		if (!defined $tag{'age'}) {
			print "<td></td>\n";
		} else {
			print "<td><i>$tag{'age'}</i></td>\n";
		}

		print "<td>" .
		      $cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'}),
		               -class => "list name"}, esc_html($tag{'name'})) .
		      "</td>\n" .
		      "<td>";
		if (defined $comment) {
			print format_subject_html($comment, $comment_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}
		print "</td>\n" .
		      "<td class=\"selflink\">";

		# only entries of type "tag" get a link to the tag object itself
		if ($tag{'type'} ne "tag") {
			print "&nbsp;";
		} else {
			print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
		}

		# links for the tagged object, depending on its type
		my @links = ($cgi->a({-href => href(action=>$reftype, hash=>$tag{'refid'})}, $reftype));
		if ($reftype eq "commit") {
			push @links,
				$cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog"),
				$cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
		} elsif ($reftype eq "blob") {
			push @links,
				$cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}

		print "</td>\n" .
		      "<td class=\"link\"> | " . join(" | ", @links) .
		      "</td>\n" .
		      "</tr>";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5579
# Prints the "heads" table: one row (age, name, shortlog/log/tree links)
# for each of the entries $from..$to of the array referenced by $headlist.
#  $head_at   - if defined, the head whose 'id' equals it gets the
#               "current_head" class on its name cell
#  $from, $to - window to show; default to the whole list, $to is capped
#               at the last index
#  $extra     - if defined, HTML printed as-is in an additional final row
sub git_heads_body {
	# uses global variable $project
	my ($headlist, $head_at, $from, $to, $extra) = @_;

	my $last = $#{$headlist};
	$from = 0 unless defined $from;
	$to = $last unless (defined $to && $to <= $last);

	# rows alternate between the two classes, starting with "dark"
	my @row_class = ("dark", "light");
	my $row = 0;

	print "<table class=\"heads\">\n";
	foreach my $idx ($from .. $to) {
		my %ref = %{ $headlist->[$idx] };
		my $fullname = $ref{'fullname'};

		my $curr = defined $head_at && $ref{'id'} eq $head_at;
		my $name_cell = $curr ? "<td class=\"current_head\">" : "<td>";

		my @links = (
			$cgi->a({-href => href(action=>"shortlog", hash=>$fullname)}, "shortlog"),
			$cgi->a({-href => href(action=>"log", hash=>$fullname)}, "log"),
			$cgi->a({-href => href(action=>"tree", hash=>$fullname, hash_base=>$fullname)}, "tree"),
		);

		print "<tr class=\"" . $row_class[$row++ % 2] . "\">\n";
		print "<td><i>$ref{'age'}</i></td>\n" .
		      $name_cell .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$fullname),
		               -class => "list name"},esc_html($ref{'name'})) .
		      "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>";
	}

	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5617
# Display a single remote block: a table with the remote's URL(s),
# followed by the table of its heads.
#  $remote - name of the remote, used for the "..." link
#  $rdata  - hash reference with the remote's 'heads', 'fetch' and 'push'
#  $limit  - if defined, upper index passed to git_heads_body(); when
#            there are more heads than that, a "..." link to the remote's
#            own page is added
#  $head   - passed to git_heads_body() as the current head
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# compare only when there is a push URL at all, so that a
		# fetch-only remote does not trigger an "uninitialized value"
		# warning; it is shown with just its "Fetch URL" row
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	# link to the full list of heads when not all of them are shown
	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
5651
# Display a list of remote names with the respective fetch and push URLs
#  $remotedata - hash reference: remote name => hash reference with the
#                remote's 'fetch' and 'push' URLs
#  $limit      - if true and smaller than the number of remotes, only the
#                first $limit remotes (sorted by name) are shown, followed
#                by a "..." link to the "remotes" action
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	$#remotes = $limit - 1 if $limited;

	# iterate over the list itself rather than testing each shifted name
	# for truth, so that a remote named "0" does not end the listing early
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# a missing URL is shown as plain text instead of a link
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
5695
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names
#  $remotedata - hash reference: remote name => data about that remote
#  $limit      - if true and smaller than the number of remotes, only the
#                list of names is shown; otherwise it is passed on to
#                git_remote_block()
#  $head       - passed on to git_remote_block()
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;
	if ($limit and $limit < keys %$remotedata) {
		git_remotes_list($remotedata, $limit);
	} else {
		fill_remote_heads($remotedata);
		# walk the remotes sorted by name, as git_remotes_list() does:
		# the order of the sections is then the same on every request
		# and does not depend on the state of the hash's iterator
		foreach my $remote (sort keys %$remotedata) {
			my $rdata = $remotedata->{$remote};
			git_print_section({-class=>"remote", -id=>$remote},
				["remotes", $remote, $remote], sub {
					git_remote_block($remote, $rdata, $limit, $head);
				});
		}
	}
}
5712
# Prints the complete result page of a search in commit messages, authors
# or committers (selected by the global $searchtype) for the pattern in the
# global $searchtext, starting at the global $hash.
# Takes the commit the search started from as a hash (list of key/value
# pairs); its 'tree' and 'title' are used for the navigation and header.
# Results are shown 100 per page, the page being selected by the global
# $page.
sub git_search_message {
	my %co = @_;

	# git option selecting what the pattern is matched against
	my %grep_option = (
		commit    => "--grep=",
		author    => "--author=",
		committer => "--committer=",
	);
	my $greptype = $grep_option{$searchtype};
	$greptype .= $searchtext;

	# ask for one commit more than is shown on a page: a 101st result
	# means that there is a next page
	my $match_mode = $search_use_regexp ? '--extended-regexp' : '--fixed-strings';
	my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
	                               $greptype, '--regexp-ignore-case',
	                               $match_mode);

	# "first", "prev" and "next" are links only where they lead somewhere
	my @nav;
	if ($page > 0) {
		push @nav, $cgi->a({-href => href(-replay=>1, page=>undef)},
		                   "first");
		push @nav, $cgi->a({-href => href(-replay=>1, page=>$page-1),
		                    -accesskey => "p", -title => "Alt-p"}, "prev");
	} else {
		push @nav, "first", "prev";
	}

	my $next_link = '';
	if ($#commitlist >= 100) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
		push @nav, $next_link;
	} else {
		push @nav, "next";
	}
	my $paging_nav = join(" &sdot; ", @nav);

	git_header_html();

	git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash);
	if ($page == 0 && !@commitlist) {
		print "<p>No match.</p>\n";
	} else {
		git_search_grep_body(\@commitlist, 0, 99, $next_link);
	}

	git_footer_html();
}
5762
# Print the "pickaxe" search results page: commits reported by
# "git log -S<searchtext>", each listed with the files it touched.
#
# Arguments: a parsed commit as a flat key/value list (%co).  Only its
# 'tree' and 'title' entries are read, for the navigation bar and the
# page header.  The page is printed directly; die_error() is invoked if
# git-log cannot be started.
sub git_search_changes {
        my %co = @_;

        local $/ = "\n";
        open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
                '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
                ($search_use_regexp ? '--pickaxe-regex' : ())
                        or die_error(500, "Open git-log failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"pickaxe search\">\n";
        my $alternate = 1;
        # From here on %co holds the commit whose table row is currently
        # open; it is empty while no row is open.
        undef %co;

        # Close the row of the commit in %co: end the file-list cell and
        # append the "commit | tree" links.  No-op when no row is open.
        my $finish_commit = sub {
                return unless %co;
                print "</td>\n" .
                      "<td class=\"link\">" .
                      $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})},
                              "commit") .
                      " | " .
                      $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'},
                                             hash_base=>$co{'id'})},
                              "tree") .
                      "</td>\n" .
                      "</tr>\n";
        };

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line;

                my %set = parse_difftree_raw_line($line);
                if (defined $set{'commit'}) {
                        # a new commit starts: finish the previous one first
                        $finish_commit->();

                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        %co = parse_commit($set{'commit'});
                        my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
                        print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                              "<td><i>$author</i></td>\n" .
                              "<td>" .
                              $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                      -class => "list subject"},
                                      chop_and_escape_str($co{'title'}, 50) . "<br/>");
                } elsif (defined $set{'to_id'}) {
                        # skip deletions: there is no resulting blob to link to
                        next if ($set{'to_id'} =~ m/^0{40}$/);

                        # The link targets 'to_file', so label it with the same
                        # name whenever 'file' is not provided.
                        # NOTE(review): presumably parse_difftree_raw_line() leaves
                        # 'file' unset for renames/copies -- confirm.
                        my $shown_file = defined $set{'file'} ? $set{'file'} : $set{'to_file'};

                        print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
                                                     hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
                                      -class => "list"},
                                      "<span class=\"match\">" . esc_path($shown_file) . "</span>") .
                              "<br/>\n";
                }
        }
        close $fd;

        # finish the last commit, if any
        $finish_commit->();

        print "</table>\n";

        git_footer_html();
}
5845
# Print the "grep" search results page: lines of files in the commit's
# tree that match $searchtext, grouped by file (one table row per file).
#
# Arguments: a parsed commit as a flat key/value list (%co); its 'tree',
# 'id' and 'title' entries are read.  The listing is cut off after roughly
# 1000 output lines of git-grep.  die_error() is invoked if git-grep cannot
# be started.
sub git_search_files {
        my %co = @_;

        local $/ = "\n";
        open my $fd, "-|", git_cmd(), 'grep', '-n', '-z',
                $search_use_regexp ? ('-E', '-i') : '-F',
                $searchtext, $co{'tree'}
                        or die_error(500, "Open git-grep failed");

        git_header_html();

        git_print_page_nav('','', $hash,$co{'tree'},$hash);
        git_print_header_div('commit', esc_html($co{'title'}), $hash);

        print "<table class=\"grep_search\">\n";
        my $alternate = 1;
        my $matches = 0;
        # undef until the first file row has been opened; using definedness
        # rather than truth keeps a file literally named "0" working
        my $lastfile;
        my $file_href;
        while (my $line = <$fd>) {
                chomp $line;
                my ($file, $lno, $ltext, $binary);
                last if ($matches++ > 1000);
                if ($line =~ /^Binary file (.+) matches$/) {
                        $file = $1;
                        $binary = 1;
                } else {
                        ($file, $lno, $ltext) = split(/\0/, $line, 3);
                }
                # git-grep on a tree-ish prefixes names with "<tree>:"; strip it
                # for binary matches as well, so their blob links are usable
                $file =~ s/^\Q$co{'tree'}\E://;

                if (!defined $lastfile || $file ne $lastfile) {
                        print "</td></tr>\n" if defined $lastfile;
                        # toggle between the two row classes; a post-increment
                        # test here would stay true forever (all rows "dark")
                        if ($alternate) {
                                print "<tr class=\"dark\">\n";
                        } else {
                                print "<tr class=\"light\">\n";
                        }
                        $alternate ^= 1;
                        $file_href = href(action=>"blob", hash_base=>$co{'id'},
                                          file_name=>$file);
                        print "<td class=\"list\">".
                                $cgi->a({-href => $file_href, -class => "list"}, esc_path($file));
                        print "</td><td>\n";
                        $lastfile = $file;
                }
                if ($binary) {
                        print "<div class=\"binary\">Binary file</div>\n";
                } else {
                        $ltext = untabify($ltext);
                        # highlight the matched part of the line
                        if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
                                $ltext = esc_html($1, -nbsp=>1);
                                $ltext .= '<span class="match">';
                                $ltext .= esc_html($2, -nbsp=>1);
                                $ltext .= '</span>';
                                $ltext .= esc_html($3, -nbsp=>1);
                        } else {
                                $ltext = esc_html($ltext, -nbsp=>1);
                        }
                        print "<div class=\"pre\">" .
                                $cgi->a({-href => $file_href.'#l'.$lno,
                                        -class => "linenr"}, sprintf('%4i', $lno)) .
                                ' ' .  $ltext . "</div>\n";
                }
        }
        if (defined $lastfile) {
                print "</td></tr>\n";
                if ($matches > 1000) {
                        print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
                }
        } else {
                print "<div class=\"diff nodifferences\">No matches found</div>\n";
        }
        close $fd;

        print "</table>\n";

        git_footer_html();
}
5923
# Print the table of commits found by a commit-message/author/committer
# search.
#
# Arguments:
#   $commitlist - reference to an array of parsed commits (hash refs)
#   $from, $to  - first and last index of $commitlist to show; $from
#                 defaults to 0, $to is clamped to the last index
#   $extra      - optional HTML printed in an additional final row
#
# For every commit shown, the comment lines matching $search_regexp are
# listed with the match highlighted and some context around it.
sub git_search_grep_body {
        my ($commitlist, $from, $to, $extra) = @_;

        my $last_index = $#{$commitlist};
        $from = 0 if !defined $from;
        $to = $last_index unless (defined $to && $to <= $last_index);

        print "<table class=\"commit_search\">\n";

        my $dark_row = 1;
        foreach my $idx ($from .. $to) {
                my %co = %{$commitlist->[$idx]};
                next unless %co;

                # rows alternate between the two classes, starting with "dark"
                my $row_class = $dark_row ? "dark" : "light";
                $dark_row = $dark_row ? 0 : 1;
                print "<tr class=\"$row_class\">\n";

                my $subject_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
                                 -class => "list subject"},
                                chop_and_escape_str($co{'title'}, 50) . "<br/>");
                print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
                      format_author_html('td', \%co, 15, 5) .
                      "<td>" .
                      $subject_link;

                foreach my $line (@{$co{'comment'}}) {
                        next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
                        my ($lead, $match, $trail) = ($1, $2, $3);

                        # shorten the match, then share out what is left of
                        # 80 columns (at most 30 per side) as context
                        $match = chop_str($match, 70, 5, 'center');
                        my $contextlen = int((80 - length($match))/2);
                        if ($contextlen > 30) {
                                $contextlen = 30;
                        }
                        $lead  = esc_html(chop_str($lead,  $contextlen, 10, 'left'));
                        $trail = esc_html(chop_str($trail, $contextlen, 10, 'right'));
                        $match = esc_html($match);

                        print "$lead<span class=\"match\">$match</span>$trail<br />";
                }

                my @links = (
                        $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit"),
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$co{'id'})}, "commitdiff"),
                        $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree"),
                );
                print "</td>\n" .
                      "<td class=\"link\">" .
                      join(" | ", @links);
                print "</td>\n" .
                      "</tr>\n";
        }

        if (defined $extra) {
                print "<tr>\n" .
                      "<td colspan=\"3\">$extra</td>\n" .
                      "</tr>\n";
        }
        print "</table>\n";
}
5983
5984 ## ======================================================================
5985 ## ======================================================================
5986 ## actions
5987
# Action: print the list of all projects, preceded by the optional
# $home_text include and a project search form.
#
# Reads the 'order' input parameter; any value other than none, project,
# descr, owner or age is rejected with a 400 error.  A 404 error is
# reported when there are no projects at all.
sub git_project_list {
        my $order = $input_params{'order'};
        # anchored on both ends, so that only the exact keywords pass
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        git_header_html();
        if (defined $home_text && -f $home_text) {
                print "<div class=\"index_include\">\n";
                insert_file($home_text);
                print "</div>\n";
        }
        # start_form() is the documented name; the startform() alias is
        # deprecated in newer CGI.pm releases
        print $cgi->start_form(-method => "get") .
              "<p class=\"projsearch\">Search:\n" .
              $cgi->textfield(-name => "s", -value => $searchtext, -override => 1) . "\n" .
              "</p>" .
              $cgi->end_form() . "\n";
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6013
# Action: print the list of forks of the current project ($project).
#
# Reads the 'order' input parameter; any value other than none, project,
# descr, owner or age is rejected with a 400 error.  A 404 error is
# reported when no forks are found.
sub git_forks {
        my $order = $input_params{'order'};
        # anchored on both ends, so that only the exact keywords pass
        if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
                die_error(400, "Unknown order parameter");
        }

        my @list = git_get_projects_list($project);
        if (!@list) {
                die_error(404, "No forks found");
        }

        git_header_html();
        git_print_page_nav('','');
        # the header title is emitted as HTML (other callers in this file
        # pass esc_html()'d text), so escape the project name as well
        git_print_header_div('summary', esc_html("$project forks"));
        git_project_list_body(\@list, $order);
        git_footer_html();
}
6031
# Action: print a plain-text project index, one "<path> <owner>" line
# per project, with both fields percent-encoded.  A 404 error is reported
# when there are no projects.
sub git_project_index {
        my @projects = git_get_projects_list();
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/plain',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="index.aux"');

        # quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
        my $quote = sub {
                my $field = shift;
                $field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
                $field =~ s/ /\+/g;
                return $field;
        };

        for my $pr (@projects) {
                # look the owner up only if the project list did not supply one
                $pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
                        unless exists $pr->{'owner'};

                my $quoted_path  = $quote->($pr->{'path'});
                my $quoted_owner = $quote->($pr->{'owner'});

                print "$quoted_path $quoted_owner\n";
        }
}
6058
# Action: print the summary page of the current project: a metadata table
# (description, owner, last change, URLs, optional content tags), the
# optional README.html, and shortened shortlog / tags / heads / remotes /
# forks sections.
#
# Each shortened section shows at most 16 entries (indexes 0..15); one
# entry more is requested so that a "..." link to the full view can be
# added when there are further entries.
sub git_summary {
        my $descr = git_get_project_description($project) || "none";

        # "last change" data is derived from HEAD, when HEAD can be parsed
        my %co = parse_commit("HEAD");
        my %cd;
        %cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
        my $head = $co{'id'};
        my $remote_heads = gitweb_check_feature('remote_heads');

        my $owner = git_get_project_owner($project);

        my $refs = git_get_references();
        # These get_*_list functions return one more to allow us to see if
        # there are more ...
        my @taglist  = git_get_tags_list(16);
        my @headlist = git_get_heads_list(16);
        my %remotedata;
        %remotedata = git_get_remotes_list() if $remote_heads;

        my @forklist;
        if (gitweb_check_feature('forks')) {
                # find forks of a project ...
                @forklist = git_get_projects_list($project);
                # ... and filter out forks of forks
                if (@forklist) {
                        @forklist = filter_forks_from_projects_list(\@forklist);
                }
        }

        # "..." link to the full view $view; undef when the list whose last
        # index is $last_index fits into the 16 entries shown
        my $more_link = sub {
                my ($last_index, $view) = @_;
                return $last_index <= 15
                        ? undef
                        : $cgi->a({-href => href(action=>$view)}, "...");
        };

        git_header_html();
        git_print_page_nav('summary','', $head);

        print "<div class=\"title\">&nbsp;</div>\n";
        my $descr_row = "<tr id=\"metadata_desc\"><td>description</td><td>" . esc_html($descr) . "</td></tr>\n";
        my $owner_row = "<tr id=\"metadata_owner\"><td>owner</td><td>" . esc_html($owner) . "</td></tr>\n";
        print "<table class=\"projects_list\">\n" . $descr_row . $owner_row;
        if (defined $cd{'rfc2822'}) {
                print "<tr id=\"metadata_lchange\"><td>last change</td>" .
                      "<td>".format_timestamp_html(\%cd)."</td></tr>\n";
        }

        # use per project git URL list in $projectroot/$project/cloneurl
        # or make project git URL from git base URL and project name
        my @url_list = git_get_project_url_list($project);
        if (!@url_list) {
                @url_list = map { "$_/$project" } @git_base_url_list;
        }
        # only the first URL row carries the "URL" label
        my $url_tag = "URL";
        for my $git_url (grep { $_ } @url_list) {
                print format_repo_url($url_tag, $git_url);
                $url_tag = "";
        }

        # Tag cloud
        if (gitweb_check_feature('ctags')) {
                my $ctags = git_get_project_ctags($project);
                # without ability to add tags, don't show if there are none
                if (%$ctags) {
                        my $cloud = git_populate_project_tagcloud($ctags);
                        print "<tr id=\"metadata_ctags\">" .
                              "<td>content tags</td>" .
                              "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
                              "</tr>\n";
                }
        }

        print "</table>\n";

        # If XSS prevention is on, we don't include README.html.
        # TODO: Allow a readme in some safe format.
        my $readme = "$projectroot/$project/README.html";
        if (!$prevent_xss && -s $readme) {
                print "<div class=\"title\">readme</div>\n" .
                      "<div class=\"readme\">\n";
                insert_file($readme);
                print "\n</div>\n"; # class="readme"
        }

        # we need to request one more than 16 (0..15) to check if
        # those 16 are all
        my @commitlist;
        @commitlist = parse_commits($head, 17) if $head;
        if (@commitlist) {
                git_print_header_div('shortlog');
                git_shortlog_body(\@commitlist, 0, 15, $refs,
                                  $more_link->($#commitlist, "shortlog"));
        }

        if (@taglist) {
                git_print_header_div('tags');
                git_tags_body(\@taglist, 0, 15,
                              $more_link->($#taglist, "tags"));
        }

        if (@headlist) {
                git_print_header_div('heads');
                git_heads_body(\@headlist, $head, 0, 15,
                               $more_link->($#headlist, "heads"));
        }

        if (%remotedata) {
                git_print_header_div('remotes');
                git_remotes_body(\%remotedata, 15, $head);
        }

        if (@forklist) {
                git_print_header_div('forks');
                git_project_list_body(\@forklist, 'age', 0, 15,
                                      $more_link->($#forklist, "forks"),
                                      'no_header');
        }

        git_footer_html();
}
6172
# Action: print the page for the tag object $hash: a header table linking
# to the tagged object, the tagger information when present, and the tag
# message.  A 404 error is reported when the tag cannot be parsed.
sub git_tag {
        my %tag = parse_tag($hash);
        die_error(404, "Unknown tag object") unless %tag;

        my $head = git_get_head_hash($project);
        git_header_html();
        git_print_page_nav('','', $head,undef,$head);
        git_print_header_div('commit', esc_html($tag{'name'}), $hash);

        # both links of the header row lead to the tagged object, viewed
        # with the action named after its type
        my $object_url = href(action=>$tag{'type'}, hash=>$tag{'object'});
        my $object_cell = $cgi->a({-class => "list", -href => $object_url},
                                  $tag{'object'});
        my $type_cell = $cgi->a({-href => $object_url}, $tag{'type'});

        print "<div class=\"title_text\">\n" .
              "<table class=\"object_header\">\n" .
              "<tr>\n" .
              "<td>object</td>\n" .
              "<td>" . $object_cell . "</td>\n" .
              "<td class=\"link\">" . $type_cell . "</td>\n" .
              "</tr>\n";
        git_print_authorship_rows(\%tag, 'author')
                if defined($tag{'author'});
        print "</table>\n\n" .
              "</div>\n";

        # tag message, one line at a time
        print "<div class=\"page_body\">";
        foreach my $line (@{$tag{'comment'}}) {
                chomp $line;
                print esc_html($line, -nbsp=>1) . "<br/>\n";
        }
        print "</div>\n";
        git_footer_html();
}
6207
# Common implementation of the three blame actions.
#
# Argument: output format, one of
#   'porcelain'   (default) - complete blame table built on the server from
#                             "git blame -p"; switched to 'incremental' when
#                             the 'javascript' input parameter is true
#   'incremental'           - page with the plain file contents only (the
#                             page states that it requires JavaScript)
#   'data'                  - raw "git blame --incremental" output as
#                             text/plain, terminated by an "END" line
#
# Uses the globals $file_name, $hash_base and $hash; $hash_base defaults to
# the project's HEAD and $hash is looked up from the path when not given.
# Reports errors via die_error(): 403 if the blame feature is disabled,
# 400/404 for missing or wrong parameters, 500 if git cannot be started.
sub git_blame_common {
        my $format = shift || 'porcelain';
        if ($format eq 'porcelain' && $input_params{'javascript'}) {
                $format = 'incremental';
                $action = 'blame_incremental'; # for page title etc
        }

        # permissions
        gitweb_check_feature('blame')
                or die_error(403, "Blame view not allowed");

        # error checking
        die_error(400, "No file name given") unless $file_name;
        $hash_base ||= git_get_head_hash($project);
        die_error(404, "Couldn't find base commit") unless $hash_base;
        my %co = parse_commit($hash_base)
                or die_error(404, "Commit not found");
        my $ftype = "blob";
        if (!defined $hash) {
                $hash = git_get_hash_by_path($hash_base, $file_name, "blob")
                        or die_error(404, "Error looking up file");
        } else {
                $ftype = git_get_type($hash);
                # an object whose type cannot be determined is not a blob either
                if (!defined $ftype || $ftype !~ m/^blob$/) {
                        die_error(400, "Object is not a blob");
                }
        }

        my $fd;
        if ($format eq 'incremental') {
                # get file contents (as base)
                open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
                        or die_error(500, "Open git-cat-file failed");
        } elsif ($format eq 'data') {
                # run git-blame --incremental
                open $fd, "-|", git_cmd(), "blame", "--incremental",
                        $hash_base, "--", $file_name
                        or die_error(500, "Open git-blame --incremental failed");
        } else {
                # run git-blame --porcelain
                open $fd, "-|", git_cmd(), "blame", '-p',
                        $hash_base, '--', $file_name
                        or die_error(500, "Open git-blame --porcelain failed");
        }

        # incremental blame data returns early
        if ($format eq 'data') {
                print $cgi->header(
                        -type=>"text/plain", -charset => "utf-8",
                        -status=> "200 OK");
                local $| = 1; # output autoflush
                while (my $line = <$fd>) {
                        print to_utf8($line);
                }
                close $fd
                        or print "ERROR $!\n";

                # end marker, optionally followed by timing information
                print 'END';
                if (defined $t0 && gitweb_check_feature('timed')) {
                        print ' '.
                              tv_interval($t0, [ gettimeofday() ]).
                              ' '.$number_of_git_cmds;
                }
                print "\n";

                return;
        }

        # page header
        git_header_html();
        my $formats_nav =
                $cgi->a({-href => href(action=>"blob", -replay=>1)},
                        "blob") .
                " | ";
        if ($format eq 'incremental') {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
                                "blame") . " (non-incremental)";
        } else {
                $formats_nav .=
                        $cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
                                "blame") . " (incremental)";
        }
        $formats_nav .=
                " | " .
                $cgi->a({-href => href(action=>"history", -replay=>1)},
                        "history") .
                " | " .
                $cgi->a({-href => href(action=>$action, file_name=>$file_name)},
                        "HEAD");
        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
        git_print_page_path($file_name, $ftype, $hash_base);

        # page body
        if ($format eq 'incremental') {
                print "<noscript>\n<div class=\"error\"><center><b>\n".
                      "This page requires JavaScript to run.\n Use ".
                      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
                              'this page').
                      " instead.\n".
                      "</b></center></div>\n</noscript>\n";

                print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
        }

        print qq!<div class="page_body">\n!;
        print qq!<div id="progress_info">... / ...</div>\n!
                if ($format eq 'incremental');
        print qq!<table id="blame_table" class="blame" width="100%">\n!.
              #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
              qq!<thead>\n!.
              qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
              qq!</thead>\n!.
              qq!<tbody>\n!;

        my @rev_color = qw(light dark);
        my $num_colors = scalar(@rev_color);
        my $current_color = 0;

        if ($format eq 'incremental') {
                my $color_class = $rev_color[$current_color];

                #contents of a file
                my $linenr = 0;
                while (my $line = <$fd>) {
                        chomp $line;
                        $linenr++;

                        # commit and line links are left empty in this format
                        print qq!<tr id="l$linenr" class="$color_class">!.
                              qq!<td class="sha1"><a href=""> </a></td>!.
                              qq!<td class="linenr">!.
                              qq!<a class="linenr" href="">$linenr</a></td>!;
                        print qq!<td class="pre">! . esc_html($line) . "</td>\n";
                        print qq!</tr>\n!;
                }

        } else { # porcelain, i.e. ordinary blame
                my %metainfo = (); # saves information about commits

                # blame data
        LINE:
                while (my $line = <$fd>) {
                        chomp $line;
                        # the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
                        # no <lines in group> for subsequent lines in group of lines
                        my ($full_rev, $orig_lineno, $lineno, $group_size) =
                           ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
                        # skip anything that is not a header line, rather than
                        # using undefined values as hash key and in the output
                        next LINE unless defined $full_rev;
                        if (!exists $metainfo{$full_rev}) {
                                $metainfo{$full_rev} = { 'nprevious' => 0 };
                        }
                        my $meta = $metainfo{$full_rev};
                        my $data;
                        while ($data = <$fd>) {
                                chomp $data;
                                last if ($data =~ s/^\t//); # contents of line
                                # per-commit "<key> <value>" info; first value wins
                                if ($data =~ /^(\S+)(?: (.*))?$/) {
                                        $meta->{$1} = $2 unless exists $meta->{$1};
                                }
                                if ($data =~ /^previous /) {
                                        $meta->{'nprevious'}++;
                                }
                        }
                        # output ended in the middle of an entry: there is no
                        # line contents to show for it
                        last LINE unless defined $data;
                        my $short_rev = substr($full_rev, 0, 8);
                        my $author = $meta->{'author'};
                        my %date =
                                parse_date($meta->{'author-time'}, $meta->{'author-tz'});
                        my $date = $date{'iso-tz'};
                        # a header with <lines in group> starts a new group:
                        # switch to the next row color
                        if ($group_size) {
                                $current_color = ($current_color + 1) % $num_colors;
                        }
                        my $tr_class = $rev_color[$current_color];
                        $tr_class .= ' boundary' if (exists $meta->{'boundary'});
                        $tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
                        $tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
                        print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
                        # the commit cell is printed once per group and spans it
                        if ($group_size) {
                                print "<td class=\"sha1\"";
                                print " title=\"". esc_html($author) . ", $date\"";
                                print " rowspan=\"$group_size\"" if ($group_size > 1);
                                print ">";
                                print $cgi->a({-href => href(action=>"commit",
                                                             hash=>$full_rev,
                                                             file_name=>$file_name)},
                                              esc_html($short_rev));
                                if ($group_size >= 2) {
                                        my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
                                        if (@author_initials) {
                                                print "<br />" .
                                                      esc_html(join('', @author_initials));
                                                #           or join('.', ...)
                                        }
                                }
                                print "</td>\n";
                        }
                        # 'previous' <sha1 of parent commit> <filename at commit>
                        if (exists $meta->{'previous'} &&
                            $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
                                $meta->{'parent'} = $1;
                                $meta->{'file_parent'} = unquote($2);
                        }
                        # the line number links to the blame of the parent commit
                        # when one is known, else to the blamed commit itself
                        my $linenr_commit =
                                exists($meta->{'parent'}) ?
                                $meta->{'parent'} : $full_rev;
                        my $linenr_filename =
                                exists($meta->{'file_parent'}) ?
                                $meta->{'file_parent'} : unquote($meta->{'filename'});
                        my $blamed = href(action => 'blame',
                                          file_name => $linenr_filename,
                                          hash_base => $linenr_commit);
                        print "<td class=\"linenr\">";
                        print $cgi->a({ -href => "$blamed#l$orig_lineno",
                                        -class => "linenr" },
                                      esc_html($lineno));
                        print "</td>";
                        print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
                        print "</tr>\n";
                } # end while

        }

        # footer
        print "</tbody>\n".
              "</table>\n"; # class="blame"
        print "</div>\n";   # class="page_body"
        close $fd
                or print "Reading blob failed\n";

        git_footer_html();
}
6439
# 'blame' view: delegates to git_blame_common() without a format argument.
sub git_blame {
	return git_blame_common();
}
6443
# 'blame_incremental' view: delegates to git_blame_common(), asking for its
# 'incremental' format.
sub git_blame_incremental {
	return git_blame_common('incremental');
}
6447
# 'blame_data' view: delegates to git_blame_common(), asking for its
# 'data' format.
sub git_blame_data {
	return git_blame_common('data');
}
6451
# 'tags' view: page header and navigation (built around the hash returned
# by git_get_head_hash() for the current project), the tag list when there
# is at least one tag, then the page footer.
sub git_tags {
	my $head_id = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('', '', $head_id, undef, $head_id,
	                   format_ref_views('tags'));
	git_print_header_div('summary', $project);

	# the table is omitted altogether when the project has no tags
	my @tags = git_get_tags_list();
	git_tags_body(\@tags) if @tags;

	git_footer_html();
}
6464
# 'heads' view: page header and navigation (built around the hash returned
# by git_get_head_hash() for the current project), the list of heads when
# there is at least one, then the page footer.
sub git_heads {
	my $head_id = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('', '', $head_id, undef, $head_id,
	                   format_ref_views('heads'));
	git_print_header_div('summary', $project);

	# git_heads_body() also receives the HEAD hash
	my @heads = git_get_heads_list();
	git_heads_body(\@heads, $head_id) if @heads;

	git_footer_html();
}
6477
# used both for single remote view and for list of all the remotes
#
# The remote to show is read from the 'hash' input parameter; when that
# parameter is not defined, all remotes are listed.  The view is refused
# with a 403 error unless the 'remote_heads' feature is enabled.
sub git_remotes {
	unless (gitweb_check_feature('remote_heads')) {
		die_error(403, "Remote heads view is disabled");
	}

	my $head_id     = git_get_head_hash($project);
	my $remote_name = $input_params{'hash'};

	my $remotes = git_get_remotes_list($remote_name);
	defined $remotes
		or die_error(500, "Unable to get remote information");

	# an empty result means "unknown remote" or "no remotes at all"
	if (!%$remotes) {
		my $message = defined $remote_name
			? "Remote $remote_name not found"
			: "No remotes found";
		die_error(404, $message);
	}

	git_header_html(undef, undef, -action_extra => $remote_name);
	git_print_page_nav('', '', $head_id, undef, $head_id,
	                   format_ref_views($remote_name ? '' : 'remotes'));

	fill_remote_heads($remotes);
	if (defined $remote_name) {
		# single remote
		git_print_header_div('remotes', "$remote_name remote for $project");
		git_remote_block($remote_name, $remotes->{$remote_name},
		                 undef, $head_id);
	} else {
		# all the remotes
		git_print_header_div('summary', "$project remotes");
		git_remotes_body($remotes, undef, $head_id);
	}

	git_footer_html();
}
6510
# 'blob_plain' (aka 'raw') view: send the contents of a blob as-is.
#
# Arguments:
#   $type - optional content type hint; it is handed to blob_contenttype()
#           together with the file name (git_blob() passes the mimetype it
#           has already detected when it falls back to this view)
#
# The blob is identified by the global $hash.  When $hash is not defined it
# is looked up from $file_name within $hash_base, or within the commit
# returned by git_get_head_hash() when $hash_base is not set.
#
# Output: an HTTP header (content type, optional expiry, and a
# Content-Disposition with a "save as" file name) followed by the raw blob
# data.
sub git_blob_plain {
	my $type = shift;
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Open git-cat-file blob '$hash' failed");

	# content-type (can include charset)
	$type = blob_contenttype($fd, $file_name, $type);

	# "save as" filename, even when no $file_name is given
	my $save_as = "$hash";
	if (defined $file_name) {
		$save_as = $file_name;
	} elsif ($type =~ m/^text\//) {
		$save_as .= '.txt';
	}

	# With XSS prevention on, blobs of all types except a few known safe
	# ones are served with "Content-Disposition: attachment" to make sure
	# they don't run in our security domain.  For certain image types,
	# blob view writes an <img> tag referring to blob_plain view, and we
	# want to be sure not to break that by serving the image as an
	# attachment (though Firefox 3 doesn't seem to care).
	my $sandbox = $prevent_xss &&
		$type !~ m!^(?:text/[a-z]+|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

	# serve text/* as text/plain; the same goes for textual "*/*+xml"
	# types (e.g. image/svg+xml).  The subtype before "+xml" may be more
	# than one letter long, hence "[a-z]+" in the second pattern.
	if ($prevent_xss &&
	    ($type =~ m!^text/[a-z]+\b(.*)$! ||
	     ($type =~ m!^[a-z]+/[a-z]+\+xml\b(.*)$! && -T $fd))) {
		# $1 is whatever followed the media type (e.g. "; charset=...")
		my $rest = $1;
		$rest = defined $rest ? $rest : '';
		$type = "text/plain$rest";
	}

	# The file name goes into a quoted string in the header, so double
	# quotes and backslashes have to be backslash-escaped (same as is done
	# for the snapshot file name in git_snapshot()).
	$save_as =~ s/(["\\])/\\$1/g;

	print $cgi->header(
		-type => $type,
		-expires => $expires,
		-content_disposition =>
			($sandbox ? 'attachment' : 'inline')
			. '; filename="' . $save_as . '"');
	# slurp the blob and copy it out without any output encoding layer
	local $/ = undef;
	binmode STDOUT, ':raw';
	print <$fd>;
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
6572
# 'blob' view: show a blob as an HTML page.
#
# The blob is identified by the global $hash.  When $hash is not defined it
# is looked up from $file_name within $hash_base, or within the commit
# returned by git_get_head_hash() when $hash_base is not set.
#
# Depending on the mimetype reported by blob_mimetype():
#   - content that is neither text/* nor gif/png/jpeg and tests as binary
#     (-B) is handed over to git_blob_plain();
#   - image/* is shown via an <img> tag pointing at the 'blob_plain' view;
#   - everything else is printed line by line with line-number anchors,
#     optionally run through the highlighter first.
sub git_blob {
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	my $have_blame = gitweb_check_feature('blame');
	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Couldn't cat $file_name, $hash");
	my $mimetype = blob_mimetype($fd, $file_name);
	# use 'blob_plain' (aka 'raw') view for files that cannot be displayed
	if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
		close $fd;
		return git_blob_plain($mimetype);
	}
	# we can have blame only for text/* mimetype
	$have_blame &&= ($mimetype =~ m!^text/!);

	# when a syntax is recognized, $fd is replaced by the handle that
	# run_highlighter() returns
	my $highlight = gitweb_check_feature('highlight');
	my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
	$fd = run_highlighter($fd, $highlight, $syntax)
		if $syntax;

	git_header_html(undef, $expires);
	my $formats_nav = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		if (defined $file_name) {
			if ($have_blame) {
				$formats_nav .=
					$cgi->a({-href => href(action=>"blame", -replay=>1)},
					        "blame") .
					" | ";
			}
			$formats_nav .=
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history") .
				" | " .
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw") .
				" | " .
				$cgi->a({-href => href(action=>"blob",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		} else {
			$formats_nav .=
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw");
		}
		git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
		git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
	} else {
		# no usable commit: empty navigation bar, blob id as the title
		print "<div class=\"page_nav\">\n" .
		      "<br/><br/></div>\n" .
		      "<div class=\"title\">".esc_html($hash)."</div>\n";
	}
	git_print_page_path($file_name, "blob", $hash_base);
	print "<div class=\"page_body\">\n";
	if ($mimetype =~ m!^image/!) {
		print qq!<img type="!.esc_attr($mimetype).qq!"!;
		if ($file_name) {
			print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
		}
		# the URL is written into an attribute by hand, so it needs the
		# same attribute escaping as the other attributes of this tag
		print qq! src="! .
		      esc_attr(href(action=>"blob_plain", hash=>$hash,
		                    hash_base=>$hash_base, file_name=>$file_name)) .
		      qq!" />\n!;
	} else {
		my $nr;
		while (my $line = <$fd>) {
			chomp $line;
			$nr++;
			$line = untabify($line);
			# highlighter output is passed through sanitize(); plain
			# text is HTML-escaped
			printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
			       $nr, esc_attr(href(-replay => 1)), $nr, $nr,
			       $syntax ? sanitize($line) : esc_html($line, -nbsp=>1);
		}
	}
	close $fd
		or print "Reading blob failed.\n";
	print "</div>";
	git_footer_html();
}
6665
# 'tree' view: list the entries of a tree object as an HTML table.
#
# $hash_base defaults to "HEAD".  The tree is identified by the global
# $hash; when that is not defined it is looked up from $file_name within
# $hash_base, or $hash_base itself is used when there is no file name.
sub git_tree {
	$hash_base = "HEAD" unless defined $hash_base;
	unless (defined $hash) {
		$hash = defined $file_name
			? git_get_hash_by_path($hash_base, $file_name, "tree")
			: $hash_base;
	}
	defined $hash
		or die_error(404, "No such tree");

	my $show_sizes = gitweb_check_feature('show-sizes');
	my $have_blame = gitweb_check_feature('blame');

	# read the NUL-separated (-z) output of ls-tree, one record per entry
	my @entries;
	{
		local $/ = "\0";
		my @ls_tree = (git_cmd(), "ls-tree", '-z',
		               ($show_sizes ? '-l' : ()), @extra_options, $hash);
		open my $fd, "-|", @ls_tree
			or die_error(500, "Open git-ls-tree failed");
		chomp(@entries = <$fd>);
		close $fd
			or die_error(404, "Reading tree failed");
	}

	my $refs       = git_get_references();
	my $ref_marker = format_ref_marker($refs, $hash_base);
	git_header_html();

	my %co;
	if (defined $hash_base && (%co = parse_commit($hash_base))) {
		my @views_nav;
		if (defined $file_name) {
			push @views_nav,
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history"),
				$cgi->a({-href => href(action=>"tree",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		}
		my $snapshot_links = format_snapshot_links($hash);
		# FIXME: Should be available when we have no hash base as well.
		push @views_nav, $snapshot_links
			if defined $snapshot_links;

		git_print_page_nav('tree', '', $hash_base, undef, undef,
		                   join(' | ', @views_nav));
		git_print_header_div('commit',
		                     esc_html($co{'title'}) . $ref_marker,
		                     $hash_base);
	} else {
		# $hash_base did not parse as a commit: forget it, and show an
		# empty navigation bar with the tree id as the title
		undef $hash_base;
		print qq{<div class="page_nav">\n} .
		      qq{<br/><br/></div>\n} .
		      qq{<div class="title">} . esc_html($hash) . qq{</div>\n};
	}

	# directory prefix for the entries: the file name with a trailing slash
	my $basedir = '';
	if (defined $file_name) {
		$basedir = $file_name;
		$basedir .= '/'
			if $basedir ne '' && $basedir !~ m{/\z};
		git_print_page_path($file_name, 'tree', $hash_base);
	}

	print qq{<div class="page_body">\n};
	print qq{<table class="tree">\n};

	# rows alternate between the "dark" and "light" classes, dark first
	my $dark_row = 1;
	my $open_row = sub {
		my $class = $dark_row ? 'dark' : 'light';
		print qq{<tr class="$class">\n};
		$dark_row ^= 1;
	};

	# '..' (top directory) link if possible
	if (defined $hash_base &&
	    defined $file_name && $file_name =~ m![^/]+$!) {
		$open_row->();

		# strip the last path component; an empty (or otherwise false)
		# remainder is passed on as undef
		(my $up = $file_name) =~ s!/?[^/]+$!!;
		undef $up unless $up;

		# based on git_print_tree_entry
		print '<td class="mode">' . mode_str('040000') . "</td>\n";
		print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
		print '<td class="list">';
		print $cgi->a({-href => href(action=>"tree",
		                             hash_base=>$hash_base,
		                             file_name=>$up)},
		              "..");
		print "</td>\n";
		print "<td class=\"link\"></td>\n";

		print "</tr>\n";
	}

	foreach my $entry (@entries) {
		my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

		$open_row->();
		git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);
		print "</tr>\n";
	}

	print "</table>\n" .
	      "</div>";
	git_footer_html();
}
6775
# Build the base name of a snapshot: "<project>-<version>".
#
# Arguments:
#   $project - project path (e.g. path/to/project.git)
#   $hash    - revision the snapshot is made of (hex id or ref name)
#
# Returns the name; in list context the name is returned twice, as a
# two-element list.
sub snapshot_name {
	my ($project, $hash) = @_;

	# path/to/project.git  -> project
	# path/to/project/.git -> project
	my $name = to_utf8($project);
	$name =~ s{([^/])/*\.git$}{$1};
	$name = basename($name);
	# sanitize name
	$name =~ s/[[:cntrl:]]/?/g;

	my $ver = $hash;
	if ($hash =~ m{^[0-9a-fA-F]+$}) {
		# shorten SHA-1 hash, but only when it is longer than 7
		# characters and is a prefix of the full hash
		my $full_hash = git_get_full_hash($project, $hash);
		$ver = git_get_short_hash($project, $hash)
			if $full_hash =~ m{^$hash} && length($hash) > 7;
	} elsif ($hash =~ m{^refs/tags/(.*)$}) {
		# tags don't need shortened SHA-1 hash
		$ver = $1;
	} else {
		# branches and other need shortened SHA-1 hash
		$ver = $1
			if $hash =~ m{^refs/(?:heads|remotes)/(.*)$};
		$ver .= '-' . git_get_short_hash($project, $hash);
	}
	# in case of hierarchical branch names
	$ver =~ s{/}{.}g;

	# name = project-version_string
	$name = "$name-$ver";

	return ($name, $name) if wantarray;
	return $name;
}
6812
# 'snapshot' view: send an archive of the tree-ish in the global $hash.
#
# The archive format comes from the 'snapshot_format' input parameter and
# defaults to the first entry of @snapshot_fmts.  It has to be a key of
# %known_snapshot_formats, must not be marked 'disabled' there, and must be
# listed in @snapshot_fmts; otherwise a 400 or 403 error is produced.
#
# The archive is made by "git archive", piped through the format's
# 'compressor' command when it has one, and copied to the client.
sub git_snapshot {
	my $format = $input_params{'snapshot_format'};
	if (!@snapshot_fmts) {
		die_error(403, "Snapshots not allowed");
	}
	# default to first supported snapshot format
	$format ||= $snapshot_fmts[0];
	if ($format !~ m/^[a-z0-9]+$/) {
		die_error(400, "Invalid snapshot format parameter");
	} elsif (!exists($known_snapshot_formats{$format})) {
		die_error(400, "Unknown snapshot format");
	} elsif ($known_snapshot_formats{$format}{'disabled'}) {
		die_error(403, "Snapshot format not allowed");
	} elsif (!grep($_ eq $format, @snapshot_fmts)) {
		die_error(403, "Unsupported snapshot format");
	}

	# "^{}" asks for the type of the object after peeling tags
	my $type = git_get_type("$hash^{}");
	if (!$type) {
		die_error(404, 'Object does not exist');
	}  elsif ($type eq 'blob') {
		die_error(400, 'Object is not a tree-ish');
	}

	my ($name, $prefix) = snapshot_name($project, $hash);
	my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
	my $cmd = quote_command(
		git_cmd(), 'archive',
		"--format=$known_snapshot_formats{$format}{'format'}",
		"--prefix=$prefix/", $hash);
	if (exists $known_snapshot_formats{$format}{'compressor'}) {
		$cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
	}

	# Start the archiver before any header is printed: if the command
	# cannot be started, the error page must not come after a "200 OK"
	# header announcing an archive.
	open my $fd, "-|", $cmd
		or die_error(500, "Execute git-archive failed");

	# the file name is sent inside a quoted string
	$filename =~ s/(["\\])/\\$1/g;
	print $cgi->header(
		-type => $known_snapshot_formats{$format}{'type'},
		-content_disposition => 'inline; filename="' . $filename . '"',
		-status => '200 OK');

	# copy the archive in fixed-size chunks instead of reading all of it
	# into memory first
	binmode STDOUT, ':raw';
	my $chunk;
	while (read($fd, $chunk, 65536)) {
		print $chunk;
	}
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
6860
# Common implementation of the log-like views (git_log() uses it for 'log').
#
# Arguments (positional):
#   $fmt_name  - name of the view; passed to format_paging_nav() and
#                git_print_page_nav()
#   $body_subr - code reference that prints the list of commits; called as
#                $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
#                             $file_name, $file_hash, $ftype)
#   $base      - revision to list from; defaults to the hash returned by
#                git_get_head_hash()
#   $parent    - optional; when defined, "$parent..$base" is listed
#   $file_name - optional path; when defined it is passed to
#                parse_commits() together with "--full-history"
#   $file_hash - optional object id for $file_name; when missing it is
#                looked up in the listed commits
#
# The global $page (default 0) selects the page.  101 commits are requested
# per page while only entries 0..99 are handed to $body_subr, so the extra
# one tells whether a "next" link is needed.
sub git_log_generic {
	my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

	my $head = git_get_head_hash($project);
	if (!defined $base) {
		$base = $head;
	}
	if (!defined $page) {
		$page = 0;
	}
	my $refs = git_get_references();

	my $commit_hash = $base;
	if (defined $parent) {
		$commit_hash = "$parent..$base";
	}
	my @commitlist =
		parse_commits($commit_hash, 101, (100 * $page),
		              defined $file_name ? ($file_name, "--full-history") : ());

	my $ftype;
	if (!defined $file_hash && defined $file_name) {
		# some commits could have deleted file in question,
		# and not have it in tree, but one of them has to have it
		foreach my $commit (@commitlist) {
			$file_hash = git_get_hash_by_path($commit->{'id'}, $file_name);
			last if defined $file_hash;
		}
	}
	if (defined $file_hash) {
		$ftype = git_get_type($file_hash);
	}
	if (defined $file_name && !defined $ftype) {
		die_error(500, "Unknown type of object");
	}
	my %co;
	if (defined $file_name) {
		%co = parse_commit($base)
			or die_error(404, "Unknown commit object");
	}


	my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
	my $next_link = '';
	if ($#commitlist >= 100) {
		$next_link =
			$cgi->a({-href => href(-replay=>1, page=>$page+1),
			         -accesskey => "n", -title => "Alt-n"}, "next");
	}
	# Feature values are lists, so take the first element with a list
	# assignment; a plain scalar assignment would not reliably yield the
	# configured limit.
	my ($patch_max) = gitweb_get_feature('patches');
	if ($patch_max && !defined $file_name) {
		# a negative limit means "no limit"
		if ($patch_max < 0 || @commitlist <= $patch_max) {
			$paging_nav .= " &sdot; " .
				$cgi->a({-href => href(action=>"patches", -replay=>1)},
				        "patches");
		}
	}

	git_header_html();
	git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
	if (defined $file_name) {
		git_print_header_div('commit', esc_html($co{'title'}), $base);
	} else {
		git_print_header_div('summary', $project)
	}
	git_print_page_path($file_name, $ftype, $hash_base)
		if (defined $file_name);

	$body_subr->(\@commitlist, 0, 99, $refs, $next_link,
	             $file_name, $file_hash, $ftype);

	git_footer_html();
}
6934
# 'log' view: git_log_generic() with git_log_body() as the body printer,
# listing from the global $hash (optionally limited by $hash_parent).
sub git_log {
	return git_log_generic('log', \&git_log_body, $hash, $hash_parent);
}
6939
# 'commit' view: header table (authorship, commit id, tree, parents), the
# commit message, and the list of changed files for one commit.
#
# The commit is taken from the global $hash, falling back to $hash_base and
# then to "HEAD".
sub git_commit {
	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
		or die_error(404, "Unknown commit object");

	my $first_parent = $co{'parent'};
	my $parents      = $co{'parents'}; # listref

	# link to a commit, labelled with the first 7 characters of its id
	my $short_commit_link = sub {
		my ($id) = @_;
		$cgi->a({-href => href(action=>"commit",
		                       hash=>$id)},
		        esc_html(substr($id, 0, 7)));
	};

	# we need to prepare $formats_nav before any parameter munging
	my $formats_nav;
	if (!defined $first_parent) {
		# --root commitdiff
		$formats_nav = '(initial)';
	} elsif (@$parents == 1) {
		# single parent commit
		$formats_nav =
			'(parent: ' . $short_commit_link->($first_parent) . ')';
	} else {
		# merge commit
		$formats_nav =
			'(merge: ' .
			join(' ', map { $short_commit_link->($_) } @$parents) .
			')';
	}
	if (gitweb_check_feature('patches') && @$parents <= 1) {
		$formats_nav .= " | " .
			$cgi->a({-href => href(action=>"patch", -replay=>1)},
			        "patch");
	}

	# What to diff against: the single parent, "--root" for a commit
	# without parents, or '-c' for a merge.
	my $diff_base = defined $first_parent ? $first_parent : "--root";
	my @diff_cmd = (git_cmd(), "diff-tree", '-r', "--no-commit-id",
	                @diff_opts,
	                (@$parents <= 1 ? $diff_base : '-c'),
	                $hash, "--");
	open my $fd, "-|", @diff_cmd
		or die_error(500, "Open git-diff-tree failed");
	chomp(my @difftree = <$fd>);
	close $fd
		or die_error(404, "Reading git-diff-tree failed");

	# non-textual hash id's can be cached
	my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
	my $refs = git_get_references();
	my $ref_marker = format_ref_marker($refs, $co{'id'});

	git_header_html(undef, $expires);
	git_print_page_nav('commit', '',
	                   $hash, $co{'tree'}, $hash,
	                   $formats_nav);

	# the title links to the commitdiff, or to the tree when the commit
	# has no parent
	my $title = esc_html($co{'title'}) . $ref_marker;
	if (defined $co{'parent'}) {
		git_print_header_div('commitdiff', $title, $hash);
	} else {
		git_print_header_div('tree', $title, $co{'tree'}, $hash);
	}

	print qq{<div class="title_text">\n} .
	      qq{<table class="object_header">\n};
	git_print_authorship_rows(\%co);
	print qq{<tr><td>commit</td><td class="sha1">$co{'id'}</td></tr>\n};

	# tree row: tree id, "tree" link and (when available) snapshot links
	my @tree_view = (action=>"tree", hash=>$co{'tree'}, hash_base=>$hash);
	print qq{<tr><td>tree</td><td class="sha1">} .
	      $cgi->a({-href => href(@tree_view), class => "list"},
	              $co{'tree'}) .
	      qq{</td><td class="link">} .
	      $cgi->a({-href => href(@tree_view)}, "tree");
	my $snapshot_links = format_snapshot_links($hash);
	print " | " . $snapshot_links
		if defined $snapshot_links;
	print "</td></tr>\n";

	# one row per parent: parent id, "commit" link and "diff" link
	foreach my $parent_id (@$parents) {
		my @commit_view = (action=>"commit", hash=>$parent_id);
		print qq{<tr><td>parent</td><td class="sha1">} .
		      $cgi->a({-href => href(@commit_view), class => "list"},
		              $parent_id) .
		      qq{</td><td class="link">} .
		      $cgi->a({-href => href(@commit_view)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$hash,
		                             hash_parent=>$parent_id)},
		              "diff") .
		      "</td></tr>\n";
	}
	print "</table></div>\n";

	print qq{<div class="page_body">\n};
	git_print_log($co{'comment'});
	print "</div>\n";

	git_difftree_body(\@difftree, $hash, @$parents);

	git_footer_html();
}
7053
# 'object' view: find out the type of the requested object and redirect
# (302) to the view named after that type.
#
# The object is defined by the globals:
# - $hash or $hash_base alone
# - $hash_base and $file_name
# Anything else is a 400 error; an object that cannot be found is a 404.
sub git_object {
	my $type;

	# - hash or hash_base alone
	if ($hash || ($hash_base && !defined $file_name)) {
		my $object_id = $hash || $hash_base;

		# stderr of cat-file is discarded
		open my $fd, "-|", quote_command(
			git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
			or die_error(404, "Object does not exist");
		$type = <$fd>;
		close $fd
			or die_error(404, "Object does not exist");
		# no output at all: there is no type to chomp or to redirect to
		defined $type
			or die_error(404, "Object does not exist");
		chomp $type;

	# - hash_base and file_name
	} elsif ($hash_base && defined $file_name) {
		$file_name =~ s,/+$,,;

		system(git_cmd(), "cat-file", '-e', $hash_base) == 0
			or die_error(404, "Base object does not exist");

		# here errors should not happen
		open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
			or die_error(500, "Open git-ls-tree failed");
		my $line = <$fd>;
		close $fd;

		#'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa	panic.c'
		unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
			die_error(404, "File or directory for given base does not exist");
		}
		# type and id of the entry, as reported by ls-tree
		$type = $2;
		$hash = $3;
	} else {
		die_error(400, "Not enough information to find object");
	}

	# the object type doubles as the name of the action to redirect to
	print $cgi->redirect(-uri => href(action=>$type, -full=>1,
	                                  hash=>$hash, hash_base=>$hash_base,
	                                  file_name=>$file_name),
	                     -status => '302 Found');
}
7100
7101 sub git_blobdiff {
7102         my $format = shift || 'html';
7103         my $diff_style = $input_params{'diff_style'} || 'inline';
7104
7105         my $fd;
7106         my @difftree;
7107         my %diffinfo;
7108         my $expires;
7109
7110         # preparing $fd and %diffinfo for git_patchset_body
7111         # new style URI
7112         if (defined $hash_base && defined $hash_parent_base) {
7113                 if (defined $file_name) {
7114                         # read raw output
7115                         open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7116                                 $hash_parent_base, $hash_base,
7117                                 "--", (defined $file_parent ? $file_parent : ()), $file_name
7118                                 or die_error(500, "Open git-diff-tree failed");
7119                         @difftree = map { chomp; $_ } <$fd>;
7120                         close $fd
7121                                 or die_error(404, "Reading git-diff-tree failed");
7122                         @difftree
7123                                 or die_error(404, "Blob diff not found");
7124
7125                 } elsif (defined $hash &&
7126                          $hash =~ /[0-9a-fA-F]{40}/) {
7127                         # try to find filename from $hash
7128
7129                         # read filtered raw output
7130                         open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7131                                 $hash_parent_base, $hash_base, "--"
7132                                 or die_error(500, "Open git-diff-tree failed");
7133                         @difftree =
7134                                 # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
7135                                 # $hash == to_id
7136                                 grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} $hash/ }
7137                                 map { chomp; $_ } <$fd>;
7138                         close $fd
7139                                 or die_error(404, "Reading git-diff-tree failed");
7140                         @difftree
7141                                 or die_error(404, "Blob diff not found");
7142
7143                 } else {
7144                         die_error(400, "Missing one of the blob diff parameters");
7145                 }
7146
7147                 if (@difftree > 1) {
7148                         die_error(400, "Ambiguous blob diff specification");
7149                 }
7150
7151                 %diffinfo = parse_difftree_raw_line($difftree[0]);
7152                 $file_parent ||= $diffinfo{'from_file'} || $file_name;
7153                 $file_name   ||= $diffinfo{'to_file'};
7154
7155                 $hash_parent ||= $diffinfo{'from_id'};
7156                 $hash        ||= $diffinfo{'to_id'};
7157
7158                 # non-textual hash id's can be cached
7159                 if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
7160                     $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
7161                         $expires = '+1d';
7162                 }
7163
7164                 # open patch output
7165                 open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7166                         '-p', ($format eq 'html' ? "--full-index" : ()),
7167                         $hash_parent_base, $hash_base,
7168                         "--", (defined $file_parent ? $file_parent : ()), $file_name
7169                         or die_error(500, "Open git-diff-tree failed");
7170         }
7171
7172         # old/legacy style URI -- not generated anymore since 1.4.3.
7173         if (!%diffinfo) {
7174                 die_error('404 Not Found', "Missing one of the blob diff parameters")
7175         }
7176
7177         # header
7178         if ($format eq 'html') {
7179                 my $formats_nav =
7180                         $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
7181                                 "raw");
7182                 $formats_nav .= diff_style_nav($diff_style);
7183                 git_header_html(undef, $expires);
7184                 if (defined $hash_base && (my %co = parse_commit($hash_base))) {
7185                         git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
7186                         git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
7187                 } else {
7188                         print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
7189                         print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
7190                 }
7191                 if (defined $file_name) {
7192                         git_print_page_path($file_name, "blob", $hash_base);
7193                 } else {
7194                         print "<div class=\"page_path\"></div>\n";
7195                 }
7196
7197         } elsif ($format eq 'plain') {
7198                 print $cgi->header(
7199                         -type => 'text/plain',
7200                         -charset => 'utf-8',
7201                         -expires => $expires,
7202                         -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');
7203
7204                 print "X-Git-Url: " . $cgi->self_url() . "\n\n";
7205
7206         } else {
7207                 die_error(400, "Unknown blobdiff format");
7208         }
7209
7210         # patch
7211         if ($format eq 'html') {
7212                 print "<div class=\"page_body\">\n";
7213
7214                 git_patchset_body($fd, $diff_style,
7215                                   [ \%diffinfo ], $hash_base, $hash_parent_base);
7216                 close $fd;
7217
7218                 print "</div>\n"; # class="page_body"
7219                 git_footer_html();
7220
7221         } else {
7222                 while (my $line = <$fd>) {
7223                         $line =~ s!a/($hash|$hash_parent)!'a/'.esc_path($diffinfo{'from_file'})!eg;
7224                         $line =~ s!b/($hash|$hash_parent)!'b/'.esc_path($diffinfo{'to_file'})!eg;
7225
7226                         print $line;
7227
7228                         last if $line =~ m!^\+\+\+!;
7229                 }
7230                 local $/ = undef;
7231                 print <$fd>;
7232                 close $fd;
7233         }
7234 }
7235
# Convenience wrapper: runs git_blobdiff with the 'plain' format.
sub git_blobdiff_plain {
	return git_blobdiff('plain');
}
7239
# Build the diff-style switcher ("inline" / "side by side") as a fragment
# to be appended to navigation that already exists, which is why every
# entry is prefixed with " | " (result reads "| foo | bar", not "foo | bar").
#
# Parameters:
#   $diff_style  - currently selected style; a false value means 'inline'
#   $is_combined - when true, no switcher is produced
# Returns the fragment as a string ("" when $is_combined is true).  The
# currently selected style is shown as plain text, every other style as a
# link that replays the current request with a different diff_style.
sub diff_style_nav {
	my ($diff_style, $is_combined) = @_;

	return "" if ($is_combined);
	$diff_style ||= 'inline';

	# display order is fixed; labels are looked up by style name
	my @style_order = ('inline', 'sidebyside');
	my %label_of = (
		'inline'     => 'inline',
		'sidebyside' => 'side by side',
	);

	my @entries;
	foreach my $style (@style_order) {
		push @entries,
			$style eq $diff_style
				? $label_of{$style}
				: $cgi->a({-href => href(-replay=>1, diff_style => $style)},
				          $label_of{$style});
	}

	return join '', map { " | ".$_ } @entries;
}
7260
# Show the changes introduced by a commit, or the difference between two
# commits, in one of three output formats.
#
# Named parameters (flat key/value list):
#   -format => 'html' (default), 'plain' or 'patch'
#   -single => in 'patch' format without an explicit parent, emit exactly
#              one patch instead of up to the 'patches' feature limit
#
# Works on the request globals $hash, $hash_base and $hash_parent:
# $hash falls back to $hash_base and then to "HEAD"; for a commit with
# more than one parent and no requested parent, $hash_parent is set to
# '--cc' so that a combined diff is shown.
#
# Errors are reported through die_error: 403 when the patch view is
# disabled, 404 for an unknown commit, 400 for an unknown format and 500
# when the git command cannot be started.
sub git_commitdiff {
	my %params = @_;
	my $format = $params{-format} || 'html';
	my $diff_style = $input_params{'diff_style'} || 'inline';

	my ($patch_max) = gitweb_get_feature('patches');
	if ($format eq 'patch') {
		die_error(403, "Patch view not allowed") unless $patch_max;
	}

	$hash ||= $hash_base || "HEAD";
	my %co = parse_commit($hash)
	    or die_error(404, "Unknown commit object");

	# choose format for commitdiff for merge
	if (! defined $hash_parent && @{$co{'parents'}} > 1) {
		$hash_parent = '--cc';
	}
	# '-c' and '--cc' are diff-tree options asking for a combined diff
	# against the commit's own parents; they do not name a commit
	my $is_combined = defined $hash_parent &&
		($hash_parent eq '-c' || $hash_parent eq '--cc');

	# we need to prepare $formats_nav before almost any parameter munging
	my $formats_nav;
	if ($format eq 'html') {
		$formats_nav =
			$cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
			        "raw");
		if ($patch_max && @{$co{'parents'}} <= 1) {
			$formats_nav .= " | " .
				$cgi->a({-href => href(action=>"patch", -replay=>1)},
					"patch");
		}
		$formats_nav .= diff_style_nav($diff_style, @{$co{'parents'}} > 1);

		if (defined $hash_parent && !$is_combined) {
			# commitdiff with two commits given
			my $hash_parent_short = $hash_parent;
			if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
				$hash_parent_short = substr($hash_parent, 0, 7);
			}
			$formats_nav .=
				' (from';
			for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
				if ($co{'parents'}[$i] eq $hash_parent) {
					$formats_nav .= ' parent ' . ($i+1);
					last;
				}
			}
			$formats_nav .= ': ' .
				$cgi->a({-href => href(-replay=>1,
				                       hash=>$hash_parent, hash_base=>undef)},
				        esc_html($hash_parent_short)) .
				')';
		} elsif (!$co{'parent'}) {
			# --root commitdiff
			$formats_nav .= ' (initial)';
		} elsif (scalar @{$co{'parents'}} == 1) {
			# single parent commit
			$formats_nav .=
				' (parent: ' .
				$cgi->a({-href => href(-replay=>1,
				                       hash=>$co{'parent'}, hash_base=>undef)},
				        esc_html(substr($co{'parent'}, 0, 7))) .
				')';
		} else {
			# merge commit
			if ($hash_parent eq '--cc') {
				$formats_nav .= ' | ' .
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$hash, hash_parent=>'-c')},
					        'combined');
			} else { # $hash_parent eq '-c'
				$formats_nav .= ' | ' .
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$hash, hash_parent=>'--cc')},
					        'compact');
			}
			$formats_nav .=
				' (merge: ' .
				join(' ', map {
					$cgi->a({-href => href(-replay=>1,
					                       hash=>$_, hash_base=>undef)},
					        esc_html(substr($_, 0, 7)));
				} @{$co{'parents'}} ) .
				')';
		}
	}

	my $hash_parent_param = $hash_parent;
	if (!defined $hash_parent_param) {
		# --cc for multiple parents, --root for parentless
		$hash_parent_param =
			@{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
	}

	# read commitdiff
	my $fd;
	my @difftree;
	if ($format eq 'html') {
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			"--no-commit-id", "--patch-with-raw", "--full-index",
			$hash_parent_param, $hash, "--"
			or die_error(500, "Open git-diff-tree failed");

		while (my $line = <$fd>) {
			chomp $line;
			# empty line ends raw part of diff-tree output
			last unless $line;
			push @difftree, scalar parse_difftree_raw_line($line);
		}

	} elsif ($format eq 'plain') {
		open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
			'-p', $hash_parent_param, $hash, "--"
			or die_error(500, "Open git-diff-tree failed");
	} elsif ($format eq 'patch') {
		# For commit ranges, we limit the output to the number of
		# patches specified in the 'patches' feature.
		# For single commits, we limit the output to a single patch,
		# diverging from the git-format-patch default.
		my @commit_spec = ();
		# The combined-diff markers are not revisions and must never end
		# up in a "parent..commit" range; treat them as "no parent given".
		if ($hash_parent && !$is_combined) {
			if ($patch_max > 0) {
				push @commit_spec, "-$patch_max";
			}
			push @commit_spec, '-n', "$hash_parent..$hash";
		} else {
			if ($params{-single}) {
				push @commit_spec, '-1';
			} else {
				if ($patch_max > 0) {
					push @commit_spec, "-$patch_max";
				}
				push @commit_spec, "-n";
			}
			push @commit_spec, '--root', $hash;
		}
		open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
			'--encoding=utf8', '--stdout', @commit_spec
			or die_error(500, "Open git-format-patch failed");
	} else {
		die_error(400, "Unknown commitdiff format");
	}

	# non-textual hash id's can be cached; this holds only if the other
	# side of the diff is fixed as well, i.e. it is either implied by the
	# commit itself (no parent given, or a combined diff) or a full id
	my $expires;
	if ($hash =~ m/^[0-9a-fA-F]{40}$/ &&
	    (!defined $hash_parent || $is_combined ||
	     $hash_parent =~ m/^[0-9a-fA-F]{40}$/)) {
		$expires = "+1d";
	}

	# write commit message
	if ($format eq 'html') {
		my $refs = git_get_references();
		my $ref = format_ref_marker($refs, $co{'id'});

		git_header_html(undef, $expires);
		git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
		git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
		print "<div class=\"title_text\">\n" .
		      "<table class=\"object_header\">\n";
		git_print_authorship_rows(\%co);
		print "</table>".
		      "</div>\n";
		print "<div class=\"page_body\">\n";
		if (@{$co{'comment'}} > 1) {
			print "<div class=\"log\">\n";
			git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
			print "</div>\n"; # class="log"
		}

	} elsif ($format eq 'plain') {
		my $tagname = git_get_rev_name_tags($hash);
		my $filename = basename($project) . "-$hash.patch";

		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => 'inline; filename="' . "$filename" . '"');
		my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
		print "From: " . to_utf8($co{'author'}) . "\n";
		print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
		print "Subject: " . to_utf8($co{'title'}) . "\n";

		print "X-Git-Tag: $tagname\n" if $tagname;
		print "X-Git-Url: " . $cgi->self_url() . "\n\n";

		foreach my $line (@{$co{'comment'}}) {
			print to_utf8($line) . "\n";
		}
		print "---\n\n";
	} elsif ($format eq 'patch') {
		my $filename = basename($project) . "-$hash.patch";

		print $cgi->header(
			-type => 'text/plain',
			-charset => 'utf-8',
			-expires => $expires,
			-content_disposition => 'inline; filename="' . "$filename" . '"');
	}

	# write patch
	if ($format eq 'html') {
		my $use_parents = !defined $hash_parent || $is_combined;
		git_difftree_body(\@difftree, $hash,
		                  $use_parents ? @{$co{'parents'}} : $hash_parent);
		print "<br/>\n";

		git_patchset_body($fd, $diff_style,
		                  \@difftree, $hash,
		                  $use_parents ? @{$co{'parents'}} : $hash_parent);
		close $fd;
		print "</div>\n"; # class="page_body"
		git_footer_html();

	} elsif ($format eq 'plain') {
		# headers are already out, so a failure can only be reported inline
		local $/ = undef;
		print <$fd>;
		close $fd
			or print "Reading git-diff-tree failed\n";
	} elsif ($format eq 'patch') {
		local $/ = undef;
		print <$fd>;
		close $fd
			or print "Reading git-format-patch failed\n";
	}
}
7488
# Convenience wrapper: runs git_commitdiff with -format set to 'plain'.
sub git_commitdiff_plain {
	return git_commitdiff(-format => 'plain');
}
7492
# format-patch-style patches
#
# Single-patch variant: runs git_commitdiff in 'patch' format with the
# -single flag set.
sub git_patch {
	return git_commitdiff(
		-format => 'patch',
		-single => 1,
	);
}
7497
# Multi-patch variant: runs git_commitdiff in 'patch' format without the
# -single flag.
sub git_patches {
	return git_commitdiff(-format => 'patch');
}
7501
# History view: delegates to git_log_generic under the format name
# 'history', with git_history_body as the body callback and the current
# $hash_base, $hash_parent_base, $file_name and $hash request values.
sub git_history {
	return git_log_generic(
		'history', \&git_history_body,
		$hash_base, $hash_parent_base,
		$file_name, $hash,
	);
}
7507
# Entry point for searching: validates the request, then hands the parsed
# commit over to the routine matching $searchtype.
#
# Works on request globals: $searchtype (a false value means 'commit'),
# $searchtext (must be defined), $hash (undefined means the project's head
# hash) and $page (undefined means 0).
#
# Errors go through die_error: 403 for a disabled feature, 400 for missing
# search text or an unknown search type, 404 for an unknown commit.
sub git_search {
	$searchtype ||= 'commit';

	# check if appropriate features are enabled
	die_error(403, "Search is disabled")
		unless gitweb_check_feature('search');
	# pickaxe may take all resources of your box and run for several minutes
	# with every query - so decide by yourself how public you make this feature
	if ($searchtype eq 'pickaxe' && !gitweb_check_feature('pickaxe')) {
		die_error(403, "Pickaxe search is disabled");
	}
	# grep search might be potentially CPU-intensive, too
	if ($searchtype eq 'grep' && !gitweb_check_feature('grep')) {
		die_error(403, "Grep search is disabled");
	}

	die_error(400, "Text field is empty")
		unless defined $searchtext;

	$hash = git_get_head_hash($project)
		unless defined $hash;
	my %co = parse_commit($hash);
	%co
		or die_error(404, "Unknown commit object");
	$page = 0
		unless defined $page;

	# search type => routine doing the actual work
	my %search_sub_for = (
		'commit'    => \&git_search_message,
		'author'    => \&git_search_message,
		'committer' => \&git_search_message,
		'pickaxe'   => \&git_search_changes,
		'grep'      => \&git_search_files,
	);

	if (my $search_sub = $search_sub_for{$searchtype}) {
		$search_sub->(%co);
	} else {
		die_error(400, "Unknown search type");
	}
}
7552
# Print the static help page that describes the search types.
# The 'grep' and 'pickaxe' entries are printed only when
# gitweb_check_feature reports the feature of the same name as enabled.
sub git_search_help {
	git_header_html();
	git_print_page_nav('','', $hash,$hash,$hash);

	# general explanation, opening of the definition list, 'commit' entry
	print <<HELP_INTRO;
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

	if (gitweb_check_feature('grep')) {
		print <<HELP_GREP;
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
	}

	print <<HELP_PEOPLE;
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

	if (gitweb_check_feature('pickaxe')) {
		print <<HELP_PICKAXE;
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
	}

	print "</dl>\n";
	git_footer_html();
}
7596
# Shortlog view: delegates to git_log_generic under the format name
# 'shortlog', with git_shortlog_body as the body callback and the current
# $hash and $hash_parent request values.
sub git_shortlog {
	return git_log_generic(
		'shortlog', \&git_shortlog_body,
		$hash, $hash_parent,
	);
}
7601
7602 ## ......................................................................
7603 ## feeds (RSS, Atom; OPML)
7604
7605 sub git_feed {
7606         my $format = shift || 'atom';
7607         my $have_blame = gitweb_check_feature('blame');
7608
7609         # Atom: http://www.atomenabled.org/developers/syndication/
7610         # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
7611         if ($format ne 'rss' && $format ne 'atom') {
7612                 die_error(400, "Unknown web feed format");
7613         }
7614
7615         # log/feed of current (HEAD) branch, log of given branch, history of file/directory
7616         my $head = $hash || 'HEAD';
7617         my @commitlist = parse_commits($head, 150, 0, $file_name);
7618
7619         my %latest_commit;
7620         my %latest_date;
7621         my $content_type = "application/$format+xml";
7622         if (defined $cgi->http('HTTP_ACCEPT') &&
7623                  $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
7624                 # browser (feed reader) prefers text/xml
7625                 $content_type = 'text/xml';
7626         }
7627         if (defined($commitlist[0])) {
7628                 %latest_commit = %{$commitlist[0]};
7629                 my $latest_epoch = $latest_commit{'committer_epoch'};
7630                 %latest_date   = parse_date($latest_epoch, $latest_commit{'comitter_tz'});
7631                 my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
7632                 if (defined $if_modified) {
7633                         my $since;
7634                         if (eval { require HTTP::Date; 1; }) {
7635                                 $since = HTTP::Date::str2time($if_modified);
7636                         } elsif (eval { require Time::ParseDate; 1; }) {
7637                                 $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
7638                         }
7639                         if (defined $since && $latest_epoch <= $since) {
7640                                 print $cgi->header(
7641                                         -type => $content_type,
7642                                         -charset => 'utf-8',
7643                                         -last_modified => $latest_date{'rfc2822'},
7644                                         -status => '304 Not Modified');
7645                                 return;
7646                         }
7647                 }
7648                 print $cgi->header(
7649                         -type => $content_type,
7650                         -charset => 'utf-8',
7651                         -last_modified => $latest_date{'rfc2822'});
7652         } else {
7653                 print $cgi->header(
7654                         -type => $content_type,
7655                         -charset => 'utf-8');
7656         }
7657
7658         # Optimization: skip generating the body if client asks only
7659         # for Last-Modified date.
7660         return if ($cgi->request_method() eq 'HEAD');
7661
7662         # header variables
7663         my $title = "$site_name - $project/$action";
7664         my $feed_type = 'log';
7665         if (defined $hash) {
7666                 $title .= " - '$hash'";
7667                 $feed_type = 'branch log';
7668                 if (defined $file_name) {
7669                         $title .= " :: $file_name";
7670                         $feed_type = 'history';
7671                 }
7672         } elsif (defined $file_name) {
7673                 $title .= " - $file_name";
7674                 $feed_type = 'history';
7675         }
7676         $title .= " $feed_type";
7677         my $descr = git_get_project_description($project);
7678         if (defined $descr) {
7679                 $descr = esc_html($descr);
7680         } else {
7681                 $descr = "$project " .
7682                          ($format eq 'rss' ? 'RSS' : 'Atom') .
7683                          " feed";
7684         }
7685         my $owner = git_get_project_owner($project);
7686         $owner = esc_html($owner);
7687
7688         #header
7689         my $alt_url;
7690         if (defined $file_name) {
7691                 $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
7692         } elsif (defined $hash) {
7693                 $alt_url = href(-full=>1, action=>"log", hash=>$hash);
7694         } else {
7695                 $alt_url = href(-full=>1, action=>"summary");
7696         }
7697         print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
7698         if ($format eq 'rss') {
7699                 print <<XML;
7700 <rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
7701 <channel>
7702 XML
7703                 print "<title>$title</title>\n" .
7704                       "<link>$alt_url</link>\n" .
7705                       "<description>$descr</description>\n" .
7706                       "<language>en</language>\n" .
7707                       # project owner is responsible for 'editorial' content
7708                       "<managingEditor>$owner</managingEditor>\n";
7709                 if (defined $logo || defined $favicon) {
7710                         # prefer the logo to the favicon, since RSS
7711                         # doesn't allow both
7712                         my $img = esc_url($logo || $favicon);
7713                         print "<image>\n" .
7714                               "<url>$img</url>\n" .
7715                               "<title>$title</title>\n" .
7716                               "<link>$alt_url</link>\n" .
7717                               "</image>\n";
7718                 }
7719                 if (%latest_date) {
7720                         print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
7721                         print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
7722                 }
7723                 print "<generator>gitweb v.$version/$git_version</generator>\n";
7724         } elsif ($format eq 'atom') {
7725                 print <<XML;
7726 <feed xmlns="http://www.w3.org/2005/Atom">
7727 XML
7728                 print "<title>$title</title>\n" .
7729                       "<subtitle>$descr</subtitle>\n" .
7730                       '<link rel="alternate" type="text/html" href="' .
7731                       $alt_url . '" />' . "\n" .
7732                       '<link rel="self" type="' . $content_type . '" href="' .
7733                       $cgi->self_url() . '" />' . "\n" .
7734                       "<id>" . href(-full=>1) . "</id>\n" .
7735                       # use project owner for feed author
7736                       "<author><name>$owner</name></author>\n";
7737                 if (defined $favicon) {
7738                         print "<icon>" . esc_url($favicon) . "</icon>\n";
7739                 }
7740                 if (defined $logo) {
7741                         # not twice as wide as tall: 72 x 27 pixels
7742                         print "<logo>" . esc_url($logo) . "</logo>\n";
7743                 }
7744                 if (! %latest_date) {
7745                         # dummy date to keep the feed valid until commits trickle in:
7746                         print "<updated>1970-01-01T00:00:00Z</updated>\n";
7747                 } else {
7748                         print "<updated>$latest_date{'iso-8601'}</updated>\n";
7749                 }
7750                 print "<generator version='$version/$git_version'>gitweb</generator>\n";
7751         }
7752
7753         # contents
7754         for (my $i = 0; $i <= $#commitlist; $i++) {
7755                 my %co = %{$commitlist[$i]};
7756                 my $commit = $co{'id'};
7757                 # we read 150, we always show 30 and the ones more recent than 48 hours
7758                 if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
7759                         last;
7760                 }
7761                 my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});
7762
7763                 # get list of changed files
7764                 open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
7765                         $co{'parent'} || "--root",
7766                         $co{'id'}, "--", (defined $file_name ? $file_name : ())
7767                         or next;
7768                 my @difftree = map { chomp; $_ } <$fd>;
7769                 close $fd
7770                         or next;
7771
7772                 # print element (entry, item)
7773                 my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
7774                 if ($format eq 'rss') {
7775                         print "<item>\n" .
7776                               "<title>" . esc_html($co{'title'}) . "</title>\n" .
7777                               "<author>" . esc_html($co{'author'}) . "</author>\n" .
7778                               "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
7779                               "<guid isPermaLink=\"true\">$co_url</guid>\n" .
7780                               "<link>$co_url</link>\n" .
7781                               "<description>" . esc_html($co{'title'}) . "</description>\n" .
7782                               "<content:encoded>" .
7783                               "<![CDATA[\n";
7784                 } elsif ($format eq 'atom') {
7785                         print "<entry>\n" .
7786                               "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
7787                               "<updated>$cd{'iso-8601'}</updated>\n" .
7788                               "<author>\n" .
7789                               "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
7790                         if ($co{'author_email'}) {
7791                                 print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
7792                         }
7793                         print "</author>\n" .
7794                               # use committer for contributor
7795                               "<contributor>\n" .
7796                               "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
7797                         if ($co{'committer_email'}) {
7798                                 print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
7799                         }
7800                         print "</contributor>\n" .
7801                               "<published>$cd{'iso-8601'}</published>\n" .
7802                               "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
7803                               "<id>$co_url</id>\n" .
7804                               "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
7805                               "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
7806                 }
7807                 my $comment = $co{'comment'};
7808                 print "<pre>\n";
7809                 foreach my $line (@$comment) {
7810                         $line = esc_html($line);
7811                         print "$line\n";
7812                 }
7813                 print "</pre><ul>\n";
7814                 foreach my $difftree_line (@difftree) {
7815                         my %difftree = parse_difftree_raw_line($difftree_line);
7816                         next if !$difftree{'from_id'};
7817
7818                         my $file = $difftree{'file'} || $difftree{'to_file'};
7819
7820                         print "<li>" .
7821                               "[" .
7822                               $cgi->a({-href => href(-full=>1, action=>"blobdiff",
7823                                                      hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
7824                                                      hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
7825                                                      file_name=>$file, file_parent=>$difftree{'from_file'}),
7826                                       -title => "diff"}, 'D');
7827                         if ($have_blame) {
7828                                 print $cgi->a({-href => href(-full=>1, action=>"blame",
7829                                                              file_name=>$file, hash_base=>$commit),
7830                                               -title => "blame"}, 'B');
7831                         }
7832                         # if this is not a feed of a file history
7833                         if (!defined $file_name || $file_name ne $file) {
7834                                 print $cgi->a({-href => href(-full=>1, action=>"history",
7835                                                              file_name=>$file, hash=>$commit),
7836                                               -title => "history"}, 'H');
7837                         }
7838                         $file = esc_path($file);
7839                         print "] ".
7840                               "$file</li>\n";
7841                 }
7842                 if ($format eq 'rss') {
7843                         print "</ul>]]>\n" .
7844                               "</content:encoded>\n" .
7845                               "</item>\n";
7846                 } elsif ($format eq 'atom') {
7847                         print "</ul>\n</div>\n" .
7848                               "</content>\n" .
7849                               "</entry>\n";
7850                 }
7851         }
7852
7853         # end of feed
7854         if ($format eq 'rss') {
7855                 print "</channel>\n</rss>\n";
7856         } elsif ($format eq 'atom') {
7857                 print "</feed>\n";
7858         }
7859 }
7860
# Action handler for 'rss': delegates to git_feed(), asking for RSS output.
sub git_rss {
        return git_feed('rss');
}
7864
# Action handler for 'atom': delegates to git_feed(), asking for Atom output.
sub git_atom {
        return git_feed('atom');
}
7868
# Print an OPML 1.0 document containing one <outline> element per project,
# each pointing at that project's RSS feed and summary page.
#
# Calls die_error() with a 404 when the projects list is empty.  Projects
# for which no HEAD hash can be obtained, or whose HEAD commit does not
# parse, are left out of the listing.
sub git_opml {
        my @projects = git_get_projects_list();
        die_error(404, "No projects found") unless @projects;

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        my $feed_title = esc_html($site_name);
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$feed_title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $entry (@projects) {
                my %project = %{$entry};
                my $proj_path = $project{'path'};

                my $head_hash = git_get_head_hash($proj_path);
                next unless defined $head_hash;

                # parse_commit() is called with a hash only, so the global
                # $git_dir is pointed at this project before calling it.
                $git_dir = "$projectroot/$proj_path";
                my %head_commit = parse_commit($head_hash);
                next unless %head_commit;

                # The shortened, HTML-escaped path serves as both text and title.
                my $label    = esc_html(chop_str($proj_path, 25, 5));
                my $rss_url  = href(project => $proj_path, action => 'rss',     -full => 1);
                my $html_url = href(project => $proj_path, action => 'summary', -full => 1);
                print qq{<outline type="rss" text="$label" title="$label" xmlUrl="$rss_url" htmlUrl="$html_url"/>\n};
        }

        print <<XML;
</outline>
</body>
</opml>
XML
}