gitweb: Refactor git_header_html
[git] / gitweb / gitweb.perl
1 #!/usr/bin/perl
2
3 # gitweb - simple web interface to track changes in git repositories
4 #
5 # (C) 2005-2006, Kay Sievers <kay.sievers@vrfy.org>
6 # (C) 2005, Christian Gierke
7 #
8 # This program is licensed under the GPLv2
9
10 use 5.008;
11 use strict;
12 use warnings;
13 use CGI qw(:standard :escapeHTML -nosticky);
14 use CGI::Util qw(unescape);
15 use CGI::Carp qw(fatalsToBrowser set_message);
16 use Encode;
17 use Fcntl ':mode';
18 use File::Find qw();
19 use File::Basename qw(basename);
20 use Time::HiRes qw(gettimeofday tv_interval);
21 binmode STDOUT, ':utf8'; # everything printed to STDOUT goes through the :utf8 layer
22
23 our $t0 = [ gettimeofday() ]; # timestamp taken when the script starts
24 our $number_of_git_cmds = 0; # incremented by code that runs git (e.g. evaluate_git_version)
25
26 BEGIN {
27         CGI->compile() if $ENV{'MOD_PERL'}; # precompile CGI.pm methods when MOD_PERL is set
28 }
29
30 our $version = "++GIT_VERSION++"; # placeholder; presumably substituted at build time -- confirm
31
# URL-related globals; all of them are (re)assigned by evaluate_uri().
our ($my_url, $my_uri, $base_url, $path_info, $home_link);

# Compute $my_url, $my_uri, $base_url, $path_info and $home_link from the
# global $cgi object and the PATH_INFO / SCRIPT_NAME environment variables.
sub evaluate_uri {
        our $cgi;

        our $my_url = $cgi->url();
        our $my_uri = $cgi->url(-absolute => 1);

        # Base URL for relative URLs in gitweb ($logo, $favicon, ...);
        # it is needed and used only for URLs with nonempty PATH_INFO.
        our $base_url = $my_url;

        # When the script serves as DirectoryIndex, the URL lacks the script
        # file name and $cgi->url() fails to strip PATH_INFO, so it is
        # stripped here by hand.  $path_info is global because it is also
        # used later on.
        #
        # In that DirectoryIndex case $my_url is not the full script URL.
        # That is desirable for generated links (they keep implying the
        # script name when the request did not spell it out), but it makes
        # $my_url unusable as a base URL.  Hence: whenever PATH_INFO had to
        # be stripped from both URLs (and SCRIPT_NAME is known), the base
        # URL is rebuilt explicitly.
        our $path_info = $ENV{"PATH_INFO"};
        my $stripped_both = $path_info
                && $my_url =~ s,\Q$path_info\E$,,
                && $my_uri =~ s,\Q$path_info\E$,,;
        if ($stripped_both && defined $ENV{'SCRIPT_NAME'}) {
                $base_url = $cgi->url(-base => 1) . $ENV{'SCRIPT_NAME'};
        }

        # target of the home link on top of all pages
        our $home_link = $my_uri ? $my_uri : "/";
}
67
68 # core git executable to use
69 # this can just be "git" if your webserver has a sensible PATH
70 our $GIT = "++GIT_BINDIR++/git";
71
72 # absolute fs-path which will be prepended to the project path
73 #our $projectroot = "/pub/scm";
74 our $projectroot = "++GITWEB_PROJECTROOT++";
75
76 # filesystem traversal depth limit used when getting the project list;
77 # the number is relative to the projectroot
78 our $project_maxdepth = "++GITWEB_PROJECT_MAXDEPTH++";
79
80 # string of the home link on top of all pages
81 our $home_link_str = "++GITWEB_HOME_LINK_STR++";
82
83 # name of your site or organization to appear in page titles
84 # replace this with something more descriptive for clearer bookmarks
85 our $site_name = "++GITWEB_SITENAME++"
86                  || ($ENV{'SERVER_NAME'} || "Untitled") . " Git";
87
88 # filename of html text to include at top of each page
89 our $site_header = "++GITWEB_SITE_HEADER++";
90 # html text to include at home page
91 our $home_text = "++GITWEB_HOMETEXT++";
92 # filename of html text to include at bottom of each page
93 our $site_footer = "++GITWEB_SITE_FOOTER++";
94
95 # URI of stylesheets
96 our @stylesheets = ("++GITWEB_CSS++");
97 # URI of a single stylesheet, which can be overridden in GITWEB_CONFIG.
98 our $stylesheet = undef;
99 # URI of GIT logo (72x27 size)
100 our $logo = "++GITWEB_LOGO++";
101 # URI of GIT favicon, assumed to be image/png type
102 our $favicon = "++GITWEB_FAVICON++";
103 # URI of gitweb.js (JavaScript code for gitweb)
104 our $javascript = "++GITWEB_JS++";
105
106 # URI and label (title) of GIT logo link
107 #our $logo_url = "http://www.kernel.org/pub/software/scm/git/docs/";
108 #our $logo_label = "git documentation";
109 our $logo_url = "http://git-scm.com/";
110 our $logo_label = "git homepage";
111
112 # source of projects list
113 our $projects_list = "++GITWEB_LIST++";
114
115 # the width (in characters) of the projects list "Description" column
116 our $projects_list_description_width = 25;
117
118 # group projects by category on the projects list
119 # (enabled if this variable evaluates to true)
120 our $projects_list_group_categories = 0;
121
122 # default category if none specified
123 # (leave the empty string for no category)
124 our $project_list_default_category = "";
125
126 # default order of projects list
127 # valid values are none, project, descr, owner, and age
128 our $default_projects_order = "project";
129
130 # show repository only if this file exists
131 # (only effective if this variable evaluates to true)
132 our $export_ok = "++GITWEB_EXPORT_OK++";
133
134 # show repository only if this subroutine returns true
135 # when given the path to the project, for example:
136 #    sub { return -e "$_[0]/git-daemon-export-ok"; }
137 our $export_auth_hook = undef;
138
139 # only allow viewing of repositories also shown on the overview page
140 our $strict_export = "++GITWEB_STRICT_EXPORT++";
141
142 # list of git base URLs used for URL to where fetch project from,
143 # i.e. full URL is "$git_base_url/$project"
144 our @git_base_url_list = grep { $_ ne '' } ("++GITWEB_BASE_URL++");
145
146 # default blob_plain mimetype and default charset for text/plain blob
147 our $default_blob_plain_mimetype = 'text/plain';
148 our $default_text_plain_charset  = undef;
149
150 # file to use for guessing MIME types before trying /etc/mime.types
151 # (relative to the current git repository)
152 our $mimetypes_file = undef;
153
154 # assume this charset if line contains non-UTF-8 characters;
155 # it should be valid encoding (see Encode::Supported(3pm) for list),
156 # for which encoding all byte sequences are valid, for example
157 # 'iso-8859-1' aka 'latin1' (it is decoded without checking, so it
158 # could be even 'utf-8' for the old behavior)
159 our $fallback_encoding = 'latin1';
160
161 # rename detection options for git-diff and git-diff-tree
162 # - default is '-M', with the cost proportional to
163 #   (number of removed files) * (number of new files).
164 # - more costly is '-C' (which implies '-M'), with the cost proportional to
165 #   (number of changed files + number of removed files) * (number of new files)
166 # - even more costly is '-C', '--find-copies-harder' with cost
167 #   (number of files in the original tree) * (number of new files)
168 # - one might want to include '-B' option, e.g. '-B', '-M'
169 our @diff_opts = ('-M'); # taken from git_commit
170
171 # Disables features that would allow repository owners to inject script into
172 # the gitweb domain.
173 our $prevent_xss = 0;
174
175 # Path to the highlight executable to use (must be the one from
176 # http://www.andre-simon.de due to assumptions about parameters and output).
177 # Useful if highlight is not installed on your webserver's PATH.
178 # [Default: highlight]
179 our $highlight_bin = "++HIGHLIGHT_BIN++";
180
181 # information about snapshot formats that gitweb is capable of serving
182 our %known_snapshot_formats = (
183         # name => {
184         #       'display' => display name,
185         #       'type' => mime type,
186         #       'suffix' => filename suffix,
187         #       'format' => --format for git-archive,
188         #       'compressor' => [compressor command and arguments]
189         #                       (array reference, optional)
190         #       'disabled' => boolean (optional)}
191         #
192         'tgz' => {
193                 'display' => 'tar.gz',
194                 'type' => 'application/x-gzip',
195                 'suffix' => '.tar.gz',
196                 'format' => 'tar',
197                 'compressor' => ['gzip', '-n']},
198
199         'tbz2' => {
200                 'display' => 'tar.bz2',
201                 'type' => 'application/x-bzip2',
202                 'suffix' => '.tar.bz2',
203                 'format' => 'tar',
204                 'compressor' => ['bzip2']},
205
206         'txz' => {
207                 'display' => 'tar.xz',
208                 'type' => 'application/x-xz',
209                 'suffix' => '.tar.xz',
210                 'format' => 'tar',
211                 'compressor' => ['xz'],
212                 'disabled' => 1}, # formats flagged 'disabled' are dropped by filter_snapshot_fmts()
213
214         'zip' => {
215                 'display' => 'zip',
216                 'type' => 'application/x-zip',
217                 'suffix' => '.zip',
218                 'format' => 'zip'},
219 );
220
221 # Aliases so we understand old gitweb.snapshot values in repository
222 # configuration.
223 our %known_snapshot_format_aliases = (
224         'gzip'  => 'tgz',
225         'bzip2' => 'tbz2',
226         'xz'    => 'txz',
227
228         # backward compatibility: legacy gitweb config support;
229         # names mapped to undef are dropped by filter_snapshot_fmts()
230         'x-gzip' => undef, 'gz' => undef,
231         'x-bzip2' => undef, 'bz2' => undef,
232         'x-zip' => undef, '' => undef,
232 );
233
234 # Pixel sizes for icons and avatars. If the default font sizes or lineheights
235 # are changed, it may be appropriate to change these values too via
236 # $GITWEB_CONFIG.
237 our %avatar_size = (
238         'default' => 16,
239         'double'  => 32
240 );
241
242 # Used to set the maximum load that we will still respond to gitweb queries.
243 # If the server load exceeds this value then return "503 server busy" error.
244 # If gitweb cannot determine the server load, it is taken to be 0.
245 # Leave it undefined (or set to 'undef') to turn off load checking.
246 our $maxload = 300;
247
248 # configuration for 'highlight' (http://www.andre-simon.de/)
249 # match by basename
250 our %highlight_basename = (
251         #'Program' => 'py',
252         #'Library' => 'py',
253         'SConstruct' => 'py', # SCons equivalent of Makefile
254         'Makefile' => 'make',
255 );
256 # match by extension
257 our %highlight_ext = (
258         # main extensions, defining name of syntax (each maps to itself);
259         # see files in /usr/share/highlight/langDefs/ directory
260         map { $_ => $_ }
261                 qw(py c cpp rb java css php sh pl js tex bib xml awk bat ini spec tcl sql make),
262         # alternate extensions, see /etc/highlight/filetypes.conf
263         'h' => 'c',
264         map { $_ => 'sh'  } qw(bash zsh ksh),
265         map { $_ => 'cpp' } qw(cxx c++ cc),
266         map { $_ => 'php' } qw(php3 php4 php5 phps),
267         map { $_ => 'pl'  } qw(perl pm), # perhaps also 'cgi'
268         map { $_ => 'make'} qw(mak mk),
269         map { $_ => 'xml' } qw(xhtml html htm),
270 );
271
272 # You define site-wide feature defaults here; override them with
273 # $GITWEB_CONFIG as necessary.
274 our %feature = (
275         # feature => {
276         #       'sub' => feature-sub (subroutine),
277         #       'override' => allow-override (boolean),
278         #       'default' => [ default options...] (array reference)}
279         #
280         # if feature is overridable (it means that allow-override has true value),
281         # then feature-sub will be called with default options as parameters;
282         # return value of feature-sub indicates if to enable specified feature
283         #
284         # if there is no 'sub' key (no feature-sub), then feature cannot be
285         # overridden
286         #
287         # use gitweb_get_feature(<feature>) to retrieve the <feature> value
288         # (an array) or gitweb_check_feature(<feature>) to check if <feature>
289         # is enabled
290
291         # Enable the 'blame' blob view, showing the last commit that modified
292         # each line in the file. This can be very CPU-intensive.
293
294         # To enable system wide have in $GITWEB_CONFIG
295         # $feature{'blame'}{'default'} = [1];
296         # To have project specific config enable override in $GITWEB_CONFIG
297         # $feature{'blame'}{'override'} = 1;
298         # and in project config gitweb.blame = 0|1;
299         'blame' => {
300                 'sub' => sub { feature_bool('blame', @_) },
301                 'override' => 0,
302                 'default' => [0]},
303
304         # Enable the 'snapshot' link, providing a compressed archive of any
305         # tree. This can potentially generate high traffic if you have a large
306         # project.
307
308         # Value is a list of formats defined in %known_snapshot_formats that
309         # you wish to offer.
310         # To disable system wide have in $GITWEB_CONFIG
311         # $feature{'snapshot'}{'default'} = [];
312         # To have project specific config enable override in $GITWEB_CONFIG
313         # $feature{'snapshot'}{'override'} = 1;
314         # and in project config, a comma-separated list of formats or "none"
315         # to disable.  Example: gitweb.snapshot = tbz2,zip;
316         'snapshot' => {
317                 'sub' => \&feature_snapshot,
318                 'override' => 0,
319                 'default' => ['tgz']},
320
321         # Enable text search, which will list the commits which match author,
322         # committer or commit text to a given string.  Enabled by default.
323         # Project specific override is not supported.
324         'search' => {
325                 'override' => 0,
326                 'default' => [1]},
327
328         # Enable grep search, which will list the files in currently selected
329         # tree containing the given string. Enabled by default. This can be
330         # potentially CPU-intensive, of course.
331         # Note that you need to have 'search' feature enabled too.
332
333         # To enable system wide have in $GITWEB_CONFIG
334         # $feature{'grep'}{'default'} = [1];
335         # To have project specific config enable override in $GITWEB_CONFIG
336         # $feature{'grep'}{'override'} = 1;
337         # and in project config gitweb.grep = 0|1;
338         'grep' => {
339                 'sub' => sub { feature_bool('grep', @_) },
340                 'override' => 0,
341                 'default' => [1]},
342
343         # Enable the pickaxe search, which will list the commits that modified
344         # a given string in a file. This can be a practical and much faster
345         # alternative to 'blame', but still potentially CPU-intensive.
346         # Note that you need to have 'search' feature enabled too.
347
348         # To enable system wide have in $GITWEB_CONFIG
349         # $feature{'pickaxe'}{'default'} = [1];
350         # To have project specific config enable override in $GITWEB_CONFIG
351         # $feature{'pickaxe'}{'override'} = 1;
352         # and in project config gitweb.pickaxe = 0|1;
353         'pickaxe' => {
354                 'sub' => sub { feature_bool('pickaxe', @_) },
355                 'override' => 0,
356                 'default' => [1]},
357
358         # Enable showing size of blobs in a 'tree' view, in a separate
359         # column, similar to what 'ls -l' does.  This costs a bit of IO.
360
361         # To disable system wide have in $GITWEB_CONFIG
362         # $feature{'show-sizes'}{'default'} = [0];
363         # To have project specific config enable override in $GITWEB_CONFIG
364         # $feature{'show-sizes'}{'override'} = 1;
365         # and in project config gitweb.showsizes = 0|1;
366         'show-sizes' => {
367                 'sub' => sub { feature_bool('showsizes', @_) },
368                 'override' => 0,
369                 'default' => [1]},
370
371         # Make gitweb use an alternative format of the URLs which can be
372         # more readable and natural-looking: project name is embedded
373         # directly in the path and the query string contains other
374         # auxiliary information. All gitweb installations recognize
375         # URL in either format; this configures in which formats gitweb
376         # generates links.
377
378         # To enable system wide have in $GITWEB_CONFIG
379         # $feature{'pathinfo'}{'default'} = [1];
380         # Project specific override is not supported.
381
382         # Note that you will need to change the default location of CSS,
383         # favicon, logo and possibly other files to an absolute URL. Also,
384         # if gitweb.cgi serves as your indexfile, you will need to force
385         # $my_uri to contain the script name in your $GITWEB_CONFIG.
386         'pathinfo' => {
387                 'override' => 0,
388                 'default' => [0]},
389
390         # Make gitweb consider projects in project root subdirectories
391         # to be forks of existing projects. Given project $projname.git,
392         # projects matching $projname/*.git will not be shown in the main
393         # projects list, instead a '+' mark will be added to $projname
394         # there and a 'forks' view will be enabled for the project, listing
395         # all the forks. If project list is taken from a file, forks have
396         # to be listed after the main project.
397
398         # To enable system wide have in $GITWEB_CONFIG
399         # $feature{'forks'}{'default'} = [1];
400         # Project specific override is not supported.
401         'forks' => {
402                 'override' => 0,
403                 'default' => [0]},
404
405         # Insert custom links to the action bar of all project pages.
406         # This enables you mainly to link to third-party scripts integrating
407         # into gitweb; e.g. git-browser for graphical history representation
408         # or custom web-based repository administration interface.
409
410         # The 'default' value consists of a list of triplets in the form
411         # (label, link, position) where position is the label after which
412         # to insert the link and link is a format string where %n expands
413         # to the project name, %f to the project path within the filesystem,
414         # %h to the current hash (h gitweb parameter) and %b to the current
415         # hash base (hb gitweb parameter); %% expands to %.
416
417         # To enable system wide have in $GITWEB_CONFIG e.g.
418         # $feature{'actions'}{'default'} = [('graphiclog',
419         #       '/git-browser/by-commit.html?r=%n', 'summary')];
420         # Project specific override is not supported.
421         'actions' => {
422                 'override' => 0,
423                 'default' => []},
424
425         # Allow gitweb to scan project content tags of project repository,
426         # and display the popular Web 2.0-ish "tag cloud" near the projects
427         # list.  Note that this is something COMPLETELY different from the
428         # normal Git tags.
429
430         # gitweb by itself can show existing tags, but it does not handle
431         # tagging itself; you need to do it externally, outside gitweb.
432         # The format is described in git_get_project_ctags() subroutine.
433         # You may want to install the HTML::TagCloud Perl module to get
434         # a pretty tag cloud instead of just a list of tags.
435
436         # To enable system wide have in $GITWEB_CONFIG
437         # $feature{'ctags'}{'default'} = [1];
438         # Project specific override is not supported.
439
440         # In the future whether ctags editing is enabled might depend
441         # on the value, but using 1 should always mean no editing of ctags.
442         'ctags' => {
443                 'override' => 0,
444                 'default' => [0]},
445
446         # The maximum number of patches in a patchset generated in patch
447         # view. Set this to 0 or undef to disable patch view, or to a
448         # negative number to remove any limit.
449
450         # To disable system wide have in $GITWEB_CONFIG
451         # $feature{'patches'}{'default'} = [0];
452         # To have project specific config enable override in $GITWEB_CONFIG
453         # $feature{'patches'}{'override'} = 1;
454         # and in project config gitweb.patches = 0|n;
455         # where n is the maximum number of patches allowed in a patchset.
456         'patches' => {
457                 'sub' => \&feature_patches,
458                 'override' => 0,
459                 'default' => [16]},
460
461         # Avatar support. When this feature is enabled, views such as
462         # shortlog or commit will display an avatar associated with
463         # the email of the committer(s) and/or author(s).
464
465         # Currently available providers are gravatar and picon.
466         # If an unknown provider is specified, the feature is disabled.
467
468         # Gravatar depends on Digest::MD5.
469         # Picon currently relies on the indiana.edu database.
470
471         # To enable system wide have in $GITWEB_CONFIG
472         # $feature{'avatar'}{'default'} = ['<provider>'];
473         # where <provider> is either gravatar or picon.
474         # To have project specific config enable override in $GITWEB_CONFIG
475         # $feature{'avatar'}{'override'} = 1;
476         # and in project config gitweb.avatar = <provider>;
477         'avatar' => {
478                 'sub' => \&feature_avatar,
479                 'override' => 0,
480                 'default' => ['']},
481
482         # Enable displaying how much time and how many git commands
483         # it took to generate and display page.  Disabled by default.
484         # Project specific override is not supported.
485         'timed' => {
486                 'override' => 0,
487                 'default' => [0]},
488
489         # Enable turning some links into links to actions which require
490         # JavaScript to run (like 'blame_incremental').  Not enabled by
491         # default.  Project specific override is currently not supported.
492         'javascript-actions' => {
493                 'override' => 0,
494                 'default' => [0]},
495
496         # Enable and configure ability to change common timezone for dates
497         # in gitweb output via JavaScript.  Enabled by default.
498         # Project specific override is not supported.
499         'javascript-timezone' => {
500                 'override' => 0,
501                 'default' => [
502                         'local',     # default timezone: 'utc', 'local', or '(-|+)HHMM' format,
503                                      # or undef to turn off this feature
504                         'gitweb_tz', # name of cookie where to store selected timezone
505                         'datetime',  # CSS class used to mark up dates for manipulation
506                 ]},
507
508         # Syntax highlighting support. This is based on Daniel Svensson's
509         # and Sham Chukoury's work in gitweb-xmms2.git.
510         # It requires the 'highlight' program present in $PATH,
511         # and therefore is disabled by default.
512
513         # To enable system wide have in $GITWEB_CONFIG
514         # $feature{'highlight'}{'default'} = [1];
515
516         'highlight' => {
517                 'sub' => sub { feature_bool('highlight', @_) },
518                 'override' => 0,
519                 'default' => [0]},
520
521         # Enable displaying of remote heads in the heads list
522
523         # To enable system wide have in $GITWEB_CONFIG
524         # $feature{'remote_heads'}{'default'} = [1];
525         # To have project specific config enable override in $GITWEB_CONFIG
526         # $feature{'remote_heads'}{'override'} = 1;
527         # and in project config gitweb.remote_heads = 0|1;
528         'remote_heads' => {
529                 'sub' => sub { feature_bool('remote_heads', @_) },
530                 'override' => 0,
531                 'default' => [0]},
532 );
533
# Return the effective value (a list) of the feature called $name.
#
# Nothing is returned for a name that has no entry in %feature.  Otherwise
# the entry's 'default' list is returned, except when the entry's 'override'
# flag is true and $git_dir is defined: then the entry's 'sub' is called with
# the defaults and its result is returned.  An entry that allows override
# but has no 'sub' produces a warning and yields the defaults.
sub gitweb_get_feature {
        my ($name) = @_;
        return unless exists $feature{$name};

        my $entry    = $feature{$name};
        my @defaults = @{$entry->{'default'}};

        # project specific override is possible only if we have project
        our $git_dir; # global variable, declared later
        return @defaults
                unless $entry->{'override'} && defined $git_dir;

        my $feature_sub = $entry->{'sub'};
        unless (defined $feature_sub) {
                warn "feature $name is not overridable";
                return @defaults;
        }
        return $feature_sub->(@defaults);
}
552
# Convenience wrapper returning only the first element of a feature's value,
# which is what boolean-like features need.  It lets callers write
#
#   my $bool_feat = gitweb_check_feature('bool_feat');
#   gitweb_check_feature('bool_feat') or somecode;
#
# rather than
#
#   my ($bool_feat) = gitweb_get_feature('bool_feat');
#   (gitweb_get_feature('bool_feat'))[0] or somecode;
#
sub gitweb_check_feature {
        my @values = gitweb_get_feature(@_);
        # an empty feature value yields an empty list (undef in scalar context)
        return @values ? $values[0] : ();
}
567
568
# Feature-sub for boolean features.
#
# Parameters: the project config key (looked up through
# git_get_project_config() with '--bool'), followed by the feature's
# default option list.
# Returns a one-element list: 1 or 0 when the project config value is
# 'true' or 'false', otherwise the first default option.
sub feature_bool {
        my ($key, @defaults) = @_;
        my ($val) = git_get_project_config($key, '--bool');

        return ($defaults[0]) unless defined $val;
        return (1) if $val eq 'true';
        return (0) if $val eq 'false';

        # Any other value: fall back to the site default explicitly instead
        # of running off the end of the sub with an unspecified return value.
        return ($defaults[0]);
}
581
# Feature-sub for 'snapshot'.
#
# Takes the default list of snapshot formats and returns the list to offer:
# the defaults when the project config has no (true) 'snapshot' value, an
# empty list when that value is 'none', and otherwise the value split on
# commas and/or whitespace.
sub feature_snapshot {
        my @fmts = @_;

        my ($val) = git_get_project_config('snapshot');
        return @fmts unless $val;

        if ($val eq 'none') {
                @fmts = ();
        } else {
                @fmts = split /\s*[,\s]\s*/, $val;
        }
        return @fmts;
}
593
# Feature-sub for 'patches'.
#
# Returns whatever list git_get_project_config('patches', '--int') yields
# when that list is non-empty, otherwise the first default option.
# NOTE(review): if git_get_project_config() returns a one-element list
# holding undef for an unset key, the default is never used -- confirm
# against its implementation.
sub feature_patches {
        my ($default) = @_;
        my @configured = (git_get_project_config('patches', '--int'));

        return @configured ? @configured : ($default);
}
603
# Feature-sub for 'avatar'.
#
# Returns the list produced by git_get_project_config('avatar') when it is
# non-empty, otherwise the default options it was called with.
sub feature_avatar {
        my @configured = (git_get_project_config('avatar'));

        return @configured if @configured;
        return @_;
}
609
# Tell whether directory $dir has a usable HEAD.
#
# Testing the HEAD file with -e alone is fragile: a repository initialized
# long ago may have HEAD as a symlink, and after pack-refs and pruning that
# symlink can dangle.  Such a symlink is still accepted as long as it points
# below refs/heads/.
sub check_head_link {
        my ($dir) = @_;
        my $headfile = "$dir/HEAD";

        my $exists = -e $headfile;
        return $exists if $exists;

        return (-l $headfile && readlink($headfile) =~ /^refs\/heads\//);
}
619
# Decide whether the repository in $dir may be shown.  All of these must hold:
#  - check_head_link($dir) succeeds;
#  - $export_ok is unset/false, or the file "$dir/$export_ok" exists;
#  - $export_auth_hook is unset/false, or it returns true for $dir.
sub check_export_ok {
        my ($dir) = @_;

        my $head_ok = check_head_link($dir);
        return $head_ok unless $head_ok;

        my $marker_ok = !$export_ok || -e "$dir/$export_ok";
        return $marker_ok unless $marker_ok;

        return (!$export_auth_hook || $export_auth_hook->($dir));
}
626
# Normalize a list of snapshot format names.
#
# Alternate names are translated through %known_snapshot_format_aliases
# (backward compatibility), then every name that is not a key of
# %known_snapshot_formats, or whose entry is flagged 'disabled', is
# filtered out.  Returns the remaining names (their count in scalar context).
sub filter_snapshot_fmts {
        my @fmts = grep { defined } @_;

        @fmts = map {
                exists $known_snapshot_format_aliases{$_} ?
                       $known_snapshot_format_aliases{$_} : $_} @fmts;

        # Legacy aliases map to undef on purpose; drop them before they are
        # used as hash keys, which would emit "uninitialized value" warnings.
        @fmts = grep {
                defined $_ &&
                exists $known_snapshot_formats{$_} &&
                !$known_snapshot_formats{$_}{'disabled'}} @fmts;

        return @fmts;
}
639
640 # If it is set to a code reference, it is code that is to be run once per
641 # request, allowing updating configurations that change with each request,
642 # while running other code in config file only once.
643 #
644 # Otherwise, if it is false then gitweb would process config file only once;
645 # if it is true then gitweb config would be run for each request.
646 our $per_request_config = 1;
647
# Read and parse the gitweb config file named by the single parameter.
#
# Returns true when the file exists and was processed; returns false (empty
# list / undef) when no filename was given or the file does not exist, so
# calls can be chained to use the first file that exists.
# Dies when the config file fails to parse, as that is unrecoverable.
sub read_config_file {
        my $filename = shift;
        return unless defined $filename;
        return unless -e $filename;

        # `do FILE` looks a relative name up in @INC unless it starts with
        # ./ or ../, so it may not load the file that -e just checked; on
        # perl >= 5.26 ('.' no longer in @INC) it would load nothing at all.
        # Resolving against the current directory avoids the @INC search.
        require File::Spec;
        my $path = File::Spec->rel2abs($filename);

        do $path;
        # die if there are errors parsing config file
        die $@ if $@;
        return 1;
}
663
# Locations of the per-instance and system-wide config files; both are
# (re)assigned by evaluate_gitweb_config().
our ($GITWEB_CONFIG, $GITWEB_CONFIG_SYSTEM);

# Pick the config file locations (environment variables take precedence over
# the built-in values) and process the first of the two files that exists.
sub evaluate_gitweb_config {
        our $GITWEB_CONFIG = $ENV{'GITWEB_CONFIG'} || "++GITWEB_CONFIG++";
        our $GITWEB_CONFIG_SYSTEM = $ENV{'GITWEB_CONFIG_SYSTEM'} || "++GITWEB_CONFIG_SYSTEM++";

        # use first config file that exists
        my $loaded = read_config_file($GITWEB_CONFIG);
        return $loaded if $loaded;
        return read_config_file($GITWEB_CONFIG_SYSTEM);
}
673
# Get loadavg of system, to compare against $maxload.
# Currently it requires '/proc/loadavg' to be present; if it is missing,
# cannot be opened or yields no data, 0 is returned, which means no load
# checking.
sub get_loadavg {
        if (-e '/proc/loadavg') {
                open my $fd, '<', '/proc/loadavg'
                        or return 0;
                my $line = <$fd>;
                close $fd;

                # nothing could be read: treat as "load unknown"
                return 0 unless defined $line;

                # The first three columns are the load averages over the
                # last 1, 5 and 15 minutes.  The fourth column shows the
                # number of currently running processes and the total number
                # of processes in the m/n format.  The last column displays
                # the last process ID used.  Only the 1-minute value is used.
                my ($one_minute) = split ' ', $line;
                return $one_minute || 0;
        }
        # additional checks for load average should go here for things that
        # don't export /proc/loadavg

        return 0;
}
695
# version of the core git binary
our $git_version;

# Run "$GIT --version" and store the reported version in $git_version
# ("unknown" when the output has no "git version ..." line); the run is
# counted in $number_of_git_cmds.
sub evaluate_git_version {
        my $output = qx("$GIT" --version);

        our $git_version = "unknown";
        if ($output =~ m/git version (.*)$/) {
                $git_version = $1;
        }
        $number_of_git_cmds++;
}
702
# Report a 503 error through die_error() when load checking is enabled
# ($maxload is defined) and the value from get_loadavg() is above $maxload.
sub check_loadavg {
        die_error(503, "The load average on the server is too high")
                if defined $maxload && get_loadavg() > $maxload;
}
708
709 # ======================================================================
710 # input validation and dispatch
711
712 # input parameters can be collected from a variety of sources (presently, CGI
713 # and PATH_INFO), so we define an %input_params hash that collects them all
714 # together during validation: this allows subsequent uses (e.g. href()) to be
715 # agnostic of the parameter origin
716
717 our %input_params = ();
718
719 # input parameters are stored with the long parameter name as key. This will
720 # also be used in the href subroutine to convert parameters to their CGI
721 # equivalent, and since the href() usage is the most frequent one, we store
722 # the name -> CGI key mapping here, instead of the reverse.
723 #
724 # XXX: Warning: If you touch this, check the search form for updating,
725 # too.
726
727 our @cgi_param_mapping = (
728         project => "p",
729         action => "a",
730         file_name => "f",
731         file_parent => "fp",
732         hash => "h",
733         hash_parent => "hp",
734         hash_base => "hb",
735         hash_parent_base => "hpb",
736         page => "pg",
737         order => "o",
738         searchtext => "s",
739         searchtype => "st",
740         snapshot_format => "sf",
741         extra_options => "opt",
742         search_use_regexp => "sr",
743         ctag => "by_tag",
744         # this must be last entry (for manipulation from JavaScript)
745         javascript => "js"
746 );
747 our %cgi_param_mapping = @cgi_param_mapping;
748
# Dispatch table: action name => handler subroutine.  It doubles as the
# list of known actions used when validating the 'a' parameter.
our %actions = (
	blame             => \&git_blame,
	blame_incremental => \&git_blame_incremental,
	blame_data        => \&git_blame_data,
	blobdiff          => \&git_blobdiff,
	blobdiff_plain    => \&git_blobdiff_plain,
	blob              => \&git_blob,
	blob_plain        => \&git_blob_plain,
	commitdiff        => \&git_commitdiff,
	commitdiff_plain  => \&git_commitdiff_plain,
	commit            => \&git_commit,
	forks             => \&git_forks,
	heads             => \&git_heads,
	history           => \&git_history,
	log               => \&git_log,
	patch             => \&git_patch,
	patches           => \&git_patches,
	remotes           => \&git_remotes,
	rss               => \&git_rss,
	atom              => \&git_atom,
	search            => \&git_search,
	search_help       => \&git_search_help,
	shortlog          => \&git_shortlog,
	summary           => \&git_summary,
	tag               => \&git_tag,
	tags              => \&git_tags,
	tree              => \&git_tree,
	snapshot          => \&git_snapshot,
	object            => \&git_object,
	# those below don't need $project
	opml              => \&git_opml,
	project_list      => \&git_project_list,
	project_index     => \&git_project_index,
);
784
# Extra options ('opt' parameter) that may be passed through, each mapped
# to the list of actions that accept it.
our %allowed_options = (
	'--no-merges' => [ 'rss', 'atom', 'log', 'shortlog', 'history' ],
);
790
# Populate %input_params from the CGI query string.  Every parameter is
# stored as a single value except 'opt' (extra_options), which may be
# repeated and is therefore stored as an array reference.  Should more
# multi-valued parameters appear, a list of them would be the better
# approach; for now this one is simply special-cased.
sub evaluate_query_params {
	our $cgi;

	foreach my $name (keys %cgi_param_mapping) {
		my $symbol = $cgi_param_mapping{$name};
		# the scalar assignment keeps param() in scalar context for
		# the single-valued case
		$input_params{$name} = ($symbol eq 'opt')
			? [ $cgi->param($symbol) ]
			: $cgi->param($symbol);
	}
}
806
# Read PATH_INFO and fill in the parameters that were not already given
# in the query string.
#
# The path has the general shape
#   $project[/$action][/[$parent_ref[:$parent_path]..]$ref[:$path]]
# Does nothing when the project was given as a CGI parameter or when
# PATH_INFO is empty; parameters already present in %input_params are
# never overwritten (everything is assigned with ||=), and if an action
# was given in the query string only the project is taken from the path.
sub evaluate_path_info {
	return if defined $input_params{'project'};
	return if !$path_info;
	$path_info =~ s,^/+,,;
	return if !$path_info;

	# find which part of PATH_INFO is project: strip trailing path
	# components until what is left is accepted by check_head_link()
	my $project = $path_info;
	$project =~ s,/+$,,;
	while ($project && !check_head_link("$projectroot/$project")) {
		$project =~ s,/*[^/]*$,,;
	}
	return unless $project;
	$input_params{'project'} = $project;

	# do not change any parameters if an action is given using the query string
	return if $input_params{'action'};
	$path_info =~ s,^\Q$project\E/*,,;

	# next, check if we have an action
	my $action = $path_info;
	$action =~ s,/.*$,,;
	if (exists $actions{$action}) {
		# quote the action so that it is always matched literally
		$path_info =~ s,^\Q$action\E/*,,;
		$input_params{'action'} = $action;
	}

	# actions that want hash_base instead of hash, but can have no
	# pathname (f) parameter
	my %wants_base = map { $_ => 1 } ('tree', 'history');

	# we want to catch, among others
	# [$hash_parent_base[:$file_parent]..]$hash_parent[:$file_name]
	my ($parentrefname, $parentpathname, $refname, $pathname) =
		($path_info =~ /^(?:(.+?)(?::(.+))?\.\.)?([^:]+?)?(?::(.+))?$/);

	# first, analyze the 'current' part
	if (defined $pathname) {
		# we got "branch:filename" or "branch:dir/"
		# we could use git_get_type(branch:pathname), but:
		# - it needs $git_dir
		# - it does a git() call
		# - the convention of terminating directories with a slash
		#   makes it superfluous
		# - embedding the action in the PATH_INFO would make it even
		#   more superfluous
		$pathname =~ s,^/+,,;
		if (!$pathname || substr($pathname, -1) eq "/") {
			$input_params{'action'} ||= "tree";
			$pathname =~ s,/$,,;
		} else {
			# the default action depends on whether we had parent info
			# or not
			if ($parentrefname) {
				$input_params{'action'} ||= "blobdiff_plain";
			} else {
				$input_params{'action'} ||= "blob_plain";
			}
		}
		$input_params{'hash_base'} ||= $refname;
		$input_params{'file_name'} ||= $pathname;
	} elsif (defined $refname) {
		# we got "branch". In this case we have to choose if we have to
		# set hash or hash_base.
		#
		# Most of the actions without a pathname only want hash to be
		# set, except for the ones listed in %wants_base that want
		# hash_base instead. It should also be noted that hand-crafted
		# links having 'history' as an action and no pathname or hash
		# set will fail, but that happens regardless of PATH_INFO.
		if (defined $parentrefname) {
			# if there is parent let the default be 'shortlog' action
			# (for http://git.example.com/repo.git/A..B links); if there
			# is no parent, dispatch will detect type of object and set
			# action appropriately if required (if action is not set)
			$input_params{'action'} ||= "shortlog";
		}
		if ($input_params{'action'} &&
		    $wants_base{$input_params{'action'}}) {
			$input_params{'hash_base'} ||= $refname;
		} else {
			$input_params{'hash'} ||= $refname;
		}
	}

	# next, handle the 'parent' part, if present
	if (defined $parentrefname) {
		# a missing pathspec defaults to the 'current' filename, allowing e.g.
		# someproject/blobdiff/oldrev..newrev:/filename
		if ($parentpathname) {
			$parentpathname =~ s,^/+,,;
			$parentpathname =~ s,/$,,;
			$input_params{'file_parent'} ||= $parentpathname;
		} else {
			$input_params{'file_parent'} ||= $input_params{'file_name'};
		}
		# we assume that hash_parent_base is wanted if a path was specified,
		# or if the action wants hash_base instead of hash.  The action can
		# still be unset here (e.g. for "A.." with nothing after the dots),
		# so check that it is defined before looking it up.
		if (defined $input_params{'file_parent'} ||
		    (defined $input_params{'action'} &&
		     $wants_base{$input_params{'action'}})) {
			$input_params{'hash_parent_base'} ||= $parentrefname;
		} else {
			$input_params{'hash_parent'} ||= $parentrefname;
		}
	}

	# for the snapshot action, we allow URLs in the form
	# $project/snapshot/$hash.ext
	# where .ext determines the snapshot and gets removed from the
	# passed $refname to provide the $hash.
	#
	# To be able to tell that $refname includes the format extension, we
	# require the following two conditions to be satisfied:
	# - the hash input parameter MUST have been set from the $refname part
	#   of the URL (i.e. they must be equal)
	# - the snapshot format MUST NOT have been defined already (e.g. from
	#   CGI parameter sf)
	# It's also useless to try any matching unless $refname has a dot,
	# so we check for that too
	if (defined $input_params{'action'} &&
		$input_params{'action'} eq 'snapshot' &&
		defined $refname && index($refname, '.') != -1 &&
		defined $input_params{'hash'} &&
		$refname eq $input_params{'hash'} &&
		!defined $input_params{'snapshot_format'}) {
		# We loop over the known snapshot formats, checking for
		# extensions. Allowed extensions are both the defined suffix
		# (which includes the initial dot already) and the snapshot
		# format key itself, with a prepended dot.
		#
		# The loop walks a list of keys instead of using each():
		# leaving an each() loop early with 'last' would leave the
		# hash iterator in the middle of the hash, and in a persistent
		# environment the next request would then resume from there
		# and could miss formats.
		foreach my $fmt (keys %known_snapshot_formats) {
			my $opt = $known_snapshot_formats{$fmt};
			my $hash = $refname;
			unless ($hash =~ s/(\Q$opt->{'suffix'}\E|\Q.$fmt\E)$//) {
				next;
			}
			my $sfx = $1;
			# a valid suffix was found, so set the snapshot format
			# and reset the hash parameter
			$input_params{'snapshot_format'} = $fmt;
			$input_params{'hash'} = $hash;
			# we also set the format suffix to the one requested
			# in the URL: this way a request for e.g. .tgz returns
			# a .tgz instead of a .tar.gz
			$known_snapshot_formats{$fmt}{'suffix'} = $sfx;
			last;
		}
	}
}
957
our ($action, $project, $file_name, $file_parent, $hash, $hash_parent, $hash_base,
     $hash_parent_base, @extra_options, $page, $searchtype, $search_use_regexp,
     $searchtext, $search_regexp);

# Copy the collected %input_params into the per-request global variables,
# validating each of them on the way.  Any invalid value ends the request
# through die_error() with a 4xx status.
sub evaluate_and_validate_params {
	our $action = $input_params{'action'};
	if (defined $action) {
		if (!validate_action($action)) {
			die_error(400, "Invalid action parameter");
		}
	}

	# parameters which are pathnames
	our $project = $input_params{'project'};
	if (defined $project) {
		if (!validate_project($project)) {
			# forget the bogus project before the error is reported
			undef $project;
			die_error(404, "No such project");
		}
	}

	our $file_name = $input_params{'file_name'};
	if (defined $file_name) {
		if (!validate_pathname($file_name)) {
			die_error(400, "Invalid file parameter");
		}
	}

	our $file_parent = $input_params{'file_parent'};
	if (defined $file_parent) {
		if (!validate_pathname($file_parent)) {
			die_error(400, "Invalid file parent parameter");
		}
	}

	# parameters which are refnames
	our $hash = $input_params{'hash'};
	if (defined $hash) {
		if (!validate_refname($hash)) {
			die_error(400, "Invalid hash parameter");
		}
	}

	our $hash_parent = $input_params{'hash_parent'};
	if (defined $hash_parent) {
		if (!validate_refname($hash_parent)) {
			die_error(400, "Invalid hash parent parameter");
		}
	}

	our $hash_base = $input_params{'hash_base'};
	if (defined $hash_base) {
		if (!validate_refname($hash_base)) {
			die_error(400, "Invalid hash base parameter");
		}
	}

	# extra_options is normally always an array reference, since it can
	# only be (currently) set from CGI, and $cgi->param() returns the empty
	# list in list context if the param is not set; fall back to an empty
	# list anyway so that a missing entry cannot abort under 'use strict'
	our @extra_options = @{ $input_params{'extra_options'} || [] };
	foreach my $opt (@extra_options) {
		if (not exists $allowed_options{$opt}) {
			die_error(400, "Invalid option parameter");
		}
		# compare as strings: the action may be unset at this point, and
		# it should never be interpreted as a regular expression
		if (not (defined $action &&
		         grep { $_ eq $action } @{$allowed_options{$opt}})) {
			die_error(400, "Invalid option parameter for this action");
		}
	}

	our $hash_parent_base = $input_params{'hash_parent_base'};
	if (defined $hash_parent_base) {
		if (!validate_refname($hash_parent_base)) {
			die_error(400, "Invalid hash parent base parameter");
		}
	}

	# other parameters
	our $page = $input_params{'page'};
	if (defined $page) {
		if ($page =~ m/[^0-9]/) {
			die_error(400, "Invalid page parameter");
		}
	}

	our $searchtype = $input_params{'searchtype'};
	if (defined $searchtype) {
		if ($searchtype =~ m/[^a-z]/) {
			die_error(400, "Invalid searchtype parameter");
		}
	}

	our $search_use_regexp = $input_params{'search_use_regexp'};

	our $searchtext = $input_params{'searchtext'};
	# reset explicitly, so that a regexp from an earlier request does not
	# survive in persistent environments
	our $search_regexp = undef;
	if (defined $searchtext) {
		if (length($searchtext) < 2) {
			die_error(403, "At least two characters are required for search parameter");
		}
		if ($search_use_regexp) {
			# the text is used as a pattern as-is; reject it right away
			# if it does not compile, instead of failing later with an
			# internal server error
			if (!eval { qr/$searchtext/; 1; }) {
				die_error(400, "Invalid search regexp");
			}
			$search_regexp = $searchtext;
		} else {
			$search_regexp = quotemeta $searchtext;
		}
	}
}
1060
# path to the current git repository
our $git_dir;

# Derive $git_dir from the validated $project.  The variable is always
# assigned, so that a request without a project does not inherit the
# repository path of the previous request in persistent environments.
sub evaluate_git_dir {
	our $git_dir = $project ? "$projectroot/$project" : undef;
}
1066
our (@snapshot_fmts, $git_avatar);

# Evaluate the features whose value needs post-processing before use:
# the list of snapshot formats and the avatar provider.
sub configure_gitweb_features {
	# list of supported snapshot formats
	our @snapshot_fmts = filter_snapshot_fmts(gitweb_get_feature('snapshot'));

	# The avatar feature must name a known provider whose dependencies
	# are available; in every other case $git_avatar is reset to the
	# empty string.
	our ($git_avatar) = gitweb_get_feature('avatar');
	if ($git_avatar eq 'gravatar') {
		# gravatar needs Digest::MD5
		eval { require Digest::MD5; 1; }
			or $git_avatar = '';
	} elsif ($git_avatar ne 'picon') {
		# picon has no dependencies; anything else is unknown
		$git_avatar = '';
	}
}
1086
# Custom error handler installed through CGI::Carp::set_message():
# a plain 'die <message>' is reported as Internal Server Error.
sub handle_errors_html {
	my ($msg) = @_; # it is already HTML escaped

	# Switch back to a plain-text message first: should die_error itself
	# fail, this prevents an infinite loop through this handler.
	set_message("Error occured when inside die_error:\n$msg");

	# The handler set via CGI::Carp::set_message is called _after_ the
	# HTTP headers are already written, so die_error must neither write
	# them itself nor try to jump out of the handler.
	die_error(undef, undef, $msg, -error_handler => 1, -no_http_header => 1);
}
set_message(\&handle_errors_html);
1101
# Pick the action to run (guessing it from the other parameters when it
# was not given explicitly), make sure it is known and has the project it
# needs, then call its handler from %actions.
sub dispatch {
	if (!defined $action) {
		if (defined $hash) {
			$action = git_get_type($hash);
			# presumably git_get_type() yields nothing for an object it
			# cannot resolve; report that instead of using an undefined
			# value as the action name below
			$action or die_error(404, "Object does not exist");
		} elsif (defined $hash_base && defined $file_name) {
			$action = git_get_type("$hash_base:$file_name");
			$action or die_error(404, "File or directory does not exist");
		} elsif (defined $project) {
			$action = 'summary';
		} else {
			$action = 'project_list';
		}
	}
	if (!defined($actions{$action})) {
		die_error(400, "Unknown action");
	}
	# only the listing actions can work without a project
	if ($action !~ m/^(?:opml|project_list|project_index)$/ &&
	    !$project) {
		die_error(400, "Project needed");
	}
	$actions{$action}->();
}
1124
# Restart the per-request statistics: the start time (only when timing
# is in use, i.e. $t0 is defined) and the count of git commands run.
sub reset_timer {
	our ($t0, $number_of_git_cmds);

	if (defined $t0) {
		$t0 = [ gettimeofday() ];
	}
	$number_of_git_cmds = 0;
}
1130
our $first_request = 1;

# Serve a single request: refresh the per-request state, (re)read the
# configuration as needed, collect and validate the input parameters,
# and finally dispatch to the requested action.
sub run_request {
	reset_timer();
	evaluate_uri();

	# configuration file and git version are evaluated once per process
	if ($first_request) {
		evaluate_gitweb_config();
		evaluate_git_version();
	}

	# $per_request_config is either a subroutine to run on every
	# request, or a true value asking to re-read the configuration
	# (which on the first request has just been read above)
	if (ref($per_request_config) eq 'CODE') {
		$per_request_config->();
	} elsif ($per_request_config && !$first_request) {
		evaluate_gitweb_config();
	}

	check_loadavg();

	# $projectroot and $projects_list might be set in gitweb config file
	$projects_list ||= $projectroot;

	# input parameters: query string first, then PATH_INFO for the rest
	evaluate_query_params();
	evaluate_path_info();
	evaluate_and_validate_params();
	evaluate_git_dir();

	configure_gitweb_features();

	dispatch();
}
1161
# A plain CGI process serves exactly one request
our $is_last_request = sub { 1 };
our ($pre_dispatch_hook, $post_dispatch_hook, $pre_listen_hook);
# class used to create the request object in run()
our $CGI = 'CGI';
our $cgi;

# Switch to FastCGI operation: requests are created through CGI::Fast,
# and each process serves a limited number of them before finishing.
sub configure_as_fcgi {
	require CGI::Fast;
	our $CGI = 'CGI::Fast';

	my $request_number = 0;
	# let each child service 100 requests; this check runs after a
	# request has been served, so the 100th one must be the last
	our $is_last_request = sub { ++$request_number >= 100 };
}
# Work out the mode of operation from the script name and the command
# line: a name ending in '.fcgi' or the --fastcgi option selects FastCGI,
# and --nproc=<n> additionally sets up an FCGI::ProcManager with <n>
# processes (silently ignored when that module cannot be loaded).
sub evaluate_argv {
	my $script_name = $ENV{'SCRIPT_NAME'} || $ENV{'SCRIPT_FILENAME'} || __FILE__;
	if ($script_name =~ /\.fcgi$/) {
		configure_as_fcgi();
	}

	return unless (@ARGV);

	# handler for --nproc: installs the process manager hooks used by run()
	my $setup_proc_manager = sub {
		my ($arg, $val) = @_;
		return unless eval { require FCGI::ProcManager; 1; };
		my $proc_manager = FCGI::ProcManager->new({
			n_processes => $val,
		});
		our $pre_listen_hook    = sub { $proc_manager->pm_manage()        };
		our $pre_dispatch_hook  = sub { $proc_manager->pm_pre_dispatch()  };
		our $post_dispatch_hook = sub { $proc_manager->pm_post_dispatch() };
	};

	require Getopt::Long;
	Getopt::Long::GetOptions(
		'fastcgi|fcgi|f' => \&configure_as_fcgi,
		'nproc|n=i' => $setup_proc_manager,
	);
}
1196
# Main loop: evaluate the command line, then create and serve request
# objects until the request class stops providing them or
# $is_last_request says to stop.  The optional hooks are called before
# listening and around each request.
sub run {
	evaluate_argv();

	$first_request = 1;
	$pre_listen_hook and $pre_listen_hook->();

 REQUEST:
	while ($cgi = $CGI->new()) {
		$pre_dispatch_hook and $pre_dispatch_hook->();

		run_request();

		$post_dispatch_hook and $post_dispatch_hook->();
		$first_request = 0;

		if ($is_last_request->()) {
			last REQUEST;
		}
	}

	# label with a statement of its own, so that it is a valid jump target
 DONE_GITWEB:
	1;
}
1221
run();

# When wrapped in a subroutine processing requests (e.g. mod_perl with
# ModPerl::Registry, or PSGI with Plack::App::WrapCGI), hand control back
# to the wrapper; as a pure CGI script serving a single request, exit.
return if defined caller;
exit;
1232
1233 ## ======================================================================
1234 ## action links
1235
# Build a gitweb URL from named parameters (the long names used as keys
# of %cgi_param_mapping).  The project defaults to the current one.
#
# possible values of extra options
# -full => 0|1      - use absolute/full URL ($my_uri/$my_url as base)
# -replay => 1      - start from a current view (replay with modifications)
# -path_info => 0|1 - don't use/use path_info URL (if possible)
# -anchor => ANCHOR - add #ANCHOR to end of URL, implies -replay if used alone
#
# Returns the URL as a string.
sub href {
	my %params = @_;
	# default is to use -absolute url() i.e. $my_uri
	my $href = $params{-full} ? $my_url : $my_uri;

	# implicit -replay, must be first of implicit params
	$params{-replay} = 1 if (keys %params == 1 && $params{-anchor});

	$params{'project'} = $project unless exists $params{'project'};

	if ($params{-replay}) {
		# take over every parameter of the current request that the
		# caller did not override
		while (my ($name, $symbol) = each %cgi_param_mapping) {
			if (!exists $params{$name}) {
				$params{$name} = $input_params{$name};
			}
		}
	}

	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if (defined $params{'project'} &&
	    (exists $params{-path_info} ? $params{-path_info} : $use_pathinfo)) {
		# try to put as many parameters as possible in PATH_INFO:
		#   - project name
		#   - action
		#   - hash_parent or hash_parent_base:/file_parent
		#   - hash or hash_base:/filename
		#   - the snapshot_format as an appropriate suffix

		# When the script is the root DirectoryIndex for the domain,
		# $href here would be something like http://gitweb.example.com/
		# Thus, we strip any trailing / from $href, to spare us double
		# slashes in the final URL
		$href =~ s,/$,,;

		# Then add the project name, if present
		$href .= "/".esc_path_info($params{'project'});
		delete $params{'project'};

		# since we destructively absorb parameters, we keep this
		# boolean that remembers if we're handling a snapshot; the
		# action may be missing altogether, so test for that first
		my $is_snapshot = (defined $params{'action'} &&
		                   $params{'action'} eq 'snapshot');

		# Summary just uses the project path URL, any other action is
		# added to the URL
		if (defined $params{'action'}) {
			$href .= "/".esc_path_info($params{'action'})
				unless $params{'action'} eq 'summary';
			delete $params{'action'};
		}

		# Next, we put hash_parent_base:/file_parent..hash_base:/file_name,
		# stripping nonexistent or useless pieces
		$href .= "/" if ($params{'hash_base'} || $params{'hash_parent_base'}
			|| $params{'hash_parent'} || $params{'hash'});
		if (defined $params{'hash_base'}) {
			if (defined $params{'hash_parent_base'}) {
				$href .= esc_path_info($params{'hash_parent_base'});
				# skip the file_parent if it's the same as the file_name
				if (defined $params{'file_parent'}) {
					if (defined $params{'file_name'} && $params{'file_parent'} eq $params{'file_name'}) {
						delete $params{'file_parent'};
					} elsif ($params{'file_parent'} !~ /\.\./) {
						# a name containing '..' cannot go into the path,
						# it is left to be passed as a query parameter
						$href .= ":/".esc_path_info($params{'file_parent'});
						delete $params{'file_parent'};
					}
				}
				$href .= "..";
				delete $params{'hash_parent'};
				delete $params{'hash_parent_base'};
			} elsif (defined $params{'hash_parent'}) {
				$href .= esc_path_info($params{'hash_parent'}). "..";
				delete $params{'hash_parent'};
			}

			$href .= esc_path_info($params{'hash_base'});
			if (defined $params{'file_name'} && $params{'file_name'} !~ /\.\./) {
				$href .= ":/".esc_path_info($params{'file_name'});
				delete $params{'file_name'};
			}
			delete $params{'hash'};
			delete $params{'hash_base'};
		} elsif (defined $params{'hash'}) {
			$href .= esc_path_info($params{'hash'});
			delete $params{'hash'};
		}

		# If the action was a snapshot, we can absorb the
		# snapshot_format parameter too
		if ($is_snapshot) {
			my $fmt = $params{'snapshot_format'};
			# snapshot_format should always be defined when href()
			# is called, but just in case some code forgets, we
			# fall back to the default
			$fmt ||= $snapshot_fmts[0];
			$href .= $known_snapshot_formats{$fmt}{'suffix'};
			delete $params{'snapshot_format'};
		}
	}

	# now encode the parameters explicitly; walk the array form of the
	# mapping so that they are always emitted in the same order
	my @result = ();
	for (my $i = 0; $i < @cgi_param_mapping; $i += 2) {
		my ($name, $symbol) = ($cgi_param_mapping[$i], $cgi_param_mapping[$i+1]);
		if (defined $params{$name}) {
			if (ref($params{$name}) eq "ARRAY") {
				foreach my $par (@{$params{$name}}) {
					push @result, $symbol . "=" . esc_param($par);
				}
			} else {
				push @result, $symbol . "=" . esc_param($params{$name});
			}
		}
	}
	$href .= "?" . join(';', @result) if scalar @result;

	# final transformation: trailing spaces must be escaped (URI-encoded)
	$href =~ s/(\s+)$/CGI::escape($1)/e;

	if ($params{-anchor}) {
		$href .= "#".esc_param($params{-anchor});
	}

	return $href;
}
1365
1366
1367 ## ======================================================================
1368 ## validation, quoting/unquoting and escaping
1369
# Return the action name if it is one of the keys of %actions,
# undef otherwise (also for an empty or otherwise false value).
sub validate_action {
	my $input = shift;
	return undef unless $input;
	return exists $actions{$input} ? $input : undef;
}
1375
# Return the project name if it is a valid pathname naming a directory
# below $projectroot that passes check_export_ok() and, when
# $strict_export is set, project_in_list(); return undef otherwise.
sub validate_project {
	my $input = shift;
	return undef unless $input;

	my $dir = "$projectroot/$input";
	return undef unless validate_pathname($input);
	return undef unless -d $dir;
	return undef unless check_export_ok($dir);
	return undef if ($strict_export && !project_in_list($input));

	return $input;
}
1387
# Return the pathname if it is acceptable, undef otherwise.
# A false value (undef, empty string, "0") is never accepted.
sub validate_pathname {
	my $input = shift;
	return undef unless $input;

	# no '.' or '..' as elements of path, i.e. no '.' nor '..'
	# at the beginning, at the end, and between slashes.
	# also this catches doubled slashes
	return undef if $input =~ m!(^|/)(|\.|\.\.)(/|$)!;

	# no null characters
	return undef if $input =~ m!\0!;

	return $input;
}
1403
# Return the ref name if it is acceptable, undef otherwise.
sub validate_refname {
	my $input = shift;
	return undef unless $input;

	# textual hashes are O.K.
	return $input if $input =~ m/^[0-9a-fA-F]{40}$/;

	# it must be correct pathname
	$input = validate_pathname($input);
	return undef unless $input;

	# restrictions on ref name according to git-check-ref-format
	return undef if $input =~ m!(/\.|\.\.|[\000-\040\177 ~^:?*\[]|/$)!;

	return $input;
}
1420
# decode sequences of octets in utf8 into Perl's internal form,
# which is utf-8 with utf8 flag set if needed.  gitweb writes out
# in utf-8 thanks to "binmode STDOUT, ':utf8'" at beginning
#
# Strings that are not valid UTF-8 are decoded from $fallback_encoding
# instead.  Returns undef for undefined input.
sub to_utf8 {
	my $str = shift;
	return undef unless defined $str;

	# utf8::valid() only checks the internal consistency of the string
	# and is true for any plain byte string, so it cannot be used to
	# detect invalid UTF-8.  utf8::decode() converts in place and
	# reports whether the octets were valid UTF-8; a string that is
	# already in character form is returned as it is.
	if (utf8::is_utf8($str) || utf8::decode($str)) {
		return $str;
	} else {
		return decode($fallback_encoding, $str, Encode::FB_DEFAULT);
	}
}
1434
# Quote unsafe characters for use in a query parameter value.  The slash
# is kept as it is: not strictly correct, but quoted slashes look too
# horrible in bookmarks.  Spaces become '+'.
sub esc_param {
	my ($str) = @_;
	defined $str
		or return undef;

	$str =~ s/([^A-Za-z0-9\-_.~()\/:@ ]+)/CGI::escape($1)/eg;
	$str =~ s/ /\+/g;

	return $str;
}
1444
# Quote unsafe characters for use in the PATH_INFO part of a URL;
# the rules differ slightly from those for query parameters.
sub esc_path_info {
	my ($str) = @_;
	defined $str
		or return undef;

	# path_info doesn't treat '+' as space (specially), but '?' must be escaped
	$str =~ s/([^A-Za-z0-9\-_.~();\/;:@&= +]+)/CGI::escape($1)/eg;

	return $str;
}
1455
# Quote unsafe characters in a whole URL; characters that have a meaning
# in the URL syntax therefore cannot be quoted.  Spaces become '+'.
sub esc_url {
	my ($str) = @_;
	defined $str
		or return undef;

	$str =~ s/([^A-Za-z0-9\-_.~();\/;?:@&= ]+)/CGI::escape($1)/eg;
	$str =~ s/ /\+/g;

	return $str;
}
1464
# Quote unsafe characters for use in an HTML attribute value.
# For XHTML conformance escaping '"' to '&quot;' is not enough,
# so all the work is delegated to esc_html().
sub esc_attr {
	my @args = @_;
	return esc_html(@args);
}
1471
# Escape a string for output as HTML text: decode it with to_utf8(),
# escape HTML special characters, and make control characters other than
# tab visible via quot_cec().  With '-nbsp' spaces become '&nbsp;'.
sub esc_html {
	my ($str, %opts) = @_;

	defined $str
		or return undef;

	$str = $cgi->escapeHTML(to_utf8($str));
	$str =~ s/ /&nbsp;/g
		if $opts{'-nbsp'};
	$str =~ s|([[:cntrl:]])|(($1 ne "\t") ? quot_cec($1) : $1)|eg;

	return $str;
}
1487
# Escape a filename for output as HTML text: like esc_html(), except
# that every control character, tab included, is made visible via
# quot_cec().
sub esc_path {
	my ($str, %opts) = @_;

	defined $str
		or return undef;

	$str = $cgi->escapeHTML(to_utf8($str));
	$str =~ s/ /&nbsp;/g
		if $opts{'-nbsp'};
	$str =~ s|([[:cntrl:]])|quot_cec($1)|eg;

	return $str;
}
1503
# Make control characters "printable", using character escape codes (CEC).
#   $cntrl  - the single control character to represent
# Options:
#   -nohtml => true   return the bare escape code instead of wrapping it
#                     in <span class="cntrl">
# Characters with a well-known C escape use it (e.g. '\n'); all others are
# shown as a backslash followed by their two-digit, zero-padded hex code.
sub quot_cec {
        my $cntrl = shift;
        my %opts = @_;
        my %es = ( # character escape codes, aka escape sequences
                "\t" => '\t',   # tab             (HT)
                "\n" => '\n',   # line feed       (LF)
                "\r" => '\r',   # carriage return (CR)
                "\f" => '\f',   # form feed       (FF)
                "\b" => '\b',   # backspace       (BS)
                "\a" => '\a',   # alarm (bell)    (BEL)
                "\e" => '\e',   # escape          (ESC)
                "\013" => '\v', # vertical tab    (VT)
                "\000" => '\0', # nul character   (NUL)
        );
        # %02x, not %2x: space padding would turn chr(1) into "\ 1"
        my $chr = ( (exists $es{$cntrl})
                    ? $es{$cntrl}
                    : sprintf('\%02x', ord($cntrl)) );
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1528
# Alternatively use unicode control pictures codepoints,
# Unicode "printable representation" (PR).
#   $cntrl  - the single control character to represent
# Options:
#   -nohtml => true   return the bare numeric character reference instead
#                     of wrapping it in <span class="cntrl">
sub quot_upr {
        my $cntrl = shift;
        my %opts = @_;

        # The pictures for the C0 controls sit at U+2400 + code, but DELETE
        # (0x7f) has its picture at U+2421; U+2400 + 0x7f is an unrelated
        # character.
        my $code = ord($cntrl);
        my $picture = ($code == 0x7f) ? 0x2421 : 0x2400 + $code;

        my $chr = sprintf('&#%04d;', $picture);
        if ($opts{-nohtml}) {
                return $chr;
        } else {
                return "<span class=\"cntrl\">$chr</span>";
        }
}
1542
# git may return quoted and escaped filenames

# Helper for unquote(): translate the text that followed one backslash.
# One to three octal digits give the character with that code, a known
# letter gives the matching C escape, anything else stands for itself.
sub unq {
        my $seq = shift;
        my %es = ( # character escape codes, aka escape sequences
                't' => "\t",   # tab            (HT, TAB)
                'n' => "\n",   # newline        (NL)
                'r' => "\r",   # return         (CR)
                'f' => "\f",   # form feed      (FF)
                'b' => "\b",   # backspace      (BS)
                'a' => "\a",   # alarm (bell)   (BEL)
                'e' => "\e",   # escape         (ESC)
                'v' => "\013", # vertical tab   (VT)
        );

        # octal char sequence
        return chr(oct($seq)) if $seq =~ m/^[0-7]{1,3}$/;

        # C escape sequence if known, otherwise a quoted ordinary character
        return exists $es{$seq} ? $es{$seq} : $seq;
}

# Undo the quoting of a filename: a name wrapped in double quotes loses
# the quotes and has its backslash escapes expanded; any other name is
# returned unchanged.
sub unquote {
        my $str = shift;

        # nothing to do unless the whole name is enclosed in double quotes
        return $str unless $str =~ m/^"(.*)"$/;

        my $inner = $1;
        $inner =~ s/\\([^0-7]|[0-7]{1,3})/unq($1)/eg;
        return $inner;
}
1578
# Expand tabs: every TAB is replaced by as many spaces as it takes to
# reach the next multiple-of-8 column.  Tabs are handled left to right so
# that columns are computed on the already expanded text.
sub untabify {
        my ($text) = @_;

        my $tab_at;
        while (($tab_at = index($text, "\t")) >= 0) {
                # always between 1 and 8 spaces
                substr($text, $tab_at, 1, ' ' x (8 - $tab_at % 8));
        }

        return $text;
}
1592
# Tell whether $project is one of the projects returned by
# git_get_projects_list(), comparing against each entry's 'path'.
# Returns the number of matching entries (0 when the list is empty).
sub project_in_list {
        my ($wanted) = @_;
        my @projects = git_get_projects_list();
        return 0 unless @projects;

        my $matches = grep { $_->{'path'} eq $wanted } @projects;
        return $matches;
}
1598
1599 ## ----------------------------------------------------------------------
1600 ## HTML aware string manipulation
1601
# Try to chop given string on a word boundary between position
# $len and $len+$add_len. If there is no word boundary there,
# chop at $len+$add_len. Do not chop if chopped part plus ellipsis
# (marking chopped part) would be longer than given string.
#
#   $str     - string to shorten (passed through to_utf8() first)
#   $len     - number of characters to keep
#   $add_len - extra word characters allowed to avoid cutting a word
#              (defaults to 10; a false value also selects the default)
#   $where   - 'left' | 'center' | 'right' (default): the side on which
#              the string is cut
# Returns the shortened string, or the (to_utf8'ed) string itself when it
# is short enough or cannot be split by the patterns below.
sub chop_str {
        my $str = shift;
        my $len = shift;
        my $add_len = shift || 10;
        my $where = shift || 'right'; # 'left' | 'center' | 'right'

        # Make sure perl knows it is utf8 encoded so we don't
        # cut in the middle of a utf8 multibyte char.
        $str = to_utf8($str);

        # when chopping in the middle, distribute $len into left and right part
        # return early if chopping wouldn't make string shorter
        if ($where eq 'center') {
                return $str if ($len + 5 >= length($str)); # filler is length 5
                $len = int($len/2);
        } else {
                return $str if ($len + 4 >= length($str)); # filler is length 4
        }

        # regexps: ending and beginning with word part up to $add_len
        my $endre = qr/.{$len}\w{0,$add_len}/;
        my $begre = qr/\w{0,$add_len}.{$len}/;

        # Every match below is checked.  After a failed match $1 and $2
        # still hold the captures of the previous successful match, which
        # in 'center' mode used to produce a result longer than the input;
        # in that case the string is now returned unchopped.
        if ($where eq 'left') {
                my ($lead, $body) = $str =~ m/^(.*?)($begre)$/
                        or return $str;
                if (length($lead) > 4) {
                        $lead = " ...";
                }
                return "$lead$body";

        } elsif ($where eq 'center') {
                my ($left, $rest) = $str =~ m/^($endre)(.*)$/
                        or return $str;
                my ($mid, $right) = $rest =~ m/^(.*?)($begre)$/
                        or return $str;
                if (length($mid) > 5) {
                        $mid = " ... ";
                }
                return "$left$mid$right";

        } else {
                my ($body, $tail) = $str =~ m/^($endre)(.*)$/
                        or return $str;
                if (length($tail) > 4) {
                        $tail = "... ";
                }
                return "$body$tail";
        }
}
1661
# Shorten and HTML-escape a string.  Takes the same arguments as chop_str.
# When chopping changed the string, the escaped result is wrapped in a
# <span> whose title attribute carries the full string (with control
# characters replaced by '?'); otherwise only the escaped string is
# returned.
sub chop_and_escape_str {
        my $full = $_[0];

        my $short = chop_str(@_);
        return esc_html($short) if $short eq $full;

        $full =~ s/[[:cntrl:]]/?/g;
        return $cgi->span({-title=>$full}, esc_html($short));
}
1676
1677 ## ----------------------------------------------------------------------
1678 ## functions returning short strings
1679
# Map an age (in seconds) to a CSS class name:
#   undefined age       -> "noage"
#   less than 2 hours   -> "age0"
#   less than 2 days    -> "age1"
#   anything older      -> "age2"
sub age_class {
        my ($age) = @_;

        return "noage" unless defined $age;
        return "age0"  if $age < 60*60*2;
        return "age1"  if $age < 60*60*24*2;
        return "age2";
}
1694
# Convert an age in seconds to a human readable "nn units ago" string.
# The largest unit of which the age holds more than two is used (years,
# months, weeks, days, hours, min, sec); ages of two seconds or less give
# " right now" (with the leading space).
sub age_string {
        my ($age) = @_;

        return int($age/60/60/24/365) . " years ago"
                if $age > 60*60*24*365*2;
        return int($age/60/60/24/(365/12)) . " months ago"
                if $age > 60*60*24*(365/12)*2;
        return int($age/60/60/24/7) . " weeks ago"
                if $age > 60*60*24*7*2;
        return int($age/60/60/24) . " days ago"
                if $age > 60*60*24*2;
        return int($age/60/60) . " hours ago"
                if $age > 60*60*2;
        return int($age/60) . " min ago"
                if $age > 60*2;
        return int($age) . " sec ago"
                if $age > 2;

        return " right now";
}
1726
# Extra file type values used next to the S_IF* constants that come
# from Fcntl.
use constant S_IFINVALID => 0030000;
use constant S_IFGITLINK => 0160000;

# Test whether the file type bits of $mode denote a gitlink, i.e. a
# submodule/subproject, a commit object reference.
sub S_ISGITLINK {
        my ($mode) = @_;

        my $is_gitlink = (($mode & S_IFMT) == S_IFGITLINK);
        return $is_gitlink;
}
1738
# Convert a file mode given as an octal string into a symbolic, ls-like
# mode string.  Only the file type and, for regular files, the owner
# executable bit decide the result; unrecognised types give '----------'.
sub mode_str {
        my $mode = oct shift;

        return 'm---------' if S_ISGITLINK($mode);
        return 'drwxr-xr-x' if S_ISDIR($mode & S_IFMT);
        return 'lrwxrwxrwx' if S_ISLNK($mode);
        return '----------' unless S_ISREG($mode);

        # regular file: git cares only about the executable bit
        return ($mode & S_IXUSR) ? '-rwxr-xr-x' : '-rw-r--r--';
}
1760
# Convert a file mode given as an octal string into a file type string:
# "submodule", "directory", "symlink", "file" or "unknown".
# An argument that is not made of octal digits only is returned unchanged.
sub file_type {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT);
        return "symlink"   if S_ISLNK($mode);
        return "file"      if S_ISREG($mode);
        return "unknown";
}
1783
# Convert a file mode given as an octal string into a file type
# description: "submodule", "directory", "symlink", "executable" (regular
# file with the owner executable bit), "file" or "unknown".
# An argument that is not made of octal digits only is returned unchanged.
sub file_type_long {
        my ($mode) = @_;

        return $mode if $mode !~ m/^[0-7]+$/;
        $mode = oct $mode;

        return "submodule" if S_ISGITLINK($mode);
        return "directory" if S_ISDIR($mode & S_IFMT);
        return "symlink"   if S_ISLNK($mode);
        return "unknown"   unless S_ISREG($mode);

        return ($mode & S_IXUSR) ? "executable" : "file";
}
1810
1811
1812 ## ----------------------------------------------------------------------
1813 ## functions returning short HTML fragments, or transforming HTML fragments
1814 ## which don't belong to other sections
1815
# Format one line of a commit message as HTML: the line is escaped (with
# spaces turned into &nbsp;) and every word of 8 to 40 hex digits becomes
# a link to the "object" action for that hash.
sub format_log_line_html {
        my ($raw) = @_;

        my $html = esc_html($raw, -nbsp=>1);
        $html =~ s{\b([0-9a-fA-F]{8,40})\b}{
                $cgi->a({-href => href(action=>"object", hash=>$1),
                                        -class => "text"}, $1);
        }eg;

        return $html;
}
1828
# format marker of refs pointing to given object
#
#   $refs - hash mapping an object id to an array of ref names, such as
#           "tags/v2.6.11" or "heads/next"; a trailing "^{}" marks an
#           indirect ref
#   $id   - id of the object to format the markers for
# Returns an HTML fragment (' <span class="refs">...</span>'), or the
# empty string when no ref points to $id.
#
# the destination action is chosen based on object type and current context:
# - for annotated tags, we choose the tag view unless it's the current view
#   already, in which case we go to shortlog view
# - for other refs, we keep the current view if we're in history, shortlog or
#   log view, and select shortlog otherwise
sub format_ref_marker {
        my ($refs, $id) = @_;
        my $markers = '';

        if (defined $refs->{$id}) {
                foreach my $stored_ref (@{$refs->{$id}}) {
                        # Work on a copy: the loop variable aliases the element
                        # of the caller's array, so stripping "^{}" in place
                        # would make the ref look direct on any later call.
                        my $ref = $stored_ref;

                        # this code exploits the fact that non-lightweight tags are the
                        # only indirect objects, and that they are the only objects for which
                        # we want to use tag instead of shortlog as action
                        my $indirect = ($ref =~ s/\^\{\}$//);

                        # e.g. tags/v2.6.11 or heads/next
                        my ($type, $name);
                        if ($ref =~ m!^(.*?)s?/(.*)$!) {
                                ($type, $name) = ($1, $2);
                        } else {
                                ($type, $name) = ("ref", $ref);
                        }

                        my $class = $type;
                        $class .= " indirect" if $indirect;

                        my $dest_action = "shortlog";

                        if ($indirect) {
                                $dest_action = "tag" unless $action eq "tag";
                        } elsif ($action =~ /^(history|(short)?log)$/) {
                                $dest_action = $action;
                        }

                        my $dest = "";
                        $dest .= "refs/" unless $ref =~ m!^refs/!;
                        $dest .= $ref;

                        # the name is escaped here because it is used as the
                        # link text, i.e. as HTML content
                        my $link = $cgi->a({
                                -href => href(
                                        action=>$dest_action,
                                        hash=>$dest
                                )}, esc_html($name));

                        $markers .= " <span class=\"".esc_attr($class)."\" title=\"".esc_attr($ref)."\">" .
                                $link . "</span>";
                }
        }

        if ($markers) {
                return ' <span class="refs">'. $markers . '</span>';
        } else {
                return "";
        }
}
1888
# Format a title line as a link to $href, followed by $extra (e.g. ref
# markers; defaults to the empty string).  When $short is shorter than
# $long, the short form is shown and the long form, with control
# characters replaced by '?', goes into the link's title attribute;
# otherwise the long form is shown.
sub format_subject_html {
        my ($long, $short, $href, $extra) = @_;
        $extra = '' unless defined($extra);

        my @attrs = (-href => $href, -class => "list subject");
        my $shown = $long;

        if (length($short) < length($long)) {
                $long =~ s/[[:cntrl:]]/?/g;
                push @attrs, -title => to_utf8($long);
                $shown = $short;
        }

        return $cgi->a(+{ @attrs }, esc_html($shown)) . $extra;
}
1904
# Avatar URLs are cached after they have been computed once for an email,
# instead of being recomputed on every use. This gives a visible benefit
# in views where the avatar for the same email is used repeatedly (e.g.
# shortlog).
# The cache is shared by all avatar engines, which are free to use it as
# preferred. Since only one avatar engine is used for any given page,
# there's no risk for cache conflicts.
our %avatar_cache = ();

# Compute the picon url for a given email, by using the picon search service over at
# http://www.cs.indiana.edu/picons/search.html
# The email is lowercased before it is split at '@' and looked up in
# the cache.
sub picon_url {
        my $email = lc shift;

        return $avatar_cache{$email} ||= do {
                my ($user, $domain) = split('@', $email);
                "http://www.cs.indiana.edu/cgi-pub/kinzler/piconsearch.cgi/" .
                "$domain/$user/" .
                "users+domains+unknown/up/single";
        };
}
1926
# Compute the gravatar url for a given (lowercased) email and size.
# Only the part of the URL before the size is kept in %avatar_cache, since
# that's the one computationally more expensive. This also allows reuse of
# the cache for different sizes (for this particular engine).
sub gravatar_url {
        my ($email, $size) = @_;
        $email = lc $email;

        if (!$avatar_cache{$email}) {
                $avatar_cache{$email} =
                        "http://www.gravatar.com/avatar/" .
                        Digest::MD5::md5_hex($email) . "?s=";
        }

        return $avatar_cache{$email} . $size;
}
1939
# Build the <img> element showing the avatar for $email, if the avatar
# feature is enabled.
# Options:
#   -size       => key into %avatar_size (falls back to 'default')
#   -pad_before => true to put a &nbsp; in front of the image
#   -pad_after  => true to put a &nbsp; behind the image
# Returns the empty string when no avatar provider yields a URL.
sub git_get_avatar {
        my ($email, %opts) = @_;

        my $size_name = $opts{-size} || 'default';
        my $size = $avatar_size{$size_name} || $avatar_size{'default'};

        # Other providers can be added by extending this chain. If no
        # variant puts something in $url, we assume avatars are completely
        # disabled/unavailable.
        my $url = $git_avatar eq 'gravatar' ? gravatar_url($email, $size)
                : $git_avatar eq 'picon'    ? picon_url($email)
                :                             "";
        return "" unless $url;

        my $pre_white  = $opts{-pad_before} ? "&nbsp;" : "";
        my $post_white = $opts{-pad_after}  ? "&nbsp;" : "";

        return $pre_white .
               qq{<img width="$size" class="avatar" src="} . esc_url($url) .
               qq{" alt="" />} .
               $post_white;
}
1968
# Wrap $displaytext in a link that searches for commits by $author.
#   $author      - name to search for
#   $searchtype  - 'author' or 'committer'; selects the search type and
#                  the wording of the link title
#   $displaytext - HTML to show
# When the 'search' feature is not enabled, $displaytext is returned as is.
sub format_search_author {
        my ($author, $searchtype, $displaytext) = @_;
        my $have_search = gitweb_check_feature('search');

        return $displaytext unless $have_search;

        my $performed = $searchtype eq 'author'    ? "authored"
                      : $searchtype eq 'committer' ? "committed"
                      :                              "";

        return $cgi->a({-href => href(action=>"search", hash=>$hash,
                        searchtext=>$author,
                        searchtype=>$searchtype), class=>"list",
                        title=>"Search for commits $performed by $author"},
                        $displaytext);
}
1991
# Format the author name of the commit $co inside an element named $tag
# with class "author".  The name is chopped and escaped according to the
# remaining, optional parameters (see chop_str), preceded by the author's
# avatar and wrapped in an author search link.
sub format_author_html {
        my ($tag, $co, @chop_args) = @_;

        my $name_html = chop_and_escape_str($co->{'author_name'}, @chop_args);
        my $avatar    = git_get_avatar($co->{'author_email'}, -pad_after => 1);
        my $link      = format_search_author($co->{'author_name'}, "author",
                                             $avatar . $name_html);

        return "<$tag class=\"author\">" . $link . "</$tag>";
}
2005
# Format a git diff header line, i.e. "diff --(git|combined|cc) ...".
# The file names at the end of the line are replaced by escaped names,
# linked to $from->{'href'} / $to->{'href'} where those are set.
# A true $diffinfo->{'nparents'} selects the combined diff form, which
# shows only the "to" file.
sub format_git_diff_header_line {
        my ($line, $diffinfo, $from, $to) = @_;

        # link the label when the side has a target, else leave it plain
        # (no href: the file was added resp. deleted)
        my $linked = sub {
                my ($side, $label) = @_;
                return $side->{'href'}
                        ? $cgi->a({-href => $side->{'href'}, -class => "path"},
                                  $label)
                        : $label;
        };

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $line =~ s!^(diff (.*?) )"?.*$!$1!;
                $line .= $linked->($to, esc_path($to->{'file'}));
        } else {
                # "ordinary" diff
                $line =~ s!^(diff (.*?) )"?a/.*$!$1!;
                $line .= $linked->($from, 'a/' . esc_path($from->{'file'}));
                $line .= ' ';
                $line .= $linked->($to, 'b/' . esc_path($to->{'file'}));
        }

        return "<div class=\"diff header\">$line</div>\n";
}
2041
# Format an extended diff header line (the lines before the patch itself)
# as HTML.
#   $line     - the raw header line
#   $diffinfo - diff info hash; 'nparents', 'from_id' and 'to_id' are read
#   $from/$to - hashes with the 'href' and 'file' of each side; in the
#               combined diff "index" case $from->{'href'} and
#               $diffinfo->{'from_id'} are indexed per parent
# Returns the formatted line followed by "<br/>\n".
sub format_extended_diff_header_line {
        my $line = shift;
        my $diffinfo = shift;
        my ($from, $to) = @_;

        # match <path>
        if ($line =~ s!^((copy|rename) from ).*$!$1! && $from->{'href'}) {
                $line .= $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                       esc_path($from->{'file'}));
        }
        if ($line =~ s!^((copy|rename) to ).*$!$1! && $to->{'href'}) {
                $line .= $cgi->a({-href=>$to->{'href'}, -class=>"path"},
                                 esc_path($to->{'file'}));
        }
        # match single <mode>
        if ($line =~ m/\s(\d{6})$/) {
                $line .= '<span class="info"> (' .
                         file_type_long($1) .
                         ')</span>';
        }
        # match <hash>
        if ($line =~ m/^index [0-9a-fA-F]{40},[0-9a-fA-F]{40}/) {
                # can match only for combined diff
                $line = 'index ';
                for (my $i = 0; $i < $diffinfo->{'nparents'}; $i++) {
                        if ($from->{'href'}[$i]) {
                                $line .= $cgi->a({-href=>$from->{'href'}[$i],
                                                  -class=>"hash"},
                                                 substr($diffinfo->{'from_id'}[$i],0,7));
                        } else {
                                $line .= '0' x 7;
                        }
                        # separator
                        $line .= ',' if ($i < $diffinfo->{'nparents'} - 1);
                }
                $line .= '..';
                if ($to->{'href'}) {
                        $line .= $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                         substr($diffinfo->{'to_id'},0,7));
                } else {
                        $line .= '0' x 7;
                }

        } elsif ($line =~ m/^index [0-9a-fA-F]{40}\.\.[0-9a-fA-F]{40}/) {
                # can match only for ordinary diff; the dots are escaped so
                # that only a literal ".." between the two ids is accepted
                my ($from_link, $to_link);
                if ($from->{'href'}) {
                        $from_link = $cgi->a({-href=>$from->{'href'}, -class=>"hash"},
                                             substr($diffinfo->{'from_id'},0,7));
                } else {
                        $from_link = '0' x 7;
                }
                if ($to->{'href'}) {
                        $to_link = $cgi->a({-href=>$to->{'href'}, -class=>"hash"},
                                           substr($diffinfo->{'to_id'},0,7));
                } else {
                        $to_link = '0' x 7;
                }
                my ($from_id, $to_id) = ($diffinfo->{'from_id'}, $diffinfo->{'to_id'});
                # \Q..\E: the ids are data, not patterns
                $line =~ s!\Q$from_id\E\.\.\Q$to_id\E!$from_link..$to_link!;
        }

        return $line . "<br/>\n";
}
2107
# Format the from-file/to-file diff header ("--- ..." and "+++ ..." lines).
#   $from_line, $to_line - the raw "---" and "+++" lines
#   $diffinfo            - diff info hash; a true 'nparents' selects the
#                          combined diff (merge commit) form
#   $from, $to           - hashes with 'href' and 'file' of each side (per
#                          parent arrays in $from for combined diffs)
#   @parents             - parent commit ids, used for the per-parent
#                          blobdiff links of a combined diff
# Returns the HTML: one "diff from_file" div per from-line followed by one
# "diff to_file" div.  Lines not naming an a/ resp. b/ path (such as
# "--- /dev/null") get no extra formatting.
sub format_diff_from_to_header {
        my ($from_line, $to_line, $diffinfo, $from, $to, @parents) = @_;
        my @rows;

        #assert($from_line =~ m/^---/) if DEBUG;
        if (! $diffinfo->{'nparents'}) {
                # ordinary (single parent) diff
                my $line = $from_line;
                if ($line =~ m!^--- "?a/!) {
                        my $path = esc_path($from->{'file'});
                        $line = '--- a/' .
                                ($from->{'href'}
                                 ? $cgi->a({-href=>$from->{'href'}, -class=>"path"},
                                           $path)
                                 : $path);
                }
                push @rows, qq!<div class="diff from_file">$line</div>\n!;

        } else {
                # combined diff (merge commit): one from-line per parent
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        my $line = '--- /dev/null';
                        if ($from->{'href'}[$i]) {
                                my $diff_link =
                                        $cgi->a({-href=>href(action=>"blobdiff",
                                                             hash_parent=>$diffinfo->{'from_id'}[$i],
                                                             hash_parent_base=>$parents[$i],
                                                             file_parent=>$from->{'file'}[$i],
                                                             hash=>$diffinfo->{'to_id'},
                                                             hash_base=>$hash,
                                                             file_name=>$to->{'file'}),
                                                 -class=>"path",
                                                 -title=>"diff" . ($i+1)},
                                                $i+1);
                                my $file_link =
                                        $cgi->a({-href=>$from->{'href'}[$i], -class=>"path"},
                                                esc_path($from->{'file'}[$i]));
                                $line = '--- ' . $diff_link . '/' . $file_link;
                        }
                        push @rows, qq!<div class="diff from_file">$line</div>\n!;
                }
        }

        #assert($to_line =~ m/^\+\+\+/) if DEBUG;
        my $line = $to_line;
        if ($line =~ m!^\+\+\+ "?b/!) {
                my $path = esc_path($to->{'file'});
                $line = '+++ b/' .
                        ($to->{'href'}
                         ? $cgi->a({-href=>$to->{'href'}, -class=>"path"}, $path)
                         : $path);
        }
        push @rows, qq!<div class="diff to_file">$line</div>\n!;

        return join('', @rows);
}
2173
# Create the note shown for a patch that combined diff simplified away:
# a "diff --cc <file>" header followed by a "Simple merge" line.
# The file name links to its blob view unless is_deleted() reports the
# file as deleted.  Arguments after $diffinfo are accepted and ignored.
sub format_diff_cc_simplified {
        my ($diffinfo) = @_;

        my $path = esc_path($diffinfo->{'to_file'});
        if (!is_deleted($diffinfo)) {
                $path = $cgi->a({-href => href(action=>"blob",
                                               hash_base=>$hash,
                                               hash=>$diffinfo->{'to_id'},
                                               file_name=>$diffinfo->{'to_file'}),
                                 -class => "path"},
                                $path);
        }

        return "<div class=\"diff header\">" .
               "diff --cc " .
               $path .
               "</div>\n" . # class="diff header"
               "<div class=\"diff nodifferences\">" .
               "Simple merge" .
               "</div>\n"; # class="diff nodifferences"
}
2198
2199 # format patch (diff) line (not to be used for diff headers)
2200 sub format_diff_line {
2201         my $line = shift;
2202         my ($from, $to) = @_;
2203         my $diff_class = "";
2204
2205         chomp $line;
2206
2207         if ($from && $to && ref($from->{'href'}) eq "ARRAY") {
2208                 # combined diff
2209                 my $prefix = substr($line, 0, scalar @{$from->{'href'}});
2210                 if ($line =~ m/^\@{3}/) {
2211                         $diff_class = " chunk_header";
2212                 } elsif ($line =~ m/^\\/) {
2213                         $diff_class = " incomplete";
2214                 } elsif ($prefix =~ tr/+/+/) {
2215                         $diff_class = " add";
2216                 } elsif ($prefix =~ tr/-/-/) {
2217                         $diff_class = " rem";
2218                 }
2219         } else {
2220                 # assume ordinary diff
2221                 my $char = substr($line, 0, 1);
2222                 if ($char eq '+') {
2223                         $diff_class = " add";
2224                 } elsif ($char eq '-') {
2225                         $diff_class = " rem";
2226                 } elsif ($char eq '@') {
2227                         $diff_class = " chunk_header";
2228                 } elsif ($char eq "\\") {
2229                         $diff_class = " incomplete";
2230                 }
2231         }
2232         $line = untabify($line);
2233         if ($from && $to && $line =~ m/^\@{2} /) {
2234                 my ($from_text, $from_start, $from_lines, $to_text, $to_start, $to_lines, $section) =
2235                         $line =~ m/^\@{2} (-(\d+)(?:,(\d+))?) (\+(\d+)(?:,(\d+))?) \@{2}(.*)$/;
2236
2237                 $from_lines = 0 unless defined $from_lines;
2238                 $to_lines   = 0 unless defined $to_lines;
2239
2240                 if ($from->{'href'}) {
2241                         $from_text = $cgi->a({-href=>"$from->{'href'}#l$from_start",
2242                                              -class=>"list"}, $from_text);
2243                 }
2244                 if ($to->{'href'}) {
2245                         $to_text   = $cgi->a({-href=>"$to->{'href'}#l$to_start",
2246                                              -class=>"list"}, $to_text);
2247                 }
2248                 $line = "<span class=\"chunk_info\">@@ $from_text $to_text @@</span>" .
2249                         "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
2250                 return "<div class=\"diff$diff_class\">$line</div>\n";
2251         } elsif ($from && $to && $line =~ m/^\@{3}/) {
2252                 my ($prefix, $ranges, $section) = $line =~ m/^(\@+) (.*?) \@+(.*)$/;
2253                 my (@from_text, @from_start, @from_nlines, $to_text, $to_start, $to_nlines);
2254
2255                 @from_text = split(' ', $ranges);
2256                 for (my $i = 0; $i < @from_text; ++$i) {
2257                         ($from_start[$i], $from_nlines[$i]) =
2258                                 (split(',', substr($from_text[$i], 1)), 0);
2259                 }
2260
2261                 $to_text   = pop @from_text;
2262                 $to_start  = pop @from_start;
2263                 $to_nlines = pop @from_nlines;
2264
2265                 $line = "<span class=\"chunk_info\">$prefix ";
2266                 for (my $i = 0; $i < @from_text; ++$i) {
2267                         if ($from->{'href'}[$i]) {
2268                                 $line .= $cgi->a({-href=>"$from->{'href'}[$i]#l$from_start[$i]",
2269                                                   -class=>"list"}, $from_text[$i]);
2270                         } else {
2271                                 $line .= $from_text[$i];
2272                         }
2273                         $line .= " ";
2274                 }
2275                 if ($to->{'href'}) {
2276                         $line .= $cgi->a({-href=>"$to->{'href'}#l$to_start",
2277                                           -class=>"list"}, $to_text);
2278                 } else {
2279                         $line .= $to_text;
2280                 }
2281                 $line .= " $prefix</span>" .
2282                          "<span class=\"section\">" . esc_html($section, -nbsp=>1) . "</span>";
2283                 return "<div class=\"diff$diff_class\">$line</div>\n";
2284         }
2285         return "<div class=\"diff$diff_class\">" . esc_html($line, -nbsp=>1) . "</div>\n";
2286 }
2287
2288 # Generates undef or something like "_snapshot_" or "snapshot (_tbz2_ _zip_)",
2289 # linked.  Pass the hash of the tree/commit to snapshot.
sub format_snapshot_links {
        # $hash: id of the tree/commit the snapshot links should point at.
        # Returns undef when no format is listed in @snapshot_fmts, a single
        # "snapshot" link for one format, or "snapshot (<links>)" for several.
        my ($hash) = @_;

        # href of the snapshot action for one archive format
        my $snapshot_href = sub {
                my ($fmt) = @_;
                return href(
                        action=>"snapshot",
                        hash=>$hash,
                        snapshot_format=>$fmt
                );
        };

        # no formats at all: there is nothing to link to
        return undef unless @snapshot_fmts;

        if (@snapshot_fmts == 1) {
                # A single "snapshot" link whose tooltip bears the format name.
                # i.e. "_snapshot_"
                my $only = $snapshot_fmts[0];
                return
                        $cgi->a({
                                -href => $snapshot_href->($only),
                                -title => "in format: $known_snapshot_formats{$only}{'display'}"
                        }, "snapshot");
        }

        # A parenthesized list of links bearing format names.
        # e.g. "snapshot (_tar.gz_ _zip_)"
        my @links = map {
                $cgi->a({ -href => $snapshot_href->($_) },
                        $known_snapshot_formats{$_}{'display'})
        } @snapshot_fmts;
        return "snapshot (" . join(' ', @links) . ")";
}
2322
2323 ## ......................................................................
2324 ## functions returning values to be passed, perhaps after some
2325 ## transformation, to other functions; e.g. returning arguments to href()
2326
2327 # returns hash to be passed to href to generate gitweb URL
2328 # in -title key it returns description of link
sub get_feed_info {
        # Optional argument: feed format name (defaults to 'Atom'); its
        # lowercased form becomes the 'action' of the returned hash.
        # Returns nothing when no feed applies to the current view.
        my $format = shift || 'Atom';

        # feed links are possible only for project views
        return unless (defined $project);
        # some views should link to OPML, or to generic project feed,
        # or don't have specific feed yet (so they should use generic)
        return if ($action =~ /^(?:tags|heads|forks|tag|search)$/x);

        # branches refs uses 'refs/heads/' prefix (fullname) to differentiate
        # from tag links; $hash_base is consulted before $hash
        my $branch;
        foreach my $ref ($hash_base, $hash) {
                next unless defined $ref;
                if ($ref =~ m!^refs/heads/(.*)$!) {
                        $branch = $1;
                        last;
                }
        }

        # find log type for feed description (title)
        my $title;
        if (defined $file_name) {
                $title  = "history of $file_name";
                $title .= "/" if ($action eq 'tree');
                $title .= " on '$branch'" if (defined $branch);
        } elsif (defined $branch) {
                $title = "log of $branch";
        } else {
                $title = 'log';
        }

        my %res = (
                'action'    => lc($format),
                '-title'    => $title,
                'hash'      => (defined $branch ? "refs/heads/$branch" : undef),
                'file_name' => $file_name,
        );

        return %res;
}
2362
2363 ## ----------------------------------------------------------------------
2364 ## git utility subroutines, invoking git commands
2365
2366 # returns path to the core git executable and the --git-dir parameter as list
sub git_cmd {
        # Each call bumps the global counter of git invocations, then hands
        # back the executable plus the --git-dir option built from $git_dir.
        $number_of_git_cmds += 1;
        return ($GIT, "--git-dir=$git_dir");
}
2371
2372 # quote the given arguments for passing them to the shell
2373 # quote_command("command", "arg 1", "arg with ' and ! characters")
2374 # => "'command' 'arg 1' 'arg with '\'' and '\!' characters'"
2375 # Try to avoid using this function wherever possible.
sub quote_command {
        # Wraps every argument in single quotes; embedded ' and ! are
        # replaced by '\'' and '\!' respectively.  The quoted words are
        # joined with single spaces.
        my @quoted;
        foreach my $word (@_) {
                (my $escaped = $word) =~ s/(['!])/'\\$1'/g;
                push @quoted, "'$escaped'";
        }
        return join(' ', @quoted);
}
2380
2381 # get HEAD ref of given project as hash
sub git_get_head_hash {
        # Resolves 'HEAD' in the given project via git_get_full_hash().
        my ($project) = @_;
        return git_get_full_hash($project, 'HEAD');
}
2385
sub git_get_full_hash {
        # Forwards all arguments unchanged to git_get_hash().
        my @args = @_;
        return git_get_hash(@args);
}
2389
sub git_get_short_hash {
        # Same as git_get_hash(), with '--short=7' appended to the arguments.
        my @args = (@_, '--short=7');
        return git_get_hash(@args);
}
2393
sub git_get_hash {
        # Runs 'rev-parse --verify -q' on $hash inside $project and returns
        # the first output line (chomped), or undef when nothing was read.
        # @options are inserted before $hash on the command line.
        my ($project, $hash, @options) = @_;

        # point $git_dir at the requested project for the duration of the call
        my $saved_git_dir = $git_dir;
        $git_dir = "$projectroot/$project";

        my $result;
        my @cmd = (git_cmd(), 'rev-parse', '--verify', '-q', @options, $hash);
        if (open my $fd, '-|', @cmd) {
                $result = <$fd>;
                chomp $result if defined $result;
                close $fd;
        }

        # the previous $git_dir is put back only if there was one
        $git_dir = $saved_git_dir if defined $saved_git_dir;

        return $result;
}
2410
2411 # get type of given object
sub git_get_type {
        # Asks 'cat-file -t' for the type of object $hash; returns nothing
        # if the command cannot be started or closing the pipe fails.
        my ($hash) = @_;

        my @cmd = (git_cmd(), "cat-file", '-t', $hash);
        open(my $fd, "-|", @cmd) or return;
        my $type = <$fd>;
        return unless close $fd;

        chomp $type;
        return $type;
}
2421
2422 # repository configuration
2423 our $config_file = '';
2424 our %config;
2425
2426 # store multiple values for single key as anonymous array reference
2427 # single values stored directly in the hash, not as [ <value> ]
sub hash_set_multi {
        # $hash is a hash reference updated in place: the first value for
        # $key is stored as-is, a second one turns the slot into an array
        # reference, and later ones are appended to that array.
        my ($hash, $key, $value) = @_;

        if (exists $hash->{$key}) {
                if (ref $hash->{$key}) {
                        push @{$hash->{$key}}, $value;
                } else {
                        $hash->{$key} = [ $hash->{$key}, $value ];
                }
        } else {
                $hash->{$key} = $value;
        }
}
2439
2440 # return hash of git project configuration
2441 # optionally limited to some section, e.g. 'gitweb'
sub git_parse_project_config {
        # $section_regexp (optional): regexp fragment; only keys starting
        # with "<section>." are kept.  Without it every key is returned.
        # Returns the configuration as a hash (multi-valued keys are stored
        # as array references by hash_set_multi), or nothing if the
        # 'config -z -l' command cannot be started.
        my $section_regexp = shift;
        my %config;

        # 'config -z' terminates each entry with NUL
        local $/ = "\0";

        # Compile the filter once per call.  The previous /o modifier froze
        # the first pattern for the lifetime of the process, so a later call
        # with a different section would silently reuse the stale one.
        my $key_filter = defined $section_regexp
                ? qr/^(?:$section_regexp)\./
                : undef;

        open my $fh, "-|", git_cmd(), "config", '-z', '-l'
                or return;

        while (my $keyval = <$fh>) {
                chomp $keyval;
                # key and value are separated by the first newline;
                # a key without a value yields an undefined $value
                my ($key, $value) = split(/\n/, $keyval, 2);

                next if (defined $key_filter && $key !~ $key_filter);
                hash_set_multi(\%config, $key, $value);
        }
        close $fh;

        return %config;
}
2462
2463 # convert config value to boolean: 'true' or 'false'
2464 # no value, number > 0, 'true' and 'yes' values are true
2465 # rest of values are treated as false (never as error)
sub config_to_bool {
        # An undefined value (key present without a value) counts as true.
        # Otherwise surrounding whitespace is ignored, and the value is true
        # when it is a non-zero run of digits or 'true'/'yes' in any case.
        my ($val) = @_;

        return 1 unless defined $val;          # section.key

        # strip leading and trailing whitespace
        for ($val) {
                s/^\s+//;
                s/\s+$//;
        }

        # section.key = 1
        return $val if ($val =~ /^\d+$/ && $val);
        # section.key = true
        return ($val =~ /^(?:true|yes)$/i);
}
2478
2479 # convert config value to simple decimal number
2480 # an optional value suffix of 'k', 'm', or 'g' will cause the value
2481 # to be multiplied by 1024, 1048576, or 1073741824
sub config_to_int {
        # Converts a config value to a number: a trailing 'k', 'm' or 'g'
        # (any case) multiplies the leading digits by 1024, 1048576 or
        # 1073741824.  Values not of that form are returned with only the
        # surrounding whitespace removed.  An undefined value (key without
        # a value) is returned as undef instead of triggering warnings.
        my $val = shift;

        return $val unless defined $val;

        # strip leading and trailing whitespace
        $val =~ s/^\s+//;
        $val =~ s/\s+$//;

        my %multiplier = (
                'k' => 1024,
                'm' => 1048576,
                'g' => 1073741824,
        );

        if (my ($num, $unit) = ($val =~ /^([0-9]*)([kmg])$/i)) {
                # a bare unit such as "k" has no digits; count it as 0
                # explicitly rather than multiplying an empty string
                $num = 0 if $num eq '';
                return $num * $multiplier{lc($unit)};
        }
        return $val;
}
2498
2499 # convert config value to array reference, if needed
sub config_to_multi {
        # References are passed through untouched; a defined plain value is
        # wrapped in a one-element array; undef becomes an empty array.
        my ($val) = @_;

        return $val     if ref($val);
        return [ $val ] if defined($val);
        return [];
}
2505
sub git_get_project_config {
        # $key:  name of a gitweb.* variable (a leading "gitweb." is optional)
        # $type: optional 'bool' or 'int' (a leading "--" is accepted);
        #        anything else is treated as "no type".
        # Returns nothing when $git_dir is unset, the key is empty or not a
        # plain word, or the variable does not exist in the project config.
        my ($key, $type) = @_;

        return unless defined $git_dir;

        # key sanity check
        return unless ($key);
        $key =~ s/^gitweb\.//;
        return if ($key =~ m/\W/);

        # type sanity check
        if (defined $type) {
                $type =~ s/^--//;
                undef $type
                        if ($type ne 'bool' && $type ne 'int');
        }

        # (re)load the cached %config when it belongs to another repository
        my $wanted_file = "$git_dir/config";
        unless (defined $config_file && $config_file eq $wanted_file) {
                %config = git_parse_project_config('gitweb');
                $config_file = $wanted_file;
        }

        # check if config variable (key) exists
        my $name = "gitweb.$key";
        return unless exists $config{$name};

        # ensure given type
        my $raw = $config{$name};
        if (defined $type) {
                if ($type eq 'bool') {
                        # backward compatibility: 'git config --bool' returns true/false
                        return (config_to_bool($raw) ? 'true' : 'false');
                }
                if ($type eq 'int') {
                        return config_to_int($raw);
                }
        }
        return $raw;
}
2544
2545 # get hash of given path at given ref
sub git_get_hash_by_path {
        # $base: tree-ish passed to 'ls-tree'
        # $path: path to look up (trailing slashes are ignored)
        # $type: optional object type the entry must have
        # Returns the object id of the entry, or undef when $path is empty,
        # the entry is missing, its line cannot be parsed, or the type
        # differs.  Dies via die_error() if 'ls-tree' cannot be started.
        my $base = shift;
        my $path = shift || return undef;
        my $type = shift;

        $path =~ s,/+$,,;

        open my $fd, "-|", git_cmd(), "ls-tree", $base, "--", $path
                or die_error(500, "Open git-ls-tree failed");
        my $line = <$fd>;
        close $fd or return undef;

        if (!defined $line) {
                # there is no tree or hash given by $path at $base
                return undef;
        }

        #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
        # Capture into lexicals and check the match: reading $2/$3 after a
        # failed match would pick up stale captures from an earlier regex.
        my ($entry_type, $entry_hash) =
                $line =~ m/^[0-9]+ (.+) ([0-9a-fA-F]{40})\t/
                or return undef;

        if (defined $type && $type ne $entry_type) {
                # type doesn't match
                return undef;
        }
        return $entry_hash;
}
2571
2572 # get path of entry with given hash at given tree-ish (ref)
2573 # used to get 'from' filename for combined diff (merge commit) for renames
sub git_get_path_by_hash {
        # $base: tree-ish to list recursively
        # $hash: object id to look for
        # Returns the path of the first entry in 'ls-tree -r -t -z' output
        # whose object id is $hash; nothing when an argument is missing,
        # undef when the command cannot be started or no entry matches.
        my $base = shift || return;
        my $hash = shift || return;

        # 'ls-tree -z' terminates entries with NUL
        local $/ = "\0";

        open my $fd, "-|", git_cmd(), "ls-tree", '-r', '-t', '-z', $base
                or return undef;
        while (my $line = <$fd>) {
                chomp $line;

                #'040000 tree 595596a6a9117ddba9fe379b6b012b558bac8423  gitweb'
                #'100644 blob e02e90f0429be0d2a69b76571101f20b8f75530f  gitweb/README'
                # The pattern is anchored to the record layout and $hash is
                # quoted so it is matched literally; /s lets the path part
                # contain newlines, which -z output does not escape.
                if ($line =~ m/^[0-9]+ \S+ \Q$hash\E\t(.+)$/s) {
                        close $fd;
                        return $1;
                }
        }
        close $fd;
        return undef;
}
2595
2596 ## ......................................................................
2597 ## git utility functions, directly accessing git repository
2598
2599 # get the value of config variable either from file named as the variable
2600 # itself in the repository ($GIT_DIR/$name file), or from gitweb.$name
2601 # configuration variable in the repository config file.
sub git_get_file_or_project_config {
        # $path: project path below $projectroot (also sets global $git_dir)
        # $name: file name inside the repository / gitweb.$name variable
        # Returns the first line of the file (chomped) when it can be
        # opened, otherwise whatever git_get_project_config($name) returns.
        my ($path, $name) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/$name") {
                return git_get_project_config($name);
        }
        my $conf = <$fd>;
        close $fd;

        chomp $conf if defined $conf;
        return $conf;
}
2615
sub git_get_project_description {
        # Looks up 'description' through git_get_file_or_project_config().
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'description');
}
2620
sub git_get_project_category {
        # Looks up 'category' through git_get_file_or_project_config().
        my ($path) = @_;
        return git_get_file_or_project_config($path, 'category');
}
2625
2626
2627 # supported formats:
2628 # * $GIT_DIR/ctags/<tagname> file (in 'ctags' subdirectory)
2629 #   - if its contents is a number, use it as tag weight,
2630 #   - otherwise add a tag with weight 1
2631 # * $GIT_DIR/ctags file, each line is a tag (with weight 1)
2632 #   the same value multiple times increases tag weight
2633 # * `gitweb.ctag' multi-valued repo config variable
sub git_get_project_ctags {
        # $project: project path below $projectroot (also sets global $git_dir)
        # Returns a hash reference mapping tag name to weight, taken from
        # the first source that is available: the ctags/ directory, the
        # ctags file, or the 'ctag' project config variable.
        my $project = shift;
        my $ctags = {};

        $git_dir = "$projectroot/$project";
        if (opendir my $dh, "$git_dir/ctags") {
                # one file per tag; only plain files are considered
                my @files = grep { -f $_ } map { "$git_dir/ctags/$_" } readdir($dh);
                foreach my $tagfile (@files) {
                        open my $ct, '<', $tagfile
                                or next;
                        my $val = <$ct>;
                        chomp $val if defined $val;
                        close $ct;

                        # tag name is the file's basename
                        (my $ctag = $tagfile) =~ s#.*/##;
                        # an empty file leaves $val undefined; check before
                        # matching so it quietly falls back to weight 1
                        if (defined $val && $val =~ /^\d+$/) {
                                $ctags->{$ctag} = $val;
                        } else {
                                $ctags->{$ctag} = 1;
                        }
                }
                closedir $dh;

        } elsif (open my $fh, '<', "$git_dir/ctags") {
                # one tag per line; repeated lines add up
                while (my $line = <$fh>) {
                        chomp $line;
                        $ctags->{$line}++ if $line;
                }
                close $fh;

        } else {
                my $taglist = config_to_multi(git_get_project_config('ctag'));
                foreach my $tag (@$taglist) {
                        $ctags->{$tag}++;
                }
        }

        return $ctags;
}
2673
2674 # return hash, where keys are content tags ('ctags'),
2675 # and values are sum of weights of given tag in every project
sub git_gather_all_ctags {
        # $projects: array reference of project hashes, each with a 'ctags'
        # hash of tag => weight.  Returns a hash reference with the weights
        # summed per tag over all projects.
        my ($projects) = @_;
        my %total;

        for my $proj (@$projects) {
                $total{$_} += $proj->{'ctags'}->{$_}
                        for keys %{$proj->{'ctags'}};
        }

        return \%total;
}
2688
sub git_populate_project_tagcloud {
        # $ctags: hash reference of tag => weight.
        # Returns an HTML::TagCloud object when that module can be loaded,
        # otherwise a plain hash reference keyed by lowercased tag with
        # 'count' and 'ctag' (ready-made link) entries.
        my $ctags = shift;

        # First, merge different-cased tags; tags vote on casing
        my %ctags_lc;
        foreach my $tag (keys %$ctags) {
                my $weight = $ctags->{$tag};
                my $entry = ($ctags_lc{lc $tag} ||= {});
                $entry->{count} += $weight;
                if (!$entry->{topcount} || $entry->{topcount} < $weight) {
                        $entry->{topcount} = $weight;
                        $entry->{topname} = $tag;
                }
        }

        my $matched = $cgi->param('by_tag');
        # wrap the title of the currently selected tag in a "match" span
        my $highlight = sub {
                my ($ctag, $title) = @_;
                return $title
                        unless (defined $matched && $matched eq $ctag);
                return qq(<span class="match">$title</span>);
        };

        unless (eval { require HTML::TagCloud; 1; }) {
                # fallback: plain hash consumed by git_show_project_tagcloud
                my %plain;
                foreach my $ctag (keys %ctags_lc) {
                        my $title = esc_html($ctags_lc{$ctag}->{topname}, -nbsp=>1);
                        $title = $highlight->($ctag, $title);
                        my $link =
                                $cgi->a({-href=>href(project=>undef, ctag=>$ctag)}, $title);
                        $plain{$ctag}{count} = $ctags_lc{$ctag}->{count};
                        $plain{$ctag}{ctag} = $link;
                }
                return \%plain;
        }

        my $cloud = HTML::TagCloud->new;
        foreach my $ctag (sort keys %ctags_lc) {
                # Pad the title with spaces so that the cloud looks
                # less crammed.
                my $title = esc_html($ctags_lc{$ctag}->{topname});
                $title =~ s/ /&nbsp;/g;
                $title =~ s/^/&nbsp;/g;
                $title =~ s/$/&nbsp;/g;
                $title = $highlight->($ctag, $title);
                $cloud->add($title, href(project=>undef, ctag=>$ctag),
                            $ctags_lc{$ctag}->{count});
        }
        return $cloud;
}
2734
sub git_show_project_tagcloud {
        # $cloud: result of git_populate_project_tagcloud()
        # $count: number of tags to show
        # Returns the HTML of the cloud: delegated to HTML::TagCloud when
        # $cloud is such an object, otherwise a <div> of comma-separated links.
        my ($cloud, $count) = @_;

        return $cloud->html_and_css($count)
                if (ref $cloud eq 'HTML::TagCloud');

        # order by ascending count and keep the first $count entries
        my @by_count = sort { $cloud->{$a}->{'count'} <=> $cloud->{$b}->{'count'} } keys %$cloud;
        my @shown = splice(@by_count, 0, $count);
        my $links = join (', ', map { $cloud->{$_}->{'ctag'} } @shown);

        # centered only when no project is selected
        my $align = $project ? '' : ' align="center"';
        return '<div id="htmltagcloud"' . $align . '>' . $links . '</div>';
}
2749
sub git_get_project_url_list {
        # $path: project path below $projectroot (also sets global $git_dir)
        # Returns the lines of the 'cloneurl' file, or, when that file
        # cannot be opened, the values of the 'url' project config variable.
        # A list is returned in list context, an array reference otherwise.
        my ($path) = @_;

        $git_dir = "$projectroot/$path";

        my $fd;
        unless (open $fd, '<', "$git_dir/cloneurl") {
                my $from_config = config_to_multi(git_get_project_config('url'));
                return wantarray ? @{$from_config} : $from_config;
        }

        my @git_project_url_list = <$fd>;
        chomp @git_project_url_list;
        close $fd;

        return wantarray ? @git_project_url_list : \@git_project_url_list;
}
2763
sub git_get_projects_list {
        # $filter (optional): restrict the result to projects below this
        # path prefix (a trailing ".git" is dropped from it).
        # Returns a list of hash references with a 'path' key and, when the
        # list is read from a file, an 'owner' key.  If $projects_list is a
        # directory it is scanned with File::Find; if it is a file, each
        # line holds a URL-encoded "path owner" pair.
        my $filter = shift || '';
        my @list;

        $filter =~ s/\.git$//;

        if (-d $projects_list) {
                # search in directory
                my $dir = $projects_list;
                # remove the trailing "/"
                $dir =~ s!/+$!!;
                # Measure the prefix on the normalized $dir: File::Find
                # names are built from it, so using $projects_list with a
                # trailing "/" would cut one character too many from each
                # path and miscount the depth.
                my $pfxlen = length($dir);
                my $pfxdepth = ($dir =~ tr!/!!);
                # when filtering, search only given subdirectory
                if ($filter) {
                        $dir .= "/$filter";
                        $dir =~ s!/+$!!;
                }

                File::Find::find({
                        follow_fast => 1, # follow symbolic links
                        follow_skip => 2, # ignore duplicates
                        dangling_symlinks => 0, # ignore dangling symlinks, silently
                        wanted => sub {
                                # global variables
                                our $project_maxdepth;
                                our $projectroot;
                                # skip project-list toplevel, if we get it.
                                return if (m!^[/.]$!);
                                # only directories can be git repositories
                                return unless (-d $_);
                                # don't traverse too deep (Find is super slow on os x)
                                # $project_maxdepth excludes depth of $projectroot
                                if (($File::Find::name =~ tr!/!!) - $pfxdepth > $project_maxdepth) {
                                        $File::Find::prune = 1;
                                        return;
                                }

                                my $path = substr($File::Find::name, $pfxlen + 1);
                                # we check related file in $projectroot
                                if (check_export_ok("$projectroot/$path")) {
                                        push @list, { path => $path };
                                        # do not descend into a repository
                                        $File::Find::prune = 1;
                                }
                        },
                }, "$dir");

        } elsif (-f $projects_list) {
                # read from file(url-encoded):
                # 'git%2Fgit.git Linus+Torvalds'
                # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
                # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
                open my $fd, '<', $projects_list or return;
        PROJECT:
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($path, $owner) = split ' ', $line;
                        $path = unescape($path);
                        $owner = unescape($owner);
                        if (!defined $path) {
                                next PROJECT;
                        }
                        # if $filter is provided, check if $path begins with $filter
                        if ($filter && $path !~ m!^\Q$filter\E/!) {
                                next PROJECT;
                        }
                        if (check_export_ok("$projectroot/$path")) {
                                my $pr = {
                                        path => $path,
                                        owner => to_utf8($owner),
                                };
                                push @list, $pr;
                        }
                }
                close $fd;
        }
        return @list;
}
2842
# written with help of Tree::Trie module (Perl Artistic License, GPL compatible)
# as side effects it sets 'forks' field to list of forks for forked projects
#
# $projects: array reference of project hashes (each with a 'path' key).
# Returns the list of projects that are not forks; every project that may
# have forks gets a 'forks' array reference filled with its forks.
sub filter_forks_from_projects_list {
        my $projects = shift;

        my %trie; # prefix tree of directories (path components)
        # generate trie out of those directories that might contain forks
        foreach my $pr (@$projects) {
                my $path = $pr->{'path'};
                $path =~ s/\.git$//;      # forks of 'repo.git' are in 'repo/' directory
                next if ($path =~ m!/$!); # skip non-bare repositories, e.g. 'repo/.git'
                next unless ($path);      # skip '.git' repository: tests, git-instaweb
                # containing directory exists; project paths are relative to
                # $projectroot, not to the current working directory
                next unless (-d "$projectroot/$path");
                $pr->{'forks'} = [];      # there can be 0 or more forks of project

                # add to trie
                my @dirs = split('/', $path);
                # walk the trie, until either runs out of components or out of trie
                my $ref = \%trie;
                while (scalar @dirs &&
                       exists($ref->{$dirs[0]})) {
                        $ref = $ref->{shift @dirs};
                }
                # create rest of trie structure from rest of components
                foreach my $dir (@dirs) {
                        $ref = $ref->{$dir} = {};
                }
                # create end marker, store $pr as a data
                $ref->{''} = $pr if (!exists $ref->{''});
        }

        # filter out forks, by finding shortest prefix match for paths
        my @filtered;
 PROJECT:
        foreach my $pr (@$projects) {
                # trie lookup
                my $ref = \%trie;
        DIR:
                foreach my $dir (split('/', $pr->{'path'})) {
                        if (exists $ref->{''}) {
                                # found [shortest] prefix, is a fork - skip it
                                push @{$ref->{''}{'forks'}}, $pr;
                                next PROJECT;
                        }
                        if (!exists $ref->{$dir}) {
                                # not in trie, cannot have prefix, not a fork
                                push @filtered, $pr;
                                next PROJECT;
                        }
                        # If the dir is there, we just walk one step down the trie.
                        $ref = $ref->{$dir};
                }
                # we ran out of trie
                # (shouldn't happen: it's either no match, or end marker)
                push @filtered, $pr;
        }

        return @filtered;
}
2902
2903 # note: fill_project_list_info must be run first,
2904 # for 'descr_long' and 'ctags' to be filled
sub search_projects_list {
        # $projlist: array reference of project hashes
        # %opts:     'tagfilter'  - keep projects having this ctag (case-insensitive)
        #            'searchtext' - keep projects whose 'path' or 'descr_long'
        #                           matches this pattern
        # Returns the matching projects; all of them when no option is set.
        my ($projlist, %opts) = @_;
        my ($tagfilter, $searchtext) = @opts{qw(tagfilter searchtext)};

        return @$projlist
                unless ($tagfilter || $searchtext);

        my @projects;
 PROJECT:
        foreach my $pr (@$projlist) {

                if ($tagfilter) {
                        # projects without a ctags hash cannot match a tag
                        next PROJECT unless ref($pr->{'ctags'}) eq 'HASH';
                        my $has_tag =
                                grep { lc($_) eq lc($tagfilter) } keys %{$pr->{'ctags'}};
                        next PROJECT unless $has_tag;
                }

                if ($searchtext) {
                        # skip when neither the path nor the description matches
                        next PROJECT
                                if ($pr->{'path'} !~ /$searchtext/ &&
                                    $pr->{'descr_long'} !~ /$searchtext/);
                }

                push @projects, $pr;
        }

        return @projects;
}
2934
our $gitweb_project_owner = undef;
sub git_get_project_list_from_file {
        # Fills the global $gitweb_project_owner hash (project path => owner)
        # from $projects_list when that is a plain file.  Does nothing if
        # the hash has already been initialized.

        return if (defined $gitweb_project_owner);

        $gitweb_project_owner = {};
        # read from file (url-encoded):
        # 'git%2Fgit.git Linus+Torvalds'
        # 'libs%2Fklibc%2Fklibc.git H.+Peter+Anvin'
        # 'linux%2Fhotplug%2Fudev.git Greg+Kroah-Hartman'
        if (-f $projects_list) {
                # an unreadable list simply leaves the owner table empty
                open(my $fd, '<', $projects_list)
                        or return;
                while (my $line = <$fd>) {
                        chomp $line;
                        my ($pr, $ow) = split ' ', $line;
                        # blank lines carry no project; skip them instead of
                        # storing an entry under an undefined key
                        next unless defined $pr;
                        $pr = unescape($pr);
                        $ow = unescape($ow);
                        $gitweb_project_owner->{$pr} = to_utf8($ow);
                }
                close $fd;
        }
}
2957
sub git_get_project_owner {
        # $project: project path below $projectroot (also sets global $git_dir)
        # Returns the owner from the first source that knows one: the
        # projects list file, the 'owner' project config variable, or
        # get_file_owner() on the repository directory.
        my ($project) = @_;

        return undef unless $project;
        $git_dir = "$projectroot/$project";

        # load the owner table on first use
        git_get_project_list_from_file()
                unless defined $gitweb_project_owner;

        my $owner;
        $owner = $gitweb_project_owner->{$project}
                if exists $gitweb_project_owner->{$project};
        $owner = git_get_project_config('owner')
                unless defined $owner;
        $owner = get_file_owner("$git_dir")
                unless defined $owner;

        return $owner;
}
2981
sub git_get_last_activity {
        # $path: project path below $projectroot (also sets global $git_dir)
        # Returns (age in seconds, age_string(age)) computed from the
        # committer line of the most recently committed ref under
        # refs/heads, (undef, undef) when no timestamp can be parsed, or
        # nothing when the command cannot be run.
        my ($path) = @_;

        $git_dir = "$projectroot/$path";
        my @cmd = (git_cmd(), 'for-each-ref',
                   '--format=%(committer)',
                   '--sort=-committerdate',
                   '--count=1',
                   'refs/heads');
        open(my $fd, "-|", @cmd) or return;
        my $most_recent = <$fd>;
        close $fd or return;

        return (undef, undef) unless defined $most_recent;

        # the committer line ends with "<epoch> <timezone>"
        my ($timestamp) = $most_recent =~ / (\d+) [-+][01]\d\d\d$/
                or return (undef, undef);

        my $age = time - $timestamp;
        return ($age, age_string($age));
}
3002
3003 # Implementation note: when a single remote is wanted, we cannot use 'git
3004 # remote show -n' because that command always work (assuming it's a remote URL
3005 # if it's not defined), and we cannot use 'git remote show' because that would
3006 # try to make a network roundtrip. So the only way to find if that particular
3007 # remote is defined is to walk the list provided by 'git remote -v' and stop if
3008 # and when we find what we want.
sub git_get_remotes_list {
        # $wanted (optional): name of the only remote to report.
        # Returns a hash (list context) or hash reference (scalar context)
        # mapping remote name to { 'heads' => undef, <key> => <url>, ... }
        # where <key> is the word 'git remote -v' prints in parentheses.
        # Returns nothing when the command cannot be run.
        my $wanted = shift;
        my %remotes = ();

        # Test open's own result: the lexical handle is autovivified even
        # when open fails, so checking $fd cannot detect the failure.
        open my $fd, '-|' , git_cmd(), 'remote', '-v'
                or return;
        while (my $remote = <$fd>) {
                chomp $remote;
                # split "<name>\t<url> (<key>)"; lines of any other shape
                # are skipped rather than read through stale $1/$2
                next unless $remote =~ s!\t(.*?)\s+\((\w+)\)$!!;
                my ($url, $key) = ($1, $2);
                next if $wanted and $remote ne $wanted;

                # 'heads' starts out undefined (an explicit undef avoids an
                # odd-length hash constructor)
                $remotes{$remote} ||= { 'heads' => undef };
                $remotes{$remote}{$key} = $url;
        }
        close $fd or return;
        return wantarray ? %remotes : \%remotes;
}
3027
# Takes a reference to a hash of remotes as first parameter and fills it by
# adding the available remote heads for each of the indicated remotes.
#
# The heads of all remotes are fetched with a single git_get_heads_list()
# call; every remote then gets, under its 'heads' key, a reference to the
# list of those head entries whose name starts with "<remote>/".  That
# prefix is stripped from the 'name' field of the entries as they are
# selected.
sub fill_remote_heads {
        my $remotes = shift;
        my @heads = map { "remotes/$_" } keys %$remotes;
        my @remoteheads = git_get_heads_list(undef, @heads);
        foreach my $remote (keys %$remotes) {
                # \Q..\E: the remote name is literal text, not a pattern, so
                # characters such as '.' or '+' in it must not be interpreted
                $remotes->{$remote}{'heads'} = [ grep {
                        $_->{'name'} =~ s!^\Q$remote\E/!!
                        } @remoteheads ];
        }
}
3040
# Collect the names of the refs pointing at each object.
#
# Takes an optional ref type (the part after "refs/"); without it all refs
# are listed.  Returns a reference to a hash mapping an object id to the
# list of ref names (without the leading "refs/") that resolve to it, or
# nothing if git could not be run or exited with an error.
sub git_get_references {
        my $type = shift || "";
        my %refs;

        # use -- <pattern> if $type
        my @pattern = $type ? ("--", "refs/$type") : ();

        # 5dc01c595e6c6ec9ccda4f6f69c131c0dd945f8c refs/tags/v2.6.11
        # c39ae07f393806ccf406ef966e9a15afc43cc36a refs/tags/v2.6.11^{}
        open my $fd, "-|", git_cmd(), "show-ref", "--dereference", @pattern
                or return;

        while (my $line = <$fd>) {
                chomp $line;
                next unless $line =~ m!^([0-9a-fA-F]{40})\srefs/($type.*)$!;
                # the list for a new object id springs into existence here
                push @{$refs{$1}}, $2;
        }
        close $fd or return;
        return \%refs;
}
3063
# Describe an object in terms of the tags of the repository.
#
# Runs 'git name-rev --tags' on the given hash and returns the part of its
# output following "tags/", or undef when no hash was given, when git
# printed nothing, or when the output names no tag.  Returns nothing if
# the git command could not be started.
sub git_get_rev_name_tags {
        my $hash = shift || return undef;

        open my $fd, "-|", git_cmd(), "name-rev", "--tags", $hash
                or return;
        my $name_rev = <$fd>;
        close $fd;

        # $name_rev is undefined when git printed nothing at all; $hash is
        # matched literally (\Q..\E), not as a pattern
        if (defined $name_rev && $name_rev =~ m|^\Q$hash\E tags/(.*)$|) {
                return $1;
        } else {
                # catches also '$hash undefined' output
                return undef;
        }
}
3079
3080 ## ----------------------------------------------------------------------
3081 ## parse to hash functions
3082
# Break a timestamp down into the pieces and preformatted strings used
# when printing dates.
#
# Takes the time in seconds since the epoch and an optional timezone in
# "+hhmm" / "-hhmm" form (default "-0000").  Returns a hash with:
#   hour, minute, mday, day, month  - the time in UTC (day and month as
#                                     three-letter English names)
#   rfc2822, mday-time, iso-8601    - the UTC time in those formats
#   hour_local, minute_local        - the time shifted by the timezone
#   tz_local                        - the timezone string as given
#   iso-tz                          - the shifted time followed by the
#                                     timezone string as given
# A timezone that is not of the expected form is treated as a zero offset.
sub parse_date {
        my $epoch = shift;
        my $tz = shift || "-0000";

        my %date;
        my @months = ("Jan", "Feb", "Mar", "Apr", "May", "Jun", "Jul", "Aug", "Sep", "Oct", "Nov", "Dec");
        my @days = ("Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat");
        my ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($epoch);
        $date{'hour'} = $hour;
        $date{'minute'} = $min;
        $date{'mday'} = $mday;
        $date{'day'} = $days[$wday];
        $date{'month'} = $months[$mon];
        $date{'rfc2822'}   = sprintf "%s, %d %s %4d %02d:%02d:%02d +0000",
                             $days[$wday], $mday, $months[$mon], 1900+$year, $hour ,$min, $sec;
        $date{'mday-time'} = sprintf "%d %s %02d:%02d",
                             $mday, $months[$mon], $hour ,$min;
        $date{'iso-8601'}  = sprintf "%04d-%02d-%02dT%02d:%02d:%02dZ",
                             1900+$year, 1+$mon, $mday, $hour ,$min, $sec;

        # start from a zero offset, so that a malformed timezone neither
        # leaves these undefined nor triggers warnings below
        my ($tz_sign, $tz_hour, $tz_min) = ('+', 0, 0);
        if ($tz =~ m/^([-+])(\d\d)(\d\d)$/) {
                ($tz_sign, $tz_hour, $tz_min) = ($1, $2, $3);
        }
        my $offset = (($tz_hour*60) + $tz_min)*60;
        $offset = -$offset if $tz_sign eq '-';

        # gmtime() of the shifted timestamp gives the wall-clock time in $tz
        my $local = $epoch + $offset;
        ($sec, $min, $hour, $mday, $mon, $year, $wday) = gmtime($local);
        $date{'hour_local'} = $hour;
        $date{'minute_local'} = $min;
        $date{'tz_local'} = $tz;
        $date{'iso-tz'} = sprintf("%04d-%02d-%02d %02d:%02d:%02d %s",
                                  1900+$year, $mon+1, $mday,
                                  $hour, $min, $sec, $tz);
        return %date;
}
3116
# Read a tag object with 'git cat-file tag' and parse it.
#
# Returns a hash with 'id' (the argument), 'object', 'type' and 'name'
# from the tag header, the 'author*' fields taken from the tagger line
# (where present), and 'comment', a reference to the list of the remaining
# lines.  Returns nothing if git could not be run, exited with an error,
# or the object carries no 'tag' line.
sub parse_tag {
        my $tag_id = shift;
        my %tag;
        my @message;

        open my $fd, "-|", git_cmd(), "cat-file", "tag", $tag_id or return;
        $tag{'id'} = $tag_id;
        while (my $line = <$fd>) {
                chomp $line;
                if ($line =~ m/^object ([0-9a-fA-F]{40})$/) {
                        $tag{'object'} = $1;
                } elsif ($line =~ m/^type (.+)$/) {
                        $tag{'type'} = $1;
                } elsif ($line =~ m/^tag (.+)$/) {
                        $tag{'name'} = $1;
                } elsif ($line =~ m/^tagger (.*) ([0-9]+) (.*)$/) {
                        @tag{'author', 'author_epoch', 'author_tz'} = ($1, $2, $3);
                        # split "Name <email>" when it has that shape
                        if ($tag{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                @tag{'author_name', 'author_email'} = ($1, $2);
                        } else {
                                $tag{'author_name'} = $tag{'author'};
                        }
                } elsif ($line =~ m/--BEGIN/) {
                        # such a line already belongs to the message
                        push @message, $line;
                        last;
                } elsif ($line eq "") {
                        # the empty line ends the header
                        last;
                }
        }
        # whatever is left unread is the rest of the message
        push @message, <$fd>;
        $tag{'comment'} = \@message;
        close $fd or return;

        return unless defined $tag{'name'};
        return %tag;
}
3157
# Parse the text of one commit as read from 'git rev-list --header'.
#
# Takes the commit text and an optional flag.  The first line must start
# with the commit id; any further words on it are taken as parent ids.
# 'parent' header lines are used as well, but only when the flag is not
# defined.  Returns a hash with 'id', 'tree', 'parents' (list reference),
# 'parent' (the first parent), the 'author*' and 'committer*' fields,
# 'title' and 'title_short', 'comment' (reference to the list of message
# lines with the four-space indent removed) and the 'age*' fields derived
# from the committer timestamp.  Returns nothing if the text is empty,
# does not start with an object id, or has no 'tree' line.
sub parse_commit_text {
        my ($commit_text, $withparents) = @_;
        my @commit_lines = split '\n', $commit_text;
        my %co;

        pop @commit_lines; # Remove '\0'

        if (! @commit_lines) {
                return;
        }

        my $header = shift @commit_lines;
        if ($header !~ m/^[0-9a-fA-F]{40}/) {
                return;
        }
        ($co{'id'}, my @parents) = split ' ', $header;
        # header lines; the loop ends at the first empty line
        while (my $line = shift @commit_lines) {
                last if $line eq "\n";
                if ($line =~ m/^tree ([0-9a-fA-F]{40})$/) {
                        $co{'tree'} = $1;
                } elsif ((!defined $withparents) && ($line =~ m/^parent ([0-9a-fA-F]{40})$/)) {
                        push @parents, $1;
                } elsif ($line =~ m/^author (.*) ([0-9]+) (.*)$/) {
                        $co{'author'} = to_utf8($1);
                        $co{'author_epoch'} = $2;
                        $co{'author_tz'} = $3;
                        if ($co{'author'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'author_name'}  = $1;
                                $co{'author_email'} = $2;
                        } else {
                                $co{'author_name'} = $co{'author'};
                        }
                } elsif ($line =~ m/^committer (.*) ([0-9]+) (.*)$/) {
                        $co{'committer'} = to_utf8($1);
                        $co{'committer_epoch'} = $2;
                        $co{'committer_tz'} = $3;
                        if ($co{'committer'} =~ m/^([^<]+) <([^>]*)>/) {
                                $co{'committer_name'}  = $1;
                                $co{'committer_email'} = $2;
                        } else {
                                $co{'committer_name'} = $co{'committer'};
                        }
                }
        }
        if (!defined $co{'tree'}) {
                return;
        };
        $co{'parents'} = \@parents;
        $co{'parent'} = $parents[0];

        foreach my $line (@commit_lines) {
                # work on a copy: a foreach variable aliases the list element,
                # and the shortening below must not end up in $co{'comment'}
                (my $title = $line) =~ s/^    //;
                if ($title ne "") {
                        $co{'title'} = chop_str($title, 80, 5);
                        # remove leading stuff of merges to make the interesting part visible
                        if (length($title) > 50) {
                                $title =~ s/^Automatic //;
                                $title =~ s/^merge (of|with) /Merge ... /i;
                                if (length($title) > 50) {
                                        $title =~ s/(http|rsync):\/\///;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/(master|www|rsync)\.//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/kernel.org:?//;
                                }
                                if (length($title) > 50) {
                                        $title =~ s/\/pub\/scm//;
                                }
                        }
                        $co{'title_short'} = chop_str($title, 50, 5);
                        last;
                }
        }
        if (! defined $co{'title'} || $co{'title'} eq "") {
                $co{'title'} = $co{'title_short'} = '(no commit message)';
        }
        # remove added spaces (in place; each line is stripped exactly once)
        foreach my $line (@commit_lines) {
                $line =~ s/^    //;
        }
        $co{'comment'} = \@commit_lines;

        my $age = time - $co{'committer_epoch'};
        $co{'age'} = $age;
        $co{'age_string'} = age_string($age);
        my ($sec, $min, $hour, $mday, $mon, $year, $wday, $yday) = gmtime($co{'committer_epoch'});
        # commits older than two weeks show the date first and the age second
        if ($age > 60*60*24*7*2) {
                $co{'age_string_date'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
                $co{'age_string_age'} = $co{'age_string'};
        } else {
                $co{'age_string_date'} = $co{'age_string'};
                $co{'age_string_age'} = sprintf "%4i-%02u-%02i", 1900 + $year, $mon+1, $mday;
        }
        return %co;
}
3255
# Read a single commit with 'git rev-list' and parse it.
#
# Returns the hash produced by parse_commit_text() for the given commit
# id; reports a 500 error through die_error() if git cannot be started.
sub parse_commit {
        my ($commit_id) = @_;

        # records are read up to a NUL byte instead of a newline
        local $/ = "\0";

        my @command = (git_cmd(), "rev-list",
                "--parents",
                "--header",
                "--max-count=1",
                $commit_id,
                "--");
        open my $fd, "-|", @command
                or die_error(500, "Open git-rev-list failed");
        # the trailing 1 makes parse_commit_text() rely on the parent ids
        # listed on the first line (--parents)
        my %co = parse_commit_text(<$fd>, 1);
        close $fd;

        return %co;
}
3274
# Read a range of commits with 'git rev-list' and parse each of them.
#
# Takes the starting commit id, the maximum number of commits (default 1),
# the number of commits to skip (default 0), an optional file name to
# limit the history to, and any further rev-list arguments.  The global
# @extra_options are passed to git as well.  Returns the list of parsed
# commits as hash references (a reference to that list in scalar context);
# reports a 500 error through die_error() if git cannot be started.
sub parse_commits {
        my ($commit_id, $maxcount, $skip, $filename, @args) = @_;

        $maxcount ||= 1;
        $skip ||= 0;

        # records are read up to a NUL byte instead of a newline
        local $/ = "\0";

        my @path_limit = $filename ? ($filename) : ();
        open my $fd, "-|", git_cmd(), "rev-list",
                "--header",
                @args,
                "--max-count=$maxcount",
                "--skip=$skip",
                @extra_options,
                $commit_id,
                "--",
                @path_limit
                or die_error(500, "Open git-rev-list failed");

        my @cos;
        while (my $record = <$fd>) {
                push @cos, +{ parse_commit_text($record) };
        }
        close $fd;

        return wantarray ? @cos : \@cos;
}
3302
# parse line of git-diff-tree "raw" output
#
# Three kinds of lines are recognized: an ordinary diff line, a combined
# diff line (for a merge commit) and a bare commit id.  Returns a hash
# (a hash reference in scalar context) with the fields found; the hash is
# empty when the line has none of these forms.
sub parse_difftree_raw_line {
        my $line = shift;
        my %res;

        # ':100644 100644 03b218260e99b78c6df0ed378e59ed9205ccc96d 3b93d5e7cc7f7dd4ebed13a5cc1a4ad976fc94d8 M   ls-files.c'
        # ':100644 100644 7f9281985086971d3877aca27704f2aaf9c448ce bc190ebc71bbd923f2b728e505408f5e54bd073a M   rev-tree.c'
        if ($line =~ m/^:([0-7]{6}) ([0-7]{6}) ([0-9a-fA-F]{40}) ([0-9a-fA-F]{40}) (.)([0-9]{0,3})\t(.*)$/) {
                @res{qw(from_mode to_mode from_id to_id status similarity)} =
                        ($1, $2, $3, $4, $5, $6);
                my $paths = $7;
                if ($res{'status'} eq 'R' || $res{'status'} eq 'C') { # renamed or copied
                        # source and destination are separated by a tab
                        @res{'from_file', 'to_file'} =
                                map { unquote($_) } split("\t", $paths);
                } else {
                        my $file = unquote($paths);
                        @res{'from_file', 'to_file', 'file'} = ($file) x 3;
                }
        }
        # '::100755 100755 100755 60e79ca1b01bc8b057abe17ddab484699a7f5fdb 94067cc5f73388f33722d52ae02f44692bc07490 94067cc5f73388f33722d52ae02f44692bc07490 MR git-gui/git-gui.sh'
        # combined diff (for merge commit)
        elsif ($line =~ s/^(::+)((?:[0-7]{6} )+)((?:[0-9a-fA-F]{40} )+)([a-zA-Z]+)\t(.*)$//) {
                my ($colons, $modes, $ids, $status, $path) = ($1, $2, $3, $4, $5);
                my @modes = split(' ', $modes);
                my @ids   = split(' ', $ids);

                $res{'nparents'}  = length($colons);
                # the last mode and the last id describe the result
                $res{'to_mode'}   = pop @modes;
                $res{'from_mode'} = \@modes;
                $res{'to_id'}     = pop @ids;
                $res{'from_id'}   = \@ids;
                $res{'status'}    = [ split('', $status) ];
                $res{'to_file'}   = unquote($path);
        }
        # 'c512b523472485aef4fff9e57b229d9d243c967f'
        elsif ($line =~ m/^([0-9a-fA-F]{40})$/) {
                $res{'commit'} = $1;
        }

        return wantarray ? %res : \%res;
}
3341
# wrapper: return parsed line of git-diff-tree "raw" output
# (the argument might be raw line, or parsed info)
#
# A hash reference is handed back untouched; anything else is passed to
# parse_difftree_raw_line().
sub parsed_difftree_line {
        my $line_or_ref = shift;

        # pre-parsed (or generated by hand)
        return $line_or_ref
                if ref($line_or_ref) eq "HASH";

        return parse_difftree_raw_line($line_or_ref);
}
3354
# parse line of git-ls-tree output
#
# Takes the line followed by options given as key/value pairs:
#   -l => true  the line has a size column ('git ls-tree -l' format)
#   -z => true  the file name is taken verbatim instead of being passed
#               through unquote()
# Returns a hash (a hash reference in scalar context) with 'mode', 'type',
# 'hash', 'name' and, with -l, 'size'.  The hash is empty when the line
# does not have the expected form.
sub parse_ls_tree_line {
        my $line = shift;
        my %opts = @_;
        my %res;

        # The captures are taken from the value of the match rather than
        # from $1..$5: after a failed match those would still hold whatever
        # an earlier, unrelated match left behind.
        my ($mode, $type, $hash, $size, $name);
        if ($opts{'-l'}) {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa   16717  panic.c'
                ($mode, $type, $hash, $size, $name) =
                        ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40}) +(-|[0-9]+)\t(.+)$/s);
        } else {
                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                ($mode, $type, $hash, $name) =
                        ($line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t(.+)$/s);
        }

        if (defined $mode) {
                $res{'mode'} = $mode;
                $res{'type'} = $type;
                $res{'hash'} = $hash;
                $res{'size'} = $size if $opts{'-l'};
                $res{'name'} = $opts{'-z'} ? $name : unquote($name);
        }

        return wantarray ? %res : \%res;
}
3390
# generates _two_ hashes, references to which are passed as 2 and 3 argument
#
# Fills %$from and %$to with the 'file' name and the 'href' of the blob
# view for the two sides of the difftree entry $diffinfo.  For a combined
# diff the 'file' and 'href' of %$from are lists with one element per
# parent, and the parent ids are expected after the three references.
# The 'href' is left out (or set to undef, in the combined case) for a
# side on which the file does not exist.
sub parse_from_to_diffinfo {
        my ($diffinfo, $from, $to, @parents) = @_;

        if ($diffinfo->{'nparents'}) {
                # combined diff
                $from->{'file'} = [];
                $from->{'href'} = [];
                fill_from_file_info($diffinfo, @parents)
                        unless exists $diffinfo->{'from_file'};
                foreach my $i (0 .. $diffinfo->{'nparents'} - 1) {
                        # fall back to the resulting name when the name in
                        # this parent is not known
                        if (defined $diffinfo->{'from_file'}[$i]) {
                                $from->{'file'}[$i] = $diffinfo->{'from_file'}[$i];
                        } else {
                                $from->{'file'}[$i] = $diffinfo->{'to_file'};
                        }
                        if ($diffinfo->{'status'}[$i] eq "A") { # new (added) file
                                $from->{'href'}[$i] = undef;
                        } else {
                                $from->{'href'}[$i] = href(action=>"blob",
                                                           hash_base=>$parents[$i],
                                                           hash=>$diffinfo->{'from_id'}[$i],
                                                           file_name=>$from->{'file'}[$i]);
                        }
                }
        } else {
                # ordinary (not combined) diff
                $from->{'file'} = $diffinfo->{'from_file'};
                if ($diffinfo->{'status'} eq "A") { # new (added) file
                        delete $from->{'href'};
                } else {
                        $from->{'href'} = href(action=>"blob", hash_base=>$hash_parent,
                                               hash=>$diffinfo->{'from_id'},
                                               file_name=>$from->{'file'});
                }
        }

        $to->{'file'} = $diffinfo->{'to_file'};
        if (!is_deleted($diffinfo)) { # file exists in result
                $to->{'href'} = href(action=>"blob", hash_base=>$hash,
                                     hash=>$diffinfo->{'to_id'},
                                     file_name=>$to->{'file'});
        } else {
                delete $to->{'href'};
        }
}
3436
3437 ## ......................................................................
3438 ## parse to array of hashes functions
3439
# List the heads of a repository, most recently committed first.
#
# Takes an optional limit (one entry more than the limit is asked for)
# and the ref classes to list, i.e. the names below "refs/" (default:
# 'heads').  Returns a list of hash references (a reference to that list
# in scalar context) with the keys 'fullname', 'name', 'id', 'title',
# 'epoch' and 'age'; returns nothing if git could not be started.
sub git_get_heads_list {
        my ($limit, @classes) = @_;
        @classes = ('heads') unless @classes;
        my @patterns = map { "refs/$_" } @classes;
        my @count = $limit ? ('--count='.($limit+1)) : ();
        my @headslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                @count, '--sort=-committerdate',
                '--format=%(objectname) %(refname) %(subject)%00%(committer)',
                @patterns
                or return;
        while (my $line = <$fd>) {
                chomp $line;
                # a NUL byte separates the ref part from the committer part
                my ($refinfo, $committerinfo) = split(/\0/, $line);
                my ($id, $fullname, $subject) = split(' ', $refinfo, 3);
                my ($committer, $epoch, $tz) =
                        ($committerinfo =~ /^(.*) ([0-9]+) (.*)$/);
                (my $name = $fullname) =~ s!^refs/(?:head|remote)s/!!;

                my %ref_item = (
                        'fullname' => $fullname,
                        'name'     => $name,
                        'id'       => $id,
                        'title'    => $subject || '(no commit message)',
                        'epoch'    => $epoch,
                );
                if ($epoch) {
                        $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                } else {
                        $ref_item{'age'} = "unknown";
                }

                push @headslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @headslist : \@headslist;
}
3478
# List the tags of a repository, most recently created first.
#
# Takes an optional limit (one entry more than the limit is asked for).
# Returns a list of hash references (a reference to that list in scalar
# context) with the keys 'fullname', 'name', 'type', 'id', 'reftype' and
# 'refid'; tag objects also have 'subject', and entries of type "tag" or
# "commit" have 'epoch' and 'age'.  Returns nothing if git could not be
# started.
sub git_get_tags_list {
        my $limit = shift;
        my @tagslist;

        open my $fd, '-|', git_cmd(), 'for-each-ref',
                ($limit ? '--count='.($limit+1) : ()), '--sort=-creatordate',
                '--format=%(objectname) %(objecttype) %(refname) '.
                '%(*objectname) %(*objecttype) %(subject)%00%(creator)',
                'refs/tags'
                or return;
        while (my $line = <$fd>) {
                my %ref_item;

                chomp $line;
                my ($refinfo, $creatorinfo) = split(/\0/, $line);
                my ($id, $type, $name, $refid, $reftype, $title) = split(' ', $refinfo, 6);
                # split() drops a trailing empty field, so $creatorinfo is
                # undefined when nothing follows the NUL byte (presumably a
                # tag pointing at an object without a creator, such as a blob
                # or a tree - TODO confirm)
                my ($creator, $epoch, $tz);
                if (defined $creatorinfo) {
                        ($creator, $epoch, $tz) =
                                ($creatorinfo =~ /^(.*) ([0-9]+) (.*)$/);
                }
                $ref_item{'fullname'} = $name;
                $name =~ s!^refs/tags/!!;

                $ref_item{'type'} = $type;
                $ref_item{'id'} = $id;
                $ref_item{'name'} = $name;
                if ($type eq "tag") {
                        # a tag object: report what it points to
                        $ref_item{'subject'} = $title;
                        $ref_item{'reftype'} = $reftype;
                        $ref_item{'refid'}   = $refid;
                } else {
                        # the ref names the object directly
                        $ref_item{'reftype'} = $type;
                        $ref_item{'refid'}   = $id;
                }

                if ($type eq "tag" || $type eq "commit") {
                        $ref_item{'epoch'} = $epoch;
                        if ($epoch) {
                                $ref_item{'age'} = age_string(time - $ref_item{'epoch'});
                        } else {
                                $ref_item{'age'} = "unknown";
                        }
                }

                push @tagslist, \%ref_item;
        }
        close $fd;

        return wantarray ? @tagslist : \@tagslist;
}
3527
3528 ## ----------------------------------------------------------------------
3529 ## filesystem-related functions
3530
# Look up the name of the owner of a file in the password database.
#
# Returns the GECOS field of the user owning $path, cut at the first ','
# or ';' and passed through to_utf8(), or undef when the file cannot be
# stat()ed or its owner has no (GECOS) entry.
sub get_file_owner {
        my $path = shift;

        # without this check a failed stat() would pass undef to getpwuid(),
        # which would then look up uid 0
        my $st_uid = (stat($path))[4];
        if (!defined $st_uid) {
                return undef;
        }

        my $gcos = (getpwuid($st_uid))[6];
        if (!defined $gcos) {
                return undef;
        }
        my $owner = $gcos;
        $owner =~ s/[,;].*$//;
        return to_utf8($owner);
}
3543
# Print the contents of a file, every line passed through to_utf8().
#
# The file is assumed to exist; if it cannot be opened after all, nothing
# is printed (instead of reading from an unopened filehandle).
sub insert_file {
        my $filename = shift;

        open my $fd, '<', $filename
                or return;
        print map { to_utf8($_) } <$fd>;
        close $fd;
}
3552
3553 ## ......................................................................
3554 ## mimetype related functions
3555
# Guess the MIME type of a file from its extension, using a mime.types
# style map file.
#
# Takes the file name and the path of the map file.  Each line of the map
# that does not start with '#' is read as a MIME type followed by the
# extensions it applies to, separated by any whitespace (tabs or spaces).
# Returns the MIME type registered for the part of $filename after its
# last '.', or undef if the map cannot be read, the name has no '.', or
# the extension is not listed.
sub mimetype_guess_file {
        my $filename = shift;
        my $mimemap = shift;
        -r $mimemap or return undef;

        my %mimemap;
        open(my $mh, '<', $mimemap) or return undef;
        while (my $line = <$mh>) {
                next if $line =~ m/^#/; # skip comments
                # split ' ' also takes care of the trailing newline
                my ($mimetype, @exts) = split(' ', $line);
                foreach my $ext (@exts) {
                        $mimemap{$ext} = $mimetype;
                }
        }
        close($mh);

        # without a match $1 would still hold the result of an earlier,
        # unrelated match
        $filename =~ /\.([^.]*)$/ or return undef;
        return $mimemap{$1};
}
3578
# Guess the MIME type of a file from its name.
#
# The map file configured in $mimetypes_file (if any) is consulted first,
# then '/etc/mime.types'.  Returns undef for a name without a '.', or
# when neither map knows the extension.
sub mimetype_guess {
        my $filename = shift;
        $filename =~ /\./ or return undef;

        my $mime;
        if ($mimetypes_file) {
                # a path not starting with '/' is relative to the project
                my $file = ($mimetypes_file =~ m!^/!)
                        ? $mimetypes_file
                        : "$projectroot/$project/$mimetypes_file";
                $mime = mimetype_guess_file($filename, $file);
        }
        $mime ||= mimetype_guess_file($filename, '/etc/mime.types');
        return $mime;
}
3595
# Determine the MIME type of a blob.
#
# Takes the filehandle of the blob contents and, optionally, the file
# name.  The file name is tried against the MIME maps first; failing
# that, the contents are tested with -T and a few image extensions are
# recognized by name.  Without a filehandle the answer is
# $default_blob_plain_mimetype.
sub blob_mimetype {
        my $fd = shift;
        my $filename = shift;

        if ($filename) {
                my $guessed = mimetype_guess($filename);
                return $guessed if $guessed;
        }

        # just in case
        return $default_blob_plain_mimetype unless $fd;

        return 'text/plain' if -T $fd;
        return 'application/octet-stream' unless $filename;
        return 'image/png'  if $filename =~ m/\.png$/i;
        return 'image/gif'  if $filename =~ m/\.gif$/i;
        return 'image/jpeg' if $filename =~ m/\.jpe?g$/i;
        return 'application/octet-stream';
}
3622
# Build the content type for a blob.
#
# Takes the filehandle and file name of the blob and, optionally, a MIME
# type; without one the type is determined by blob_mimetype().  For
# 'text/plain' the charset from $default_text_plain_charset is appended
# when that is defined.
sub blob_contenttype {
        my ($fd, $file_name, $type) = @_;

        $type = blob_mimetype($fd, $file_name) unless $type;

        return $type
                unless ($type eq 'text/plain' && defined $default_text_plain_charset);
        return $type . "; charset=$default_text_plain_charset";
}
3633
# guess file syntax for syntax highlighting; return undef if no highlighting
# the name of syntax can (in the future) depend on syntax highlighter used
#
# Takes the highlight flag, the MIME type (not used at present) and the
# file name.  The base name, with a trailing '.in' removed, is looked up
# in %highlight_basename; failing that, the part after its last '.' is
# looked up in %highlight_ext.
sub guess_file_syntax {
        my ($highlight, $mimetype, $file_name) = @_;
        return undef unless ($highlight && defined $file_name);
        my $basename = basename($file_name, '.in');
        return $highlight_basename{$basename}
                if exists $highlight_basename{$basename};

        # take the extension from the value of the match: for a name without
        # a '.', $1 would still hold the result of an earlier, unrelated match
        my ($ext) = ($basename =~ /\.([^.]*)$/);
        return undef unless $ext;
        return $highlight_ext{$ext}
                if exists $highlight_ext{$ext};

        return undef;
}
3650
# run highlighter and return FD of its output,
# or return original FD if no highlighting
#
# When highlighting applies, the filehandle passed in is closed and
# reopened on a shell pipeline that feeds the blob named by the global
# $hash through $highlight_bin.
sub run_highlighter {
        my ($fd, $highlight, $syntax) = @_;
        return $fd unless ($highlight && defined $syntax);

        close $fd;
        # NOTE(review): unlike the other parts, $syntax reaches the shell
        # unquoted - confirm that it can only come from trusted configuration
        my $pipeline =
                quote_command(git_cmd(), "cat-file", "blob", $hash)." | ".
                quote_command($highlight_bin).
                " --replace-tabs=8 --fragment --syntax $syntax |";
        open $fd, $pipeline
                or die_error(500, "Couldn't open file or run syntax highlighter");
        return $fd;
}
3664
3665 ## ======================================================================
3666 ## functions printing HTML: header, footer, error page
3667
# Compose the title of the page from the site name and, as far as they
# are defined, the project, the action and the file name.
sub get_page_title {
        my $title = to_utf8($site_name);

        if (defined $project) {
                $title .= " - " . to_utf8($project);

                if (defined $action) {
                        $title .= "/$action"; # $action is US-ASCII (7bit ASCII)

                        if (defined $file_name) {
                                $title .= " - " . esc_path($file_name);
                                # mark the name of a tree with a trailing slash
                                $title .= "/"
                                        if ($action eq "tree" && $file_name !~ m|/$|);
                        }
                }
        }

        return $title;
}
3685
# Choose the content type to send an HTML page as.
sub get_content_type_html {
        # require explicit support from the UA if we are to send the page as
        # 'application/xhtml+xml', otherwise send it as plain old 'text/html'.
        # we have to do this because MSIE sometimes globs '*/*', pretending to
        # support xhtml+xml but choking when it gets what it asked for.
        my $accept = $cgi->http('HTTP_ACCEPT');

        return 'text/html'
                unless defined $accept;
        return 'text/html'
                unless $accept =~ m/(,|;|\s|^)application\/xhtml\+xml(,|;|\s|$)/;
        return 'text/html'
                unless $cgi->Accept('application/xhtml+xml') != 0;

        return 'application/xhtml+xml';
}
3699
# Print the <link rel="alternate"> elements of the page header.
#
# With a project selected these are, for each of the RSS and Atom
# formats, a link to the feed described by get_feed_info() and a link to
# the same feed without merges.  Without a project, links to the projects
# list and to the OPML list of project feeds are printed.
sub print_feed_meta {
        if (defined $project) {
                my %href_params = get_feed_info();
                if (!exists $href_params{'-title'}) {
                        $href_params{'-title'} = 'log';
                }

                foreach my $format (qw(RSS Atom)) {
                        my $type = lc($format);
                        my %link_attr = (
                                '-rel' => 'alternate',
                                '-title' => esc_attr("$project - $href_params{'-title'} - $format feed"),
                                '-type' => "application/$type+xml"
                        );

                        # Each link gets its own copy of the parameters.  If
                        # '--no-merges' were stored in %href_params itself, it
                        # would still be there when the plain link of the next
                        # format is generated.
                        my %plain     = (%href_params, 'action' => $type);
                        my %no_merges = (%plain, 'extra_options' => '--no-merges');

                        $link_attr{'-href'} = href(%plain);
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";

                        $link_attr{'-href'} = href(%no_merges);
                        $link_attr{'-title'} .= ' (no merges)';
                        print "<link ".
                              "rel=\"$link_attr{'-rel'}\" ".
                              "title=\"$link_attr{'-title'}\" ".
                              "href=\"$link_attr{'-href'}\" ".
                              "type=\"$link_attr{'-type'}\" ".
                              "/>\n";
                }

        } else {
                printf('<link rel="alternate" title="%s projects list" '.
                       'href="%s" type="text/plain; charset=utf-8" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"project_index"));
                printf('<link rel="alternate" title="%s projects feeds" '.
                       'href="%s" type="text/x-opml" />'."\n",
                       esc_attr($site_name), href(project=>undef, action=>"opml"));
        }
}
3744
# Print the <link> elements of the page header: the stylesheets, the
# feed links (only when the status is '200 OK') and the favicon.
sub print_header_links {
        my $status = shift;

        # print out each stylesheet that exist, providing backwards capability
        # for those people who defined $stylesheet in a config file
        my @sheets = defined $stylesheet
                ? ($stylesheet)
                : grep { $_ } @stylesheets;
        foreach my $sheet (@sheets) {
                print '<link rel="stylesheet" type="text/css" href="'.esc_url($sheet).'"/>'."\n";
        }

        if ($status eq '200 OK') {
                print_feed_meta();
        }
        if (defined $favicon) {
                print qq(<link rel="shortcut icon" href=").esc_url($favicon).qq(" type="image/png" />\n);
        }
}
3764
# Print the breadcrumbs line: the home link and, with a project selected,
# the project, the current action and whatever was passed as the
# -action_extra option.  The action is turned into a link only when
# -action_extra is given.
sub print_nav_breadcrumbs {
        my %opts = @_;
        my $extra = $opts{-action_extra};

        print $cgi->a({-href => esc_url($home_link)}, $home_link_str) . " / ";
        if (defined $project) {
                print $cgi->a({-href => href(action=>"summary")}, esc_html($project));
                if (defined $action) {
                        my $action_print = defined $extra
                                ? $cgi->a({-href => href(action=>$action)},
                                        $action)
                                : $action;
                        print " / $action_print";
                }
                print " / $extra"
                        if defined $extra;
                print "\n";
        }
}
3785
# Print the search form shown in the page header.
#
# Reads the globals $searchtext (defaulted to "" here), $hash_base, $hash,
# $my_uri, $project and $search_use_regexp.  When the 'pathinfo' feature
# is enabled the project is put into the form action URL, otherwise it is
# sent as the hidden "p" parameter.
sub print_search_form {
	if (!defined $searchtext) {
		$searchtext = "";
	}

	# search starts at the hash base if known, then at the current hash,
	# and finally at HEAD
	my $search_hash = defined $hash_base ? $hash_base
	                : defined $hash      ? $hash
	                :                      "HEAD";

	my $action = $my_uri;
	my $use_pathinfo = gitweb_check_feature('pathinfo');
	if ($use_pathinfo) {
		$action .= "/".esc_url($project);
	}

	# start_form is the supported name; the old startform alias is no
	# longer provided by current CGI.pm releases.
	print $cgi->start_form(-method => "get", -action => $action) .
	      "<div class=\"search\">\n" .
	      ($use_pathinfo ? "" :
	       $cgi->input({-name=>"p", -value=>$project, -type=>"hidden"}) . "\n") .
	      $cgi->input({-name=>"a", -value=>"search", -type=>"hidden"}) . "\n" .
	      $cgi->input({-name=>"h", -value=>$search_hash, -type=>"hidden"}) . "\n" .
	      $cgi->popup_menu(-name => 'st', -default => 'commit',
	                       -values => ['commit', 'grep', 'author', 'committer', 'pickaxe']) .
	      $cgi->sup($cgi->a({-href => href(action=>"search_help")}, "?")) .
	      " search:\n" .
	      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
	      "<span title=\"Extended regular expression\">" .
	      $cgi->checkbox(-name => 'sr', -value => 1, -label => 're',
	                     -checked => $search_use_regexp) .
	      "</span>" .
	      "</div>" .
	      $cgi->end_form() . "\n";
}
3821
# Print the HTTP header and the opening part of an HTML page: prolog,
# <head>, optional site header file, page header with logo and
# breadcrumbs, and (inside a project, if enabled) the search form.
#
# Parameters: HTTP status line (defaults to "200 OK"), expiry passed to
# the HTTP header, then options:
#   -no_http_header => true to skip printing the HTTP header
#   remaining options are handed on to print_nav_breadcrumbs()
sub git_header_html {
	my ($status, $expires, %opts) = @_;
	$status ||= "200 OK";

	my $title = get_page_title();
	my $content_type = get_content_type_html();
	if (!$opts{'-no_http_header'}) {
		print $cgi->header(-type=>$content_type, -charset => 'utf-8',
		                   -status=> $status, -expires => $expires);
	}

	my $mod_perl_version = '';
	$mod_perl_version = " $ENV{'MOD_PERL'}" if $ENV{'MOD_PERL'};
	print <<EOF;
<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en-US" lang="en-US">
<!-- git web interface version $version, (C) 2005-2006, Kay Sievers <kay.sievers\@vrfy.org>, Christian Gierke -->
<!-- git core binaries version $git_version -->
<head>
<meta http-equiv="content-type" content="$content_type; charset=utf-8"/>
<meta name="generator" content="gitweb/$version git/$git_version$mod_perl_version"/>
<meta name="robots" content="index, nofollow"/>
<title>$title</title>
EOF
	# relative stylesheet, favicon etc. URLs only resolve correctly with
	# path_info when an explicit base URL is given
	print "<base href=\"".esc_url($base_url)."\" />\n"
		if $ENV{'PATH_INFO'};
	print_header_links($status);
	print "</head>\n<body>\n";

	insert_file($site_header)
		if (defined $site_header && -f $site_header);

	print "<div class=\"page_header\">\n";
	if (defined $logo) {
		my $logo_img = $cgi->img({-src => esc_url($logo),
		                          -width => 72, -height => 27,
		                          -alt => "git",
		                          -class => "logo"});
		print $cgi->a({-href => esc_url($logo_url),
		               -title => $logo_label},
		              $logo_img);
	}
	print_nav_breadcrumbs(%opts);
	print "</div>\n";

	my $have_search = gitweb_check_feature('search');
	print_search_form()
		if (defined $project && $have_search);
}
3875
# Print the closing part of an HTML page: page footer with feed links,
# optional timing information, optional site footer file, the JavaScript
# includes, and the closing </body></html> tags.
sub git_footer_html {
	my $feed_class = 'rss_logo';

	print "<div class=\"page_footer\">\n";
	if (!defined $project) {
		# no project selected: links covering the whole projects list
		print $cgi->a({-href => href(project=>undef, action=>"opml"),
		              -class => $feed_class}, "OPML") . " ";
		print $cgi->a({-href => href(project=>undef, action=>"project_index"),
		              -class => $feed_class}, "TXT") . "\n";
	} else {
		my $descr = git_get_project_description($project);
		print "<div class=\"page_footer_text\">" . esc_html($descr) . "</div>\n"
			if defined $descr;

		my %href_params = get_feed_info();
		# no feed parameters for this view: mark the links as generic
		$feed_class .= ' generic' unless %href_params;
		$href_params{'-title'} ||= 'log';

		foreach my $feed_format ('RSS', 'Atom') {
			$href_params{'action'} = lc($feed_format);
			print $cgi->a({-href => href(%href_params),
			              -title => "$href_params{'-title'} $feed_format feed",
			              -class => $feed_class}, $feed_format)."\n";
		}
	}
	print "</div>\n"; # class="page_footer"

	if (defined $t0 && gitweb_check_feature('timed')) {
		print "<div id=\"generating_info\">\n";
		my $elapsed = tv_interval($t0, [ gettimeofday() ]);
		print 'This page took <span id="generating_time" class="time_span">' .
		      $elapsed .
		      ' seconds </span> and <span id="generating_cmd">' .
		      $number_of_git_cmds .
		      "</span> git commands  to generate.\n";
		print "</div>\n"; # id="generating_info"
	}

	insert_file($site_footer)
		if (defined $site_footer && -f $site_footer);

	print qq!<script type="text/javascript" src="!.esc_url($javascript).qq!"></script>\n!;
	my $incremental_blame = defined $action && $action eq 'blame_incremental';
	if ($incremental_blame) {
		print qq!<script type="text/javascript">\n!.
		      qq!startBlame("!. href(action=>"blame_data", -replay=>1) .qq!",\n!.
		      qq!           "!. href() .qq!");\n!.
		      qq!</script>\n!;
	} else {
		my ($jstimezone, $tz_cookie, $datetime_class) =
			gitweb_get_feature('javascript-timezone');

		print qq!<script type="text/javascript">\n!.
		      qq!window.onload = function () {\n!;
		print qq!       fixLinks();\n!
			if gitweb_check_feature('javascript-actions');
		if ($jstimezone && $tz_cookie && $datetime_class) {
			# 'expires' is given in days
			print qq!       var tz_cookie = { name: '$tz_cookie', expires: 14, path: '/' };\n!.
			      qq!       onloadTZSetup('$jstimezone', tz_cookie, '$datetime_class');\n!;
		}
		print qq!};\n!.
		      qq!</script>\n!;
	}

	print "</body>\n</html>";
}
3952
3953 # die_error(<http_status_code>, <error_message>[, <detailed_html_description>])
3954 # Example: die_error(404, 'Hash not found')
3955 # By convention, use the following status codes (as defined in RFC 2616):
3956 # 400: Invalid or missing CGI parameters, or
3957 #      requested object exists but has wrong type.
3958 # 403: Requested feature (like "pickaxe" or "snapshot") not enabled on
3959 #      this server or project.
3960 # 404: Requested object/revision/project doesn't exist.
3961 # 500: The server isn't configured properly, or
3962 #      an internal error occurred (e.g. failed assertions caused by bugs), or
3963 #      an unknown error occurred (e.g. the git binary died unexpectedly).
3964 # 503: The server is currently unavailable (because it is overloaded,
3965 #      or down for maintenance).  Generally, this is a temporary state.
# Print a complete error page (header, message, footer) and, unless the
# -error_handler option is set, jump to the DONE_GITWEB label.
#
# Parameters: numeric HTTP status code (default 500), error message (HTML
# escaped here; default "Internal Server Error"), optional extra HTML
# printed as-is below the message, then options which are also passed on
# to git_header_html().
sub die_error {
	my $status = shift || 500;
	my $error = esc_html(shift) || "Internal Server Error";
	my $extra = shift;
	my %opts = @_;

	my %http_responses = (
		400 => '400 Bad Request',
		403 => '403 Forbidden',
		404 => '404 Not Found',
		500 => '500 Internal Server Error',
		503 => '503 Service Unavailable',
	);
	# A code missing from the table must not reach git_header_html() as
	# undef: that would make it fall back to "200 OK" and serve the error
	# page as a success.  Treat unknown codes as an internal error.
	my $http_status = $http_responses{$status} || $http_responses{500};
	git_header_html($http_status, undef, %opts);
	print <<EOF;
<div class="page_body">
<br /><br />
$status - $error
<br />
EOF
	if (defined $extra) {
		print "<hr />\n" .
		      "$extra\n";
	}
	print "</div>\n";

	git_footer_html();
	goto DONE_GITWEB
		unless ($opts{'-error_handler'});
}
3996
3997 ## ----------------------------------------------------------------------
3998 ## functions printing or outputting HTML: navigation
3999
# Print the per-project navigation bar (summary | shortlog | log | ...),
# followed by the $extra line (pager or formats).
#
# $current   - name of the current view; printed as plain text, not a link
# $suppress  - name of a view to leave out of the bar, if any
# $head      - hash used for the commit/commitdiff links (and for the
#              shortlog/log links in some views)
# $treehead, $treebase - hash and hash_base for the tree link
# $extra     - HTML printed below the bar
sub git_print_page_nav {
	my ($current, $suppress, $head, $treehead, $treebase, $extra) = @_;
	$extra = '' unless defined $extra; # pager or formats

	my @navs = grep { !$suppress || $_ ne $suppress }
	           qw(summary shortlog log commit commitdiff tree);

	# href() parameters for every built-in view
	my %arg;
	$arg{$_} = {action=>$_} foreach @navs;

	if (defined $head) {
		my @views_with_head = qw(commit commitdiff);
		push @views_with_head, qw(shortlog log)
			if ($current =~ m/^(tree | log | shortlog | commit | commitdiff | search)$/x);
		$arg{$_}{'hash'} = $head foreach @views_with_head;
	}

	$arg{'tree'}{'hash'} = $treehead if defined $treehead;
	$arg{'tree'}{'hash_base'} = $treebase if defined $treebase;

	# user-configured extra actions come as (label, link, position) triplets
	my @actions = gitweb_get_feature('actions');
	my %repl = (
		'%' => '%',
		'n' => $project,         # project name
		'f' => $git_dir,         # project path within filesystem
		'h' => $treehead || '',  # current hash ('h' parameter)
		'b' => $treebase || '',  # hash base ('hb' parameter)
	);
	while (my ($label, $link, $pos) = splice(@actions, 0, 3)) {
		# place the new label right after the view named by $pos
		@navs = map { $_ eq $pos ? ($_, $label) : $_ } @navs;
		# expand the %-placeholders in the link template
		$link =~ s/%([%nfhb])/$repl{$1}/g;
		$arg{$label}{'_href'} = $link;
	}

	my @entries;
	foreach my $nav (@navs) {
		if ($nav eq $current) {
			push @entries, $nav;
			next;
		}
		my $target = $arg{$nav}{_href} || href(%{$arg{$nav}});
		push @entries, $cgi->a({-href => $target}, "$nav");
	}

	print "<div class=\"page_nav\">\n" . join(" | ", @entries);
	print "<br/>\n$extra<br/>\n</div>\n";
}
4049
# returns a submenu for the navigation of the refs views (tags, heads,
# remotes) with the current view disabled and the remotes view only
# available if the feature is enabled
sub format_ref_views {
	my ($current) = @_;

	my @ref_views = ('tags', 'heads');
	if (gitweb_check_feature('remote_heads')) {
		push @ref_views, 'remotes';
	}

	my @entries;
	foreach my $view (@ref_views) {
		# the current view is shown as plain text, the others as links
		push @entries, $view eq $current
			? $view
			: $cgi->a({-href => href(action=>$view)}, $view);
	}
	return join " | ", @entries;
}
4062
# Return the "first . prev . next" paging navigation as an HTML string.
# "first"/"prev" are links only past page 0, "next" only when
# $has_next_link is true.  The first parameter is accepted but not used.
sub format_paging_nav {
	my ($action, $page, $has_next_link) = @_;

	my $backward = $page > 0
		? $cgi->a({-href => href(-replay=>1, page=>undef)}, "first") .
		  " &sdot; " .
		  $cgi->a({-href => href(-replay=>1, page=>$page-1),
		           -accesskey => "p", -title => "Alt-p"}, "prev")
		: "first &sdot; prev";

	my $forward = $has_next_link
		? $cgi->a({-href => href(-replay=>1, page=>$page+1),
		           -accesskey => "n", -title => "Alt-n"}, "next")
		: "next";

	return $backward . " &sdot; " . $forward;
}
4088
4089 ## ......................................................................
4090 ## functions printing or outputting HTML: div
4091
# Print a <div class="header"> holding one link to the given action.
# $title is used as the link text as-is; when it is false the action name
# is shown instead.  $hash and $hash_base are added to the link only when
# true.
sub git_print_header_div {
	my ($action, $title, $hash, $hash_base) = @_;

	my %args = ('action' => $action);
	$args{'hash'} = $hash if $hash;
	$args{'hash_base'} = $hash_base if $hash_base;

	my $link_text = $title || $action;
	my $link = $cgi->a({-href => href(%args), -class => "title"}, $link_text);
	print "<div class=\"header\">\n" . $link . "\n</div>\n";
}
4105
# Return one "metadata_url" table row with $name in the first cell and
# $url in the second.  Both values are inserted as given (no escaping).
sub format_repo_url {
	my ($name, $url) = @_;
	return join('',
		'<tr class="metadata_url">',
		"<td>$name</td>",
		"<td>$url</td>",
		"</tr>\n");
}
4110
4111 # Group output by placing it in a DIV element and adding a header.
4112 # Options for start_div() can be provided by passing a hash reference as the
4113 # first parameter to the function.
4114 # Options to git_print_header_div() can be provided by passing an array
4115 # reference. This must follow the options to start_div if they are present.
4116 # The content can be a scalar, which is output as-is, a scalar reference, which
4117 # is output after html escaping, an IO handle passed either as *handle or
4118 # *handle{IO}, or a function reference. In the latter case all following
4119 # parameters will be taken as argument to the content function call.
# Print a DIV with a header and some content.
#
# Arguments, in order:
#   optional hash ref  - options for $cgi->start_div()
#   optional array ref - arguments for git_print_header_div()
#   content            - one of:
#       code ref    : called with all remaining arguments
#       scalar ref  : printed after HTML escaping
#       IO handle   : given as \*handle, *handle or *handle{IO} (or any
#                     IO::Handle object); everything read from it is printed
#       plain scalar: printed as-is
sub git_print_section {
	my ($div_args, $header_args, $content);
	my $arg = shift;
	if (ref($arg) eq 'HASH') {
		$div_args = $arg;
		$arg = shift;
	}
	if (ref($arg) eq 'ARRAY') {
		$header_args = $arg;
		$arg = shift;
	}
	$content = $arg;

	print $cgi->start_div($div_args);
	git_print_header_div(@$header_args);

	# A bare typeglob (*handle) is not a reference, so it has to be
	# recognized through a reference to the variable holding it.
	# *handle{IO} yields an object whose class depends on the perl version
	# (IO::Handle or a subclass such as IO::File), hence the isa() check
	# instead of an exact class name comparison.
	my $is_handle = ref($content) eq 'GLOB'
		|| ref(\$content) eq 'GLOB'
		|| (ref($content) && UNIVERSAL::isa($content, 'IO::Handle'));

	if (ref($content) eq 'CODE') {
		$content->(@_);
	} elsif (ref($content) eq 'SCALAR') {
		print esc_html($$content);
	} elsif ($is_handle) {
		print <$content>;
	} elsif (!ref($content) && defined($content)) {
		print $content;
	}

	print $cgi->end_div;
}
4148
# Return HTML for a parsed date: the 'rfc2822' string followed by the
# local time in parentheses.  $date is a hash ref with (at least) the keys
# rfc2822, hour_local, minute_local and tz_local.
sub format_timestamp_html {
	my ($date) = @_;

	my $strtime = $date->{'rfc2822'};
	# third value of the 'javascript-timezone' feature: CSS class used to
	# mark up the date, if any
	my (undef, undef, $datetime_class) =
		gitweb_get_feature('javascript-timezone');
	$strtime = qq!<span class="$datetime_class">$strtime</span>!
		if $datetime_class;

	my $local_hhmm = sprintf('%02d:%02d',
	                         $date->{'hour_local'}, $date->{'minute_local'});
	# local times before 06:00 get the "atnight" markup
	$local_hhmm = '<span class="atnight">' . $local_hhmm . '</span>'
		if ($date->{'hour_local'} < 6);

	return $strtime . ' ' . sprintf('(%s %s)', $local_hhmm, $date->{'tz_local'});
}
4169
4170 # Outputs the author name and date in long form
# Print the author name (as an author search link), the author date and
# the avatar of commit $co, wrapped in an element of class "author_date".
# Recognized option: -tag => element name to use (default 'div').
sub git_print_authorship {
	my ($co, %opts) = @_;
	my $tag = $opts{-tag} || 'div';
	my $author = $co->{'author_name'};

	my %ad = parse_date($co->{'author_epoch'}, $co->{'author_tz'});
	my $author_link = format_search_author($author, "author", esc_html($author));
	my $timestamp = format_timestamp_html(\%ad);
	my $avatar = git_get_avatar($co->{'author_email'}, -pad_before => 1);

	print "<$tag class=\"author_date\">" .
	      $author_link . " [" . $timestamp . "]" . $avatar .
	      "</$tag>\n";
}
4184
4185 # Outputs table rows containing the full author or committer information,
4186 # in the format expected for 'commit' view (& similar).
4187 # Parameters are a commit hash reference, followed by the list of people
4188 # to output information for. If the list is empty it defaults to both
4189 # author and committer.
# Print two table rows per person: name, e-mail and avatar in the first,
# the timestamp in the second.  Takes the commit hash ref followed by the
# list of people ('author', 'committer'); an empty list means both.
sub git_print_authorship_rows {
	my ($co, @people) = @_;
	@people = qw(author committer) unless @people;

	foreach my $who (@people) {
		my $name = $co->{"${who}_name"};
		my $email = $co->{"${who}_email"};
		my %wd = parse_date($co->{"${who}_epoch"}, $co->{"${who}_tz"});

		my $name_link = format_search_author($name, $who, esc_html($name));
		my $email_link = format_search_author($email, $who,
		                                      esc_html("<" . $email . ">"));
		my $avatar = git_get_avatar($email, -size => 'double');
		my $timestamp = format_timestamp_html(\%wd);

		# the avatar cell spans both rows
		print "<tr><td>$who</td><td>" . $name_link . " " . $email_link .
		      "</td><td rowspan=\"2\">" . $avatar . "</td></tr>\n" .
		      "<tr><td></td><td>" . $timestamp . "</td></tr>\n";
	}
}
4212
# Print the "[project] / dir / dir / file" path line of a page.
#
# $name - path of the object within the tree (undef: only the root link)
# $type - 'blob' or 'tree' to make the last component a link to the
#         blob_plain or tree view; anything else prints it as plain text
# $hb   - hash base used for all generated links
sub git_print_page_path {
	my ($name, $type, $hb) = @_;

	print "<div class=\"page_path\">";
	print $cgi->a({-href => href(action=>"tree", hash_base=>$hb),
	              -title => 'tree root'}, to_utf8("[$project]"));
	print " / ";
	if (defined $name) {
		my @dirname = split '/', $name;
		my $basename = pop @dirname;
		my $fullname = '';

		# one link per leading directory, each pointing at its tree
		foreach my $dir (@dirname) {
			$fullname .= ($fullname ? '/' : '') . $dir;
			print $cgi->a({-href => href(action=>"tree", file_name=>$fullname,
			                             hash_base=>$hb),
			              -title => $fullname}, esc_path($dir));
			print " / ";
		}
		# The last component links to $name, the path this function was
		# asked to print, not to whatever the global $file_name holds.
		if (defined $type && $type eq 'blob') {
			print $cgi->a({-href => href(action=>"blob_plain", file_name=>$name,
			                             hash_base=>$hb),
			              -title => $name}, esc_path($basename));
		} elsif (defined $type && $type eq 'tree') {
			print $cgi->a({-href => href(action=>"tree", file_name=>$name,
			                             hash_base=>$hb),
			              -title => $name}, esc_path($basename));
			print " / ";
		} else {
			print esc_path($basename);
		}
	}
	print "<br/></div>\n";
}
4250
# Print a commit message as HTML, one "<br/>"-terminated line per log line.
#
# $log is an array ref of lines; note that it is modified (leading lines
# are shifted off).  Options:
#   -remove_title     => drop the first line of the log
#   -remove_signoff   => drop signoff-like lines instead of marking them up
#   -final_empty_line => make sure the output ends with an empty line
#
# Runs of empty lines are collapsed into one, and empty lines directly
# after a printed signoff line are dropped.
sub git_print_log {
	my $log = shift;
	my %opts = @_;

	if ($opts{'-remove_title'}) {
		# remove title, i.e. first line of log
		shift @$log;
	}
	# remove leading empty lines
	while (defined $log->[0] && $log->[0] eq "") {
		shift @$log;
	}

	# print log
	my $after_signoff = 0; # last printed line was a signoff line
	my $empty = 0;         # last printed line was an empty line
	foreach my $line (@$log) {
		if ($line =~ m/^ *(signed[ \-]off[ \-]by[ :]|acked[ \-]by[ :]|cc[ :])/i) {
			if (! $opts{'-remove_signoff'}) {
				print "<span class=\"signoff\">" . esc_html($line) . "</span><br/>\n";
				$after_signoff = 1;
				$empty = 0;
			}
			# a removed signoff line leaves both flags untouched, so
			# empty lines around it still collapse into a single one
			next;
		}

		# print only one empty line
		# do not print empty line after signoff
		if ($line eq "") {
			next if ($empty || $after_signoff);
			$empty = 1;
		} else {
			$empty = 0;
			# only real text ends the "after signoff" state; resetting it
			# earlier would let the empty line after a signoff through
			$after_signoff = 0;
		}

		print format_log_line_html($line) . "<br/>\n";
	}

	if ($opts{'-final_empty_line'}) {
		# end with single empty line
		print "<br/>\n" unless $empty;
	}
}
4299
4300 # return link target (what link points to)
# Return the contents of blob $hash (for a symlink entry this is the link
# target), read via "git cat-file blob".  Returns nothing if the command
# cannot be started or if closing the pipe reports a failure.
sub git_get_link_target {
	my ($hash) = @_;

	# read link
	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or return;
	# slurp the whole output at once
	my $link_target = do { local $/ = undef; <$fd> };
	return unless close $fd;

	return $link_target;
}
4317
4318 # given link target, and the directory (basedir) the link is in,
4319 # return target of link relative to top directory (top tree);
4320 # return undef if it is not possible (including absolute links).
# Given a link target and the directory ($basedir) the link is in, return
# the target as a path relative to the top tree, with '', '.' and '..'
# components resolved.  Returns nothing (undef in scalar context) for
# absolute targets and for targets that lead outside the top tree.
sub normalize_link_target {
	my ($link_target, $basedir) = @_;

	# absolute symlinks (beginning with '/') cannot be normalized
	return if (substr($link_target, 0, 1) eq '/');

	# normalize link target to path from top (root) tree (dir);
	# an undefined or empty $basedir means we are in the top tree.
	# Compare against '' rather than testing truth, so that a directory
	# named "0" is not mistaken for the top tree.
	my $path = (defined $basedir && $basedir ne '')
		? $basedir . '/' . $link_target
		: $link_target;

	# remove //, /./, and /../
	my @path_parts;
	foreach my $part (split('/', $path)) {
		# discard '.' and '' (but keep components such as "0")
		next if ($part eq '' || $part eq '.');
		if ($part eq '..') {
			# link leads outside repository (outside top dir)
			return unless @path_parts;
			pop @path_parts;
		} else {
			push @path_parts, $part;
		}
	}

	return join('/', @path_parts);
}
4357
4358 # print tree entry (row of git_tree), but without encompassing <tr> element
# Print the cells of one tree listing row (without the enclosing <tr>):
# mode, optional size, name, and the action links.
#
# $t          - hash ref describing the entry (mode, type, hash, name and
#               optionally size)
# $basedir    - prefix put in front of the entry name to build file_name
# $hash_base  - hash base for the generated links, if known
# $have_blame - true to add a "blame" link for blobs
sub git_print_tree_entry {
	my ($t, $basedir, $hash_base, $have_blame) = @_;

	my %base_key = defined $hash_base ? ('hash_base' => $hash_base) : ();
	my $type = $t->{'type'};
	my $entry_hash = $t->{'hash'};
	my $entry_path = "$basedir$t->{'name'}";

	# The format of a table row is: mode list link.  Where mode is
	# the mode of the entry, list is the name of the entry, an href,
	# and link is the action links of the entry.

	print "<td class=\"mode\">" . mode_str($t->{'mode'}) . "</td>\n";
	print "<td class=\"size\">$t->{'size'}</td>\n"
		if exists $t->{'size'};

	if ($type eq "blob") {
		print "<td class=\"list\">" .
			$cgi->a({-href => href(action=>"blob", hash=>$entry_hash,
			                       file_name=>$entry_path, %base_key),
			        -class => "list"}, esc_path($t->{'name'}));
		if (S_ISLNK(oct $t->{'mode'})) {
			# symbolic link: also show where it points to
			my $link_target = git_get_link_target($entry_hash);
			if ($link_target) {
				my $norm_target = normalize_link_target($link_target, $basedir);
				# only targets that resolve inside the tree become links
				print " -> " .
				      (defined $norm_target
				       ? $cgi->a({-href => href(action=>"object", hash_base=>$hash_base,
				                                file_name=>$norm_target),
				                  -title => $norm_target}, esc_path($link_target))
				       : esc_path($link_target));
			}
		}
		print "</td>\n";

		my @links;
		push @links, $cgi->a({-href => href(action=>"blob", hash=>$entry_hash,
		                                    file_name=>$entry_path, %base_key)},
		                     "blob");
		push @links, $cgi->a({-href => href(action=>"blame", hash=>$entry_hash,
		                                    file_name=>$entry_path, %base_key)},
		                     "blame")
			if $have_blame;
		push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
		                                    hash=>$entry_hash, file_name=>$entry_path)},
		                     "history")
			if defined $hash_base;
		push @links, $cgi->a({-href => href(action=>"blob_plain", hash_base=>$hash_base,
		                                    file_name=>$entry_path)},
		                     "raw");
		print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

	} elsif ($type eq "tree") {
		print "<td class=\"list\">" .
		      $cgi->a({-href => href(action=>"tree", hash=>$entry_hash,
		                             file_name=>$entry_path,
		                             %base_key)},
		              esc_path($t->{'name'})) .
		      "</td>\n";

		my @links;
		push @links, $cgi->a({-href => href(action=>"tree", hash=>$entry_hash,
		                                    file_name=>$entry_path,
		                                    %base_key)},
		                     "tree");
		push @links, $cgi->a({-href => href(action=>"history", hash_base=>$hash_base,
		                                    file_name=>$entry_path)},
		                     "history")
			if defined $hash_base;
		print "<td class=\"link\">" . join(" | ", @links) . "</td>\n";

	} else {
		# unknown object: we can only present history for it
		# (this includes 'commit' object, i.e. submodule support)
		print "<td class=\"list\">" .
		      esc_path($t->{'name'}) .
		      "</td>\n";
		print "<td class=\"link\">";
		print $cgi->a({-href => href(action=>"history",
		                             hash_base=>$hash_base,
		                             file_name=>$entry_path)},
		              "history")
			if defined $hash_base;
		print "</td>\n";
	}
}
4450
4451 ## ......................................................................
4452 ## functions printing large fragments of HTML
4453
4454 # get pre-image filenames for merge (combined) diff
# Fill $diff->{'from_file'} for a combined (merge) diff: one slot per
# parent, holding the pre-image path for parents whose status is 'R' or
# 'C' and undef otherwise.  Returns $diff.
sub fill_from_file_info {
	my ($diff, @parents) = @_;
	my $nparents = $diff->{'nparents'};

	# start with a list that has one (undefined) slot per parent
	$diff->{'from_file'} = [ ];
	$diff->{'from_file'}[$nparents - 1] = undef;

	foreach my $i (0 .. $nparents - 1) {
		my $status = $diff->{'status'}[$i];
		next unless ($status eq 'R' || $status eq 'C');
		$diff->{'from_file'}[$i] =
			git_get_path_by_hash($parents[$i], $diff->{'from_id'}[$i]);
	}

	return $diff;
}
4470
4471 # is current raw difftree line of file deletion
# Return true if the parsed raw difftree line $diffinfo describes a file
# deletion, i.e. its 'to_id' is the all-zero object id.  Both the 40-digit
# (SHA-1) and the 64-digit (SHA-256) forms of the null id are recognized.
sub is_deleted {
	my $diffinfo = shift;
	my $to_id = $diffinfo->{'to_id'};

	return $to_id eq ('0' x 40) || $to_id eq ('0' x 64);
}
4477
4478 # does patch correspond to [previous] difftree raw line
4479 # $diffinfo  - hashref of parsed raw diff format
4480 # $patchinfo - hashref of parsed patch diff format
4481 #              (the same keys as in $diffinfo)
# Return true if both arguments are defined and name the same 'to_file',
# i.e. the patch belongs to the given raw difftree line.
sub is_patch_split {
	my ($diffinfo, $patchinfo) = @_;

	my $both_defined = defined $diffinfo && defined $patchinfo;
	return $both_defined unless $both_defined;

	return $diffinfo->{'to_file'} eq $patchinfo->{'to_file'};
}
4488
4489
# Print the "difftree" table: one row per changed file, with its status
# and links to related views.
#
# $difftree - arrayref of difftree entries; each one is passed through
#             parsed_difftree_line()
# $hash     - id of the commit being shown, used as hash_base for links
#             to the post-image side
# @parents  - parent commit ids; more than one parent selects the
#             combined (merge) diff layout, the first one is used as
#             hash_base for links to the pre-image side of ordinary diffs
#
# Reads the global $action: "patch" anchor links (and the combined diff
# table header) are emitted only in the 'commitdiff' view.
# Output goes to STDOUT; there is no meaningful return value.
sub git_difftree_body {
	my ($difftree, $hash, @parents) = @_;
	my ($parent) = $parents[0];
	my $have_blame = gitweb_check_feature('blame');
	print "<div class=\"list_head\">\n";
	if ($#{$difftree} > 10) {
		print(($#{$difftree} + 1) . " files changed:\n");
	}
	print "</div>\n";

	print "<table class=\"" .
	      (@parents > 1 ? "combined " : "") .
	      "diff_tree\">\n";

	# header only for combined diff in 'commitdiff' view
	my $has_header = @$difftree && @parents > 1 && $action eq 'commitdiff';
	if ($has_header) {
		# table header
		print "<thead><tr>\n" .
		       "<th></th><th></th>\n"; # filename, patchN link
		for (my $i = 0; $i < @parents; $i++) {
			my $par = $parents[$i];
			print "<th>" .
			      $cgi->a({-href => href(action=>"commitdiff",
			                             hash=>$hash, hash_parent=>$par),
			               -title => 'commitdiff to parent number ' .
			                          ($i+1) . ': ' . substr($par,0,7)},
			              $i+1) .
			      "&nbsp;</th>\n";
		}
		print "</tr></thead>\n<tbody>\n";
	}

	my $alternate = 1;
	# counts the "patch" anchors emitted so far (anchors are numbered from 1)
	my $patchno = 0;
	foreach my $line (@{$difftree}) {
		my $diff = parsed_difftree_line($line);

		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;

		if (exists $diff->{'nparents'}) { # combined diff

			fill_from_file_info($diff, @parents)
				unless exists $diff->{'from_file'};

			if (!is_deleted($diff)) {
				# file exists in the result (child) commit
				print "<td>" .
				      $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash),
				              -class => "list"}, esc_path($diff->{'to_file'})) .
				      "</td>\n";
			} else {
				print "<td>" .
				      esc_path($diff->{'to_file'}) .
				      "</td>\n";
			}

			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print "<td class=\"link\">" .
				      $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | " .
				      "</td>\n";
			}

			# one cell per parent; meanwhile note whether the file existed
			# in any parent and whether it still exists in the result
			my $has_history = 0;
			my $not_deleted = 0;
			for (my $i = 0; $i < $diff->{'nparents'}; $i++) {
				my $hash_parent = $parents[$i];
				my $from_hash = $diff->{'from_id'}[$i];
				my $from_path = $diff->{'from_file'}[$i];
				my $status = $diff->{'status'}[$i];

				$has_history ||= ($status ne 'A');
				$not_deleted ||= ($status ne 'D');

				if ($status eq 'A') {
					print "<td  class=\"link\" align=\"right\"> | </td>\n";
				} elsif ($status eq 'D') {
					print "<td class=\"link\">" .
					      $cgi->a({-href => href(action=>"blob",
					                             hash_base=>$hash,
					                             hash=>$from_hash,
					                             file_name=>$from_path)},
					              "blob" . ($i+1)) .
					      " | </td>\n";
				} else {
					if ($diff->{'to_id'} eq $from_hash) {
						print "<td class=\"link nochange\">";
					} else {
						print "<td class=\"link\">";
					}
					print $cgi->a({-href => href(action=>"blobdiff",
					                             hash=>$diff->{'to_id'},
					                             hash_parent=>$from_hash,
					                             hash_base=>$hash,
					                             hash_parent_base=>$hash_parent,
					                             file_name=>$diff->{'to_file'},
					                             file_parent=>$from_path)},
					              "diff" . ($i+1)) .
					      " | </td>\n";
				}
			}

			print "<td class=\"link\">";
			if ($not_deleted) {
				print $cgi->a({-href => href(action=>"blob",
				                             hash=>$diff->{'to_id'},
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "blob");
				print " | " if ($has_history);
			}
			if ($has_history) {
				print $cgi->a({-href => href(action=>"history",
				                             file_name=>$diff->{'to_file'},
				                             hash_base=>$hash)},
				              "history");
			}
			print "</td>\n";

			print "</tr>\n";
			next; # instead of 'else' clause, to avoid extra indent
		}
		# else ordinary diff

		# an all-zero mode means that side does not exist (creation or
		# deletion); the corresponding variables then stay undefined
		my ($to_mode_oct, $to_mode_str, $to_file_type);
		my ($from_mode_oct, $from_mode_str, $from_file_type);
		if ($diff->{'to_mode'} ne ('0' x 6)) {
			$to_mode_oct = oct $diff->{'to_mode'};
			if (S_ISREG($to_mode_oct)) { # only for regular file
				$to_mode_str = sprintf("%04o", $to_mode_oct & 0777); # permission bits
			}
			$to_file_type = file_type($diff->{'to_mode'});
		}
		if ($diff->{'from_mode'} ne ('0' x 6)) {
			$from_mode_oct = oct $diff->{'from_mode'};
			if (S_ISREG($from_mode_oct)) { # only for regular file
				$from_mode_str = sprintf("%04o", $from_mode_oct & 0777); # permission bits
			}
			$from_file_type = file_type($diff->{'from_mode'});
		}

		if ($diff->{'status'} eq "A") { # created
			my $mode_chng = "<span class=\"file_status new\">[new $to_file_type";
			$mode_chng   .= " with mode: $to_mode_str" if $to_mode_str;
			$mode_chng   .= "]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			              "blob");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "D") { # deleted
			# the file exists only in the parent, so links use $parent as base
			my $mode_chng = "<span class=\"file_status deleted\">[deleted $from_file_type]</span>";
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'}),
			               -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chng</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'from_id'},
			                             hash_base=>$parent, file_name=>$diff->{'file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$parent,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "M" || $diff->{'status'} eq "T") { # modified, or type changed
			my $mode_chnge = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				$mode_chnge = "<span class=\"file_status mode_chnge\">[changed";
				if ($from_file_type ne $to_file_type) {
					$mode_chnge .= " from $from_file_type to $to_file_type";
				}
				if (($from_mode_oct & 0777) != ($to_mode_oct & 0777)) {
					if ($from_mode_str && $to_mode_str) {
						$mode_chnge .= " mode: $from_mode_str->$to_mode_str";
					} elsif ($to_mode_str) {
						$mode_chnge .= " mode: $to_mode_str";
					}
				}
				$mode_chnge .= "]</span>\n";
			}
			print "<td>";
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'}),
			              -class => "list"}, esc_path($diff->{'file'}));
			print "</td>\n";
			print "<td>$mode_chnge</td>\n";
			print "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only mode changed)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'file'})},
				              "diff") .
				      " | ";
			}
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'file'})},
			               "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                             file_name=>$diff->{'file'})},
			              "history");
			print "</td>\n";

		} elsif ($diff->{'status'} eq "R" || $diff->{'status'} eq "C") { # renamed or copied
			my %status_name = ('R' => 'moved', 'C' => 'copied');
			my $nstatus = $status_name{$diff->{'status'}};
			my $mode_chng = "";
			if ($diff->{'from_mode'} != $diff->{'to_mode'}) {
				# mode also for directories, so we cannot use $to_mode_str
				$mode_chng = sprintf(", mode: %04o", $to_mode_oct & 0777);
			}
			print "<td>" .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$hash,
			                             hash=>$diff->{'to_id'}, file_name=>$diff->{'to_file'}),
			              -class => "list"}, esc_path($diff->{'to_file'})) . "</td>\n" .
			      "<td><span class=\"file_status $nstatus\">[$nstatus from " .
			      $cgi->a({-href => href(action=>"blob", hash_base=>$parent,
			                             hash=>$diff->{'from_id'}, file_name=>$diff->{'from_file'}),
			              -class => "list"}, esc_path($diff->{'from_file'})) .
			      " with " . (int $diff->{'similarity'}) . "% similarity$mode_chng]</span></td>\n" .
			      "<td class=\"link\">";
			if ($action eq 'commitdiff') {
				# link to patch
				$patchno++;
				print $cgi->a({-href => href(-anchor=>"patch$patchno")},
				              "patch") .
				      " | ";
			} elsif ($diff->{'to_id'} ne $diff->{'from_id'}) {
				# "commit" view and modified file (not only pure rename or copy)
				print $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$diff->{'to_id'}, hash_parent=>$diff->{'from_id'},
				                             hash_base=>$hash, hash_parent_base=>$parent,
				                             file_name=>$diff->{'to_file'}, file_parent=>$diff->{'from_file'})},
				              "diff") .
				      " | ";
			}
			# post-image blob: 'to_file' lives in the result commit ($hash);
			# under a rename/copy that path need not exist in $parent at all
			print $cgi->a({-href => href(action=>"blob", hash=>$diff->{'to_id'},
			                             hash_base=>$hash, file_name=>$diff->{'to_file'})},
			              "blob") . " | ";
			if ($have_blame) {
				print $cgi->a({-href => href(action=>"blame", hash_base=>$hash,
				                             file_name=>$diff->{'to_file'})},
				              "blame") . " | ";
			}
			print $cgi->a({-href => href(action=>"history", hash_base=>$hash,
			                            file_name=>$diff->{'to_file'})},
			              "history");
			print "</td>\n";

		} # we should not encounter Unmerged (U) or Unknown (X) status
		print "</tr>\n";
	}
	print "</tbody>" if $has_header;
	print "</table>\n";
}
4797
# Print a patchset (a sequence of patches) as HTML, pairing every patch
# read from $fd with its entry in the raw difftree.
#
# $fd           - filehandle to read the patch output from; lines before
#                 the first "diff " line are skipped
# $difftree     - arrayref of difftree entries; each one is passed through
#                 parsed_difftree_line()
# $hash         - accepted for the callers' sake, not used in this function
# @hash_parents - parent commit ids; more than one means combined diff
#
# Every difftree entry gets a <div class="patch" id="patchN"> (N counted
# from 1) so that "patch" links from the difftree table have a target;
# entries without a patch of their own are rendered with
# format_diff_cc_simplified().
# Output goes to STDOUT; there is no meaningful return value.
sub git_patchset_body {
	my ($fd, $difftree, $hash, @hash_parents) = @_;

	my $is_combined = (@hash_parents > 1);
	my $patch_idx = 0;      # index into @$difftree of the current raw line
	my $patch_number = 0;   # number of patch <div>s accounted for so far
	my $patch_line;
	my $diffinfo;
	my $to_name;
	my (%from, %to);

	print "<div class=\"patchset\">\n";

	# skip to first patch
	while ($patch_line = <$fd>) {
		chomp $patch_line;

		last if ($patch_line =~ m/^diff /);
	}

	# On entry to each iteration $patch_line holds a chomped "diff ..."
	# header line; it is false once the input is exhausted.
	# NOTE: the 'continue' block closes the patch <div> after 'next PATCH'
	# and after falling off the end of the body, but not after 'last PATCH'.
 PATCH:
	while ($patch_line) {

		# parse "git diff" header line
		if ($patch_line =~ m/^diff --git (\"(?:[^\\\"]*(?:\\.[^\\\"]*)*)\"|[^ "]*) (.*)$/) {
			# $1 is from_name, which we do not use
			$to_name = unquote($2);
			$to_name =~ s!^b/!!;
		} elsif ($patch_line =~ m/^diff --(cc|combined) ("?.*"?)$/) {
			# $1 is 'cc' or 'combined', which we do not use
			$to_name = unquote($2);
		} else {
			$to_name = undef;
		}

		# check if current patch belong to current raw line
		# and parse raw git-diff line if needed
		if (is_patch_split($diffinfo, { 'to_file' => $to_name })) {
			# this is continuation of a split patch
			print "<div class=\"patch cont\">\n";
		} else {
			# advance raw git-diff output if needed
			$patch_idx++ if defined $diffinfo;

			# read and prepare patch information
			$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

			# compact combined diff output can have some patches skipped
			# find which patch (using pathname of result) we are at now;
			if ($is_combined) {
				while ($to_name ne $diffinfo->{'to_file'}) {
					print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
					      format_diff_cc_simplified($diffinfo, @hash_parents) .
					      "</div>\n";  # class="patch"

					$patch_idx++;
					$patch_number++;

					last if $patch_idx > $#$difftree;
					$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);
				}
			}

			# modifies %from, %to hashes
			parse_from_to_diffinfo($diffinfo, \%from, \%to, @hash_parents);

			# this is first patch for raw difftree line with $patch_idx index
			# we index @$difftree array from 0, but number patches from 1
			print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n";
		}

		# git diff header
		#assert($patch_line =~ m/^diff /) if DEBUG;
		#assert($patch_line !~ m!$/$!) if DEBUG; # is chomp-ed
		$patch_number++;
		# print "git diff" header
		print format_git_diff_header_line($patch_line, $diffinfo,
		                                  \%from, \%to);

		# print extended diff header
		print "<div class=\"diff extended_header\">\n";
	EXTENDED_HEADER:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			last EXTENDED_HEADER if ($patch_line =~ m/^--- |^diff /);

			print format_extended_diff_header_line($patch_line, $diffinfo,
			                                       \%from, \%to);
		}
		print "</div>\n"; # class="diff extended_header"

		# from-file/to-file diff header
		if (! $patch_line) {
			print "</div>\n"; # class="patch"
			last PATCH;
		}
		next PATCH if ($patch_line =~ m/^diff /);
		#assert($patch_line =~ m/^---/) if DEBUG;

		my $last_patch_line = $patch_line;
		$patch_line = <$fd>;
		if (defined $patch_line) {
			chomp $patch_line;
		} else {
			# input ended right after the "---" line: use an empty
			# to-file line instead of handing undef to chomp and to the
			# header formatter; the loops below then terminate at once
			$patch_line = '';
		}
		#assert($patch_line =~ m/^\+\+\+/) if DEBUG;

		print format_diff_from_to_header($last_patch_line, $patch_line,
		                                 $diffinfo, \%from, \%to,
		                                 @hash_parents);

		# the patch itself
	LINE:
		while ($patch_line = <$fd>) {
			chomp $patch_line;

			next PATCH if ($patch_line =~ m/^diff /);

			print format_diff_line($patch_line, \%from, \%to);
		}

	} continue {
		print "</div>\n"; # class="patch"
	}

	# for compact combined (--cc) format, with chunk and patch simplification
	# the patchset might be empty, but there might be unprocessed raw lines
	for (++$patch_idx if $patch_number > 0;
	     $patch_idx < @$difftree;
	     ++$patch_idx) {
		# read and prepare patch information
		$diffinfo = parsed_difftree_line($difftree->[$patch_idx]);

		# generate anchor for "patch" links in difftree / whatchanged part
		print "<div class=\"patch\" id=\"patch". ($patch_idx+1) ."\">\n" .
		      format_diff_cc_simplified($diffinfo, @hash_parents) .
		      "</div>\n";  # class="patch"

		$patch_number++;
	}

	if ($patch_number == 0) {
		if (@hash_parents > 1) {
			print "<div class=\"diff nodifferences\">Trivial merge</div>\n";
		} else {
			print "<div class=\"diff nodifferences\">No differences found</div>\n";
		}
	}

	print "</div>\n"; # class="patchset"
}
4948
4949 # . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . . .
4950
# Fill in per-project information (age, description, owner, ctags,
# category) for each project in the list.
# Projects for which git_get_last_activity() returns nothing are left out
# of the returned list.
# NOTE: modifies the entries of $projlist in place, but does not remove
# any entries from $projlist itself
sub fill_project_list_info {
	my $projlist = shift;
	my @filled;

	my $with_ctags = gitweb_check_feature('ctags');
 PROJECT:
	foreach my $pr (@$projlist) {
		my (@activity) = git_get_last_activity($pr->{'path'});
		next PROJECT unless @activity;
		@{$pr}{'age', 'age_string'} = @activity;

		# fill in only what the project entry does not provide already
		unless (defined $pr->{'descr'}) {
			my $long_descr = git_get_project_description($pr->{'path'}) || "";
			$long_descr = to_utf8($long_descr);
			$pr->{'descr_long'} = $long_descr;
			$pr->{'descr'} = chop_str($long_descr, $projects_list_description_width, 5);
		}
		unless (defined $pr->{'owner'}) {
			$pr->{'owner'} = git_get_project_owner("$pr->{'path'}") || "";
		}
		$pr->{'ctags'} = git_get_project_ctags($pr->{'path'})
			if $with_ctags;
		if ($projects_list_group_categories && !defined $pr->{'category'}) {
			my $category = git_get_project_category($pr->{'path'}) ||
			               $project_list_default_category;
			$pr->{'category'} = to_utf8($category);
		}

		push @filled, $pr;
	}

	return @filled;
}
4990
# Return the projects from $projlist (arrayref of project hashrefs)
# sorted according to $order: 'project', 'descr' and 'owner' compare the
# respective field as strings, 'age' compares numerically.
# Any other $order returns the list in its original order.
sub sort_projects_list {
	my ($projlist, $order) = @_;

	# name of sort order => field to compare and kind of comparison
	my %order_info = (
		'project' => { 'key' => 'path',       'type' => 'str' },
		'descr'   => { 'key' => 'descr_long', 'type' => 'str' },
		'owner'   => { 'key' => 'owner',      'type' => 'str' },
		'age'     => { 'key' => 'age',        'type' => 'num' },
	);
	my $oi = $order_info{$order};
	return @$projlist unless defined $oi;

	my $field     = $oi->{'key'};
	my $by_string = ($oi->{'type'} eq 'str');
	my @sorted = sort {
		$by_string ? $a->{$field} cmp $b->{$field}
		           : $a->{$field} <=> $b->{$field}
	} @$projlist;

	return @sorted;
}
5011
# Group projects by their 'category'.
#
# $projlist  - arrayref of project hashrefs
# $from, $to - optional inclusive range of indices into $projlist;
#              $from defaults to 0, $to is limited to the last index
#
# Returns a hash (in list context) or a hashref (in scalar context) that
# maps each category to an arrayref of the projects belonging to it,
# in list order.
sub build_projlist_by_category {
	my ($projlist, $from, $to) = @_;
	my $last_idx = $#$projlist;
	my %categories;

	$from = 0 unless defined $from;
	$to = $last_idx if (!defined $to || $last_idx < $to);

	foreach my $idx ($from .. $to) {
		my $pr = $projlist->[$idx];
		push @{ $categories{ $pr->{'category'} } }, $pr;
	}

	return wantarray ? %categories : \%categories;
}
5028
# Print the 'sort by' <th> element produced by format_sort_th(), which
# is a 'sort by $name' replay link unless that order is already selected.
# Takes the same arguments as format_sort_th().
sub print_sort_th {
	my @th_args = @_;

	print format_sort_th(@th_args);
}
5034
# Return the HTML for a 'sort by' <th> element.
#
# $name   - name of the sort order this column stands for
# $order  - currently selected sort order
# $header - column title; defaults to $name with its first letter in
#           upper case
#
# The title is plain text if $order is already $name, otherwise it is a
# link replaying the current view with order=$name.
sub format_sort_th {
	my ($name, $order, $header) = @_;
	$header ||= ucfirst($name);

	my $cell = ($order eq $name)
		? $header
		: $cgi->a({-href => href(-replay=>1, order=>$name),
		           -class => "header"}, $header);

	return "<th>" . $cell . "</th>\n";
}
5051
# Print the table rows (<tr> elements) of the projects list.
#
# $projlist    - arrayref of project hashrefs; reads 'path', 'descr',
#                'descr_long', 'owner', 'age', 'age_string' and 'forks'
# $from, $to   - optional inclusive range of indices into $projlist;
#                $from defaults to 0, $to is limited to the last index
# $check_forks - if true, each row starts with an extra cell holding the
#                forks marker
#
# Output goes to STDOUT; there is no meaningful return value.
sub git_project_list_rows {
	my ($projlist, $from, $to, $check_forks) = @_;
	my $last_idx = $#$projlist;

	$from = 0 unless defined $from;
	$to = $last_idx if (!defined $to || $last_idx < $to);

	my $alternate = 1;
	foreach my $idx ($from .. $to) {
		my $pr    = $projlist->[$idx];
		my $path  = $pr->{'path'};
		my $forks = $pr->{'forks'};

		# rows alternate between "dark" and "light", starting with "dark"
		my $row_class = $alternate ? "dark" : "light";
		print "<tr class=\"$row_class\">\n";
		$alternate ^= 1;

		if ($check_forks) {
			print "<td>";
			if ($forks) {
				my $nforks = scalar @{$forks};
				my $title  = "$nforks forks";
				if ($nforks > 0) {
					print $cgi->a({-href => href(project=>$path, action=>"forks"),
					               -title => $title}, "+");
				} else {
					print $cgi->span({-title => $title}, "+");
				}
			}
			print "</td>\n";
		}

		# project name, description and owner
		my $name_cell = $cgi->a({-href => href(project=>$path, action=>"summary"),
		                         -class => "list"}, esc_html($path));
		my $descr_cell = $cgi->a({-href => href(project=>$path, action=>"summary"),
		                          -class => "list", -title => $pr->{'descr_long'}},
		                         esc_html($pr->{'descr'}));
		my $owner_cell = chop_and_escape_str($pr->{'owner'}, 15);
		print "<td>" . $name_cell . "</td>\n" .
		      "<td>" . $descr_cell . "</td>\n" .
		      "<td><i>" . $owner_cell . "</i></td>\n";

		# age and per-project navigation links
		my $age_class = age_class($pr->{'age'});
		my $age_text  = defined $pr->{'age_string'} ? $pr->{'age_string'} : "No commits";
		my @links;
		foreach my $act (qw(summary shortlog log tree)) {
			push @links, scalar $cgi->a({-href => href(project=>$path, action=>$act)}, $act);
		}
		if ($forks) {
			push @links, scalar $cgi->a({-href => href(project=>$path, action=>"forks")}, "forks");
		}
		print "<td class=\"" . $age_class . "\">" . $age_text . "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
}
5100
# Print the projects table, preceded by the content-tag cloud when the
# 'ctags' feature is enabled.
#   $projlist  - reference to the list of project info hashes to show
#   $order     - sort order; falls back to $default_projects_order when false
#   $from, $to - inclusive window into the filtered list; $from defaults
#                to 0 and $to is clamped to the last index
#   $extra     - if defined, markup for a final row spanning the table
#   $no_header - when true, the row of sortable column headers is omitted
# Reads the globals $cgi, $searchtext, $default_projects_order and
# $projects_list_group_categories.  Prints a "No such projects found"
# notice and returns early when the window is empty after filtering.
sub git_project_list_body {
	my ($projlist, $order, $from, $to, $extra, $no_header) = @_;
	my @projects = @$projlist;

	my $check_forks = gitweb_check_feature('forks');
	my $show_ctags  = gitweb_check_feature('ctags');
	my $tagfilter = $show_ctags ? $cgi->param('by_tag') : undef;
	# the fork column is not shown while searching or filtering by tag
	$check_forks = undef
		if ($tagfilter || $searchtext);

	# filtering out forks before filling info allows to do less work
	@projects = filter_forks_from_projects_list(\@projects)
		if ($check_forks);
	@projects = fill_project_list_info(\@projects);
	# searching projects require filling to be run before it
	@projects = search_projects_list(\@projects,
	                                 'searchtext' => $searchtext,
	                                 'tagfilter'  => $tagfilter)
		if ($tagfilter || $searchtext);

	$order ||= $default_projects_order;
	$from = 0 unless defined $from;
	$to = $#projects if (!defined $to || $#projects < $to);

	# short circuit
	if ($from > $to) {
		print "<center>\n".
		      "<b>No such projects found</b><br />\n".
		      "Click ".$cgi->a({-href=>href(project=>undef)},"here")." to view all projects<br />\n".
		      "</center>\n<br />\n";
		return;
	}

	@projects = sort_projects_list(\@projects, $order);

	if ($show_ctags) {
		my $ctags = git_gather_all_ctags(\@projects);
		my $cloud = git_populate_project_tagcloud($ctags);
		print git_show_project_tagcloud($cloud, 64);
	}

	print "<table class=\"project_list\">\n";
	unless ($no_header) {
		print "<tr>\n";
		if ($check_forks) {
			print "<th></th>\n";
		}
		print_sort_th('project', $order, 'Project');
		print_sort_th('descr', $order, 'Description');
		print_sort_th('owner', $order, 'Owner');
		print_sort_th('age', $order, 'Last Change');
		print "<th></th>\n" . # for links
		      "</tr>\n";
	}

	if ($projects_list_group_categories) {
		# only display categories with projects in the $from-$to window
		@projects = sort {$a->{'category'} cmp $b->{'category'}} @projects[$from..$to];
		# @projects now holds just the window, re-indexed from 0, so the
		# grouping helper must be given the bounds of the sliced list and
		# not the original $from/$to offsets
		my %categories = build_projlist_by_category(\@projects, 0, $#projects);
		foreach my $cat (sort keys %categories) {
			unless ($cat eq "") {
				print "<tr>\n";
				if ($check_forks) {
					print "<td></td>\n";
				}
				print "<td class=\"category\" colspan=\"5\">".esc_html($cat)."</td>\n";
				print "</tr>\n";
			}

			git_project_list_rows($categories{$cat}, undef, undef, $check_forks);
		}
	} else {
		git_project_list_rows(\@projects, $from, $to, $check_forks);
	}

	if (defined $extra) {
		print "<tr>\n";
		if ($check_forks) {
			print "<td></td>\n";
		}
		print "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5187
# Print the 'log' view entries for commits $from..$to of @$commitlist.
#   $commitlist - reference to an array of parsed commit hashes; the keys
#                 read here are 'id', 'age_string', 'title' and 'comment'
#   $from, $to  - inclusive index window; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $refs       - passed to format_ref_marker() to decorate each commit
#   $extra      - when true, markup printed in a trailing "page_nav" div
# Empty commit hashes are skipped.
sub git_log_body {
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $#{$commitlist} < $to);

	# start at $from: the window's lower bound used to be ignored here
	for (my $i = $from; $i <= $to; $i++) {
		my %co = %{$commitlist->[$i]};
		next if !%co;
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);
		git_print_header_div('commit',
		               "<span class=\"age\">$co{'age_string'}</span>" .
		               esc_html($co{'title'}) . $ref,
		               $commit);
		print "<div class=\"title_text\">\n" .
		      "<div class=\"log_link\">\n" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit") .
		      " | " .
		      $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff") .
		      " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree") .
		      "<br/>\n" .
		      "</div>\n";
		git_print_authorship(\%co, -tag => 'span');
		print "<br/>\n</div>\n";

		print "<div class=\"log_body\">\n";
		git_print_log($co{'comment'}, -final_empty_line=> 1);
		print "</div>\n";
	}
	if ($extra) {
		print "<div class=\"page_nav\">\n";
		print "$extra\n";
		print "</div>\n";
	}
}
5226
# Print the 'shortlog' table for commits $from..$to of @$commitlist.
#   $commitlist - reference to an array of parsed commit hashes; the keys
#                 read here are 'id', 'age_string_age', 'age_string_date',
#                 'title' and 'title_short'
#   $from, $to  - inclusive index window; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $refs       - passed to format_ref_marker() to decorate each subject
#   $extra      - if defined, markup for a final row spanning four columns
sub git_shortlog_body {
	my ($commitlist, $from, $to, $refs, $extra) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} unless (defined $to && $to <= $#{$commitlist});

	print "<table class=\"shortlog\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# date and author cells, then the opening of the subject cell
		# git_summary() used print "<td><i>$co{'age_string'}</i></td>\n" .
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 10) . "<td>";
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		# action links; snapshot links are appended only when available
		my @links = (
			$cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
			$cgi->a({-href => href(action=>"tree", hash=>$commit, hash_base=>$commit)}, "tree"),
		);
		my $snapshot_links = format_snapshot_links($commit);
		push @links, $snapshot_links if defined $snapshot_links;

		print "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links) . "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5270
# Print the 'history' table for commits $from..$to of @$commitlist.
# Warning: assumes constant type (blob or tree) during history.
#   $commitlist - reference to an array of parsed commit hashes
#   $from, $to  - inclusive index window; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $refs       - passed to format_ref_marker() to decorate each subject
#   $extra      - if defined, markup for a final row spanning four columns
#   $file_name  - path whose history is being shown
#   $file_hash  - hash of the current version of the file, used for the
#                 "diff to current" link
#   $ftype      - object type, used both as link action and link text
# Also reads the global $hash_base for the "diff to current" link.
# Empty commit hashes are skipped.
sub git_history_body {
	my ($commitlist, $from, $to, $refs, $extra,
	    $file_name, $file_hash, $ftype) = @_;

	$from = 0 unless defined $from;
	$to = $#{$commitlist} if (!defined $to || $to > $#{$commitlist});

	print "<table class=\"history\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;

		my $commit = $co{'id'};
		my $ref = format_ref_marker($refs, $commit);

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# shortlog uses format_author_html('td', \%co, 10) here
		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 15, 3) . "<td>";
		# originally git_history used chop_str($co{'title'}, 50)
		print format_subject_html($co{'title'}, $co{'title_short'},
		                          href(action=>"commit", hash=>$commit), $ref);

		my $object_link = $cgi->a({-href => href(action=>$ftype, hash_base=>$commit, file_name=>$file_name)}, $ftype);
		my $commitdiff_link = $cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff");
		print "</td>\n" .
		      "<td class=\"link\">" .
		      $object_link . " | " . $commitdiff_link;

		if ($ftype eq 'blob') {
			# offer a diff only when this commit's blob differs from the current one
			my $blob_parent = git_get_hash_by_path($commit, $file_name);
			if (defined $file_hash && defined $blob_parent &&
			    $file_hash ne $blob_parent) {
				print " | " .
				      $cgi->a({-href => href(action=>"blobdiff",
				                             hash=>$file_hash, hash_parent=>$blob_parent,
				                             hash_base=>$hash_base, hash_parent_base=>$commit,
				                             file_name=>$file_name)},
				              "diff to current");
			}
		}
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"4\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5330
# Print the 'tags' table for entries $from..$to of @$taglist.
#   $taglist   - reference to an array of tag info hashes; the keys read
#                here are 'subject', 'age', 'name', 'id', 'type',
#                'reftype', 'refid' and 'fullname'
#   $from, $to - inclusive index window; $from defaults to 0 and $to is
#                clamped to the last index of the list
#   $extra     - if defined, markup for a final row spanning five columns
sub git_tags_body {
	my ($taglist, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$taglist} unless (defined $to && $to <= $#{$taglist});

	print "<table class=\"tags\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my $entry = $taglist->[$idx];
		my %tag = %$entry;
		my $subject = $tag{'subject'};
		my $subject_short = defined $subject ? chop_str($subject, 30, 5) : undef;

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		# age cell stays empty when the tag carries no age
		my $age_cell = "<td></td>\n";
		$age_cell = "<td><i>$tag{'age'}</i></td>\n" if defined $tag{'age'};
		print $age_cell;

		print "<td>" .
		      $cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'}),
		               -class => "list name"}, esc_html($tag{'name'})) .
		      "</td>\n" .
		      "<td>";
		if (defined $subject) {
			print format_subject_html($subject, $subject_short,
			                          href(action=>"tag", hash=>$tag{'id'}));
		}

		# only tag objects get a link to the tag itself
		print "</td>\n" .
		      "<td class=\"selflink\">";
		if ($tag{'type'} ne "tag") {
			print "&nbsp;";
		} else {
			print $cgi->a({-href => href(action=>"tag", hash=>$tag{'id'})}, "tag");
		}

		# links to the referenced object; the set depends on its type
		my @links = ($cgi->a({-href => href(action=>$tag{'reftype'}, hash=>$tag{'refid'})}, $tag{'reftype'}));
		if ($tag{'reftype'} eq "commit") {
			push @links,
				$cgi->a({-href => href(action=>"shortlog", hash=>$tag{'fullname'})}, "shortlog"),
				$cgi->a({-href => href(action=>"log", hash=>$tag{'fullname'})}, "log");
		} elsif ($tag{'reftype'} eq "blob") {
			push @links,
				$cgi->a({-href => href(action=>"blob_plain", hash=>$tag{'refid'})}, "raw");
		}
		print "</td>\n" .
		      "<td class=\"link\">" . " | " . join(" | ", @links) .
		      "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"5\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5393
# Print the 'heads' table for entries $from..$to of @$headlist.
#   $headlist  - reference to an array of head info hashes; the keys read
#                here are 'id', 'age', 'name' and 'fullname'
#   $head      - id of the current head; the matching row gets the
#                "current_head" class.  May be undef, in which case no
#                row is marked.
#   $from, $to - inclusive index window; $from defaults to 0 and $to is
#                clamped to the last index of the list
#   $extra     - if defined, markup for a final row spanning three columns
sub git_heads_body {
	my ($headlist, $head, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$headlist} if (!defined $to || $#{$headlist} < $to);

	print "<table class=\"heads\">\n";
	my $alternate = 1;
	for (my $i = $from; $i <= $to; $i++) {
		my $entry = $headlist->[$i];
		my %ref = %$entry;
		# guard against an undefined $head so that the comparison does
		# not emit an "uninitialized value" warning
		my $curr = defined $head && $ref{'id'} eq $head;
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td><i>$ref{'age'}</i></td>\n" .
		      ($curr ? "<td class=\"current_head\">" : "<td>") .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'}),
		               -class => "list name"},esc_html($ref{'name'})) .
		      "</td>\n" .
		      "<td class=\"link\">" .
		      $cgi->a({-href => href(action=>"shortlog", hash=>$ref{'fullname'})}, "shortlog") . " | " .
		      $cgi->a({-href => href(action=>"log", hash=>$ref{'fullname'})}, "log") . " | " .
		      $cgi->a({-href => href(action=>"tree", hash=>$ref{'fullname'}, hash_base=>$ref{'fullname'})}, "tree") .
		      "</td>\n" .
		      "</tr>";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5431
# Display a single remote block: a table with the remote's URLs followed
# by a table of its heads.
#   $remote - remote name, used for the "..." link to the 'remotes' action
#   $rdata  - hash reference with the keys 'heads', 'fetch' and 'push';
#             'fetch' and 'push' may each be undefined
#   $limit  - if defined and smaller than the number of heads, the heads
#             table ends with a "..." link
#   $head   - passed on to git_heads_body() to mark the current head
sub git_remote_block {
	my ($remote, $rdata, $limit, $head) = @_;

	my $heads = $rdata->{'heads'};
	my $fetch = $rdata->{'fetch'};
	my $push = $rdata->{'push'};

	my $urls_table = "<table class=\"projects_list\">\n" ;

	if (defined $fetch) {
		# a single "URL" row only when both URLs exist and are equal;
		# checking definedness first avoids comparing against undef
		if (defined $push && $fetch eq $push) {
			$urls_table .= format_repo_url("URL", $fetch);
		} else {
			$urls_table .= format_repo_url("Fetch URL", $fetch);
			$urls_table .= format_repo_url("Push URL", $push) if defined $push;
		}
	} elsif (defined $push) {
		$urls_table .= format_repo_url("Push URL", $push);
	} else {
		$urls_table .= format_repo_url("", "No remote URL");
	}

	$urls_table .= "</table>\n";

	my $dots;
	if (defined $limit && $limit < @$heads) {
		$dots = $cgi->a({-href => href(action=>"remotes", hash=>$remote)}, "...");
	}

	print $urls_table;
	git_heads_body($heads, $head, 0, $limit, $dots);
}
5465
# Display a list of remote names with the respective fetch and push URLs.
#   $remotedata - hash reference mapping remote name to a hash with the
#                 keys 'fetch' and 'push' (either may be undefined)
#   $limit      - when true and smaller than the number of remotes, only
#                 the first $limit names (in sorted order) are shown,
#                 followed by a "..." link to the 'remotes' action
sub git_remotes_list {
	my ($remotedata, $limit) = @_;
	print "<table class=\"heads\">\n";
	my $alternate = 1;
	my @remotes = sort keys %$remotedata;

	my $limited = $limit && $limit < @remotes;

	$#remotes = $limit - 1 if $limited;

	# iterate with foreach rather than "while (shift)": the latter stops
	# at the first name that is false in boolean context, such as "0"
	foreach my $remote (@remotes) {
		my $rdata = $remotedata->{$remote};
		my $fetch = $rdata->{'fetch'};
		my $push = $rdata->{'push'};
		if ($alternate) {
			print "<tr class=\"dark\">\n";
		} else {
			print "<tr class=\"light\">\n";
		}
		$alternate ^= 1;
		print "<td>" .
		      $cgi->a({-href=> href(action=>'remotes', hash=>$remote),
		               -class=> "list name"},esc_html($remote)) .
		      "</td>";
		# a missing URL is shown as plain text instead of a link
		print "<td class=\"link\">" .
		      (defined $fetch ? $cgi->a({-href=> $fetch}, "fetch") : "fetch") .
		      " | " .
		      (defined $push ? $cgi->a({-href=> $push}, "push") : "push") .
		      "</td>";

		print "</tr>\n";
	}

	if ($limited) {
		print "<tr>\n" .
		      "<td colspan=\"3\">" .
		      $cgi->a({-href => href(action=>"remotes")}, "...") .
		      "</td>\n" . "</tr>\n";
	}

	print "</table>";
}
5509
# Display remote heads grouped by remote, unless there are too many
# remotes, in which case we only display the remote names.
#   $remotedata - hash reference mapping remote name to remote data
#   $limit      - when true and smaller than the number of remotes, only
#                 the list of names is printed; otherwise it is passed on
#                 as the per-remote head limit
#   $head       - passed on to git_remote_block() to mark the current head
sub git_remotes_body {
	my ($remotedata, $limit, $head) = @_;
	if ($limit and $limit < keys %$remotedata) {
		git_remotes_list($remotedata, $limit);
	} else {
		fill_remote_heads($remotedata);
		# walk the remotes in sorted order, as git_remotes_list() does,
		# so that the page layout is stable between requests; this also
		# avoids depending on the hash's each() iterator while the
		# callbacks below run
		foreach my $remote (sort keys %$remotedata) {
			my $rdata = $remotedata->{$remote};
			git_print_section({-class=>"remote", -id=>$remote},
				["remotes", $remote, $remote], sub {
					git_remote_block($remote, $rdata, $limit, $head);
				});
		}
	}
}
5526
# Print the commit search results table for commits $from..$to of
# @$commitlist.
#   $commitlist - reference to an array of parsed commit hashes; the keys
#                 read here are 'id', 'tree', 'title', 'comment',
#                 'age_string_age' and 'age_string_date'
#   $from, $to  - inclusive index window; $from defaults to 0 and $to is
#                 clamped to the last index of the list
#   $extra      - if defined, markup for a final row spanning three columns
# Every comment line matching the global $search_regexp (case-insensitively)
# is shown below the subject with the match highlighted.  Empty commit
# hashes are skipped.
sub git_search_grep_body {
	my ($commitlist, $from, $to, $extra) = @_;
	$from = 0 unless defined $from;
	$to = $#{$commitlist} unless (defined $to && $to <= $#{$commitlist});

	print "<table class=\"commit_search\">\n";
	my $dark = 1;
	foreach my $idx ($from .. $to) {
		my %co = %{$commitlist->[$idx]};
		next unless %co;
		my $commit = $co{'id'};

		print "<tr class=\"" . ($dark ? "dark" : "light") . "\">\n";
		$dark = !$dark;

		print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
		      format_author_html('td', \%co, 15, 5) .
		      "<td>" .
		      $cgi->a({-href => href(action=>"commit", hash=>$commit),
		               -class => "list subject"},
		              chop_and_escape_str($co{'title'}, 50) . "<br/>");

		my $comment_lines = $co{'comment'};
		foreach my $line (@$comment_lines) {
			next unless $line =~ m/^(.*?)($search_regexp)(.*)$/i;
			my ($before, $hit, $after) = ($1, $2, $3);

			# shorten the match first, then split what is left of the
			# 80 columns between both sides, at most 30 each
			$hit = chop_str($hit, 70, 5, 'center');
			my $context = int((80 - length($hit))/2);
			$context = 30 if ($context > 30);
			$before = chop_str($before, $context, 10, 'left');
			$after  = chop_str($after,  $context, 10, 'right');

			$before = esc_html($before);
			$hit    = esc_html($hit);
			$after  = esc_html($after);

			print "$before<span class=\"match\">$hit</span>$after<br />";
		}

		my @links = (
			$cgi->a({-href => href(action=>"commit", hash=>$commit)}, "commit"),
			$cgi->a({-href => href(action=>"commitdiff", hash=>$commit)}, "commitdiff"),
			$cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$commit)}, "tree"),
		);
		print "</td>\n" .
		      "<td class=\"link\">" . join(" | ", @links);
		print "</td>\n" .
		      "</tr>\n";
	}
	if (defined $extra) {
		print "<tr>\n" .
		      "<td colspan=\"3\">$extra</td>\n" .
		      "</tr>\n";
	}
	print "</table>\n";
}
5586
5587 ## ======================================================================
5588 ## ======================================================================
5589 ## actions
5590
# 'project_list' action: print the page listing all projects, with the
# optional $home_text include and the project search form above the table.
# Dies with 400 if the 'order' parameter is not one of the known sort
# orders, and with 404 if there are no projects.
sub git_project_list {
	my $order = $input_params{'order'};
	# anchored, so that only the exact order names are accepted and not
	# any string that merely contains one of them
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list();
	if (!@list) {
		die_error(404, "No projects found");
	}

	git_header_html();
	if (defined $home_text && -f $home_text) {
		print "<div class=\"index_include\">\n";
		insert_file($home_text);
		print "</div>\n";
	}
	print $cgi->startform(-method => "get") .
	      "<p class=\"projsearch\">Search:\n" .
	      $cgi->textfield(-name => "s", -value => $searchtext) . "\n" .
	      "</p>" .
	      $cgi->end_form() . "\n";
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5616
# 'forks' action: print the page listing the forks of the global $project.
# Dies with 400 if the 'order' parameter is not one of the known sort
# orders, and with 404 if the project has no forks.
sub git_forks {
	my $order = $input_params{'order'};
	# anchored, so that only the exact order names are accepted and not
	# any string that merely contains one of them
	if (defined $order && $order !~ m/\A(?:none|project|descr|owner|age)\z/) {
		die_error(400, "Unknown order parameter");
	}

	my @list = git_get_projects_list($project);
	if (!@list) {
		die_error(404, "No forks found");
	}

	git_header_html();
	git_print_page_nav('','');
	git_print_header_div('summary', "$project forks");
	git_project_list_body(\@list, $order);
	git_footer_html();
}
5634
# 'project_index' action: print a plain-text index with one
# "<path> <owner>" line per project.  Both fields are percent-encoded,
# except that slashes are kept and spaces become '+'.  Dies with 404 if
# there are no projects.
sub git_project_index {
	my @projects = git_get_projects_list();
	die_error(404, "No projects found") unless @projects;

	print $cgi->header(
		-type => 'text/plain',
		-charset => 'utf-8',
		-content_disposition => 'inline; filename="index.aux"');

	foreach my $pr (@projects) {
		# look the owner up only when the project list did not supply one
		$pr->{'owner'} = git_get_project_owner("$pr->{'path'}")
			unless exists $pr->{'owner'};

		my @fields = ($pr->{'path'}, $pr->{'owner'});
		foreach my $field (@fields) {
			# quote as in CGI::Util::encode, but keep the slash, and use '+' for ' '
			$field =~ s/([^a-zA-Z0-9_.\-\/ ])/sprintf("%%%02X", ord($1))/eg;
			$field =~ s/ /\+/g;
		}

		print "$fields[0] $fields[1]\n";
	}
}
5661
# 'summary' action: print the project overview page for the global
# $project.  The page consists of a metadata table (description, owner,
# last change, repository URLs, content tags), the optional README.html,
# and short versions of the shortlog, tags, heads, remotes and forks
# lists.  Each short list shows at most 16 entries and ends with a "..."
# link to the full view when there are more.
sub git_summary {
	my $descr = git_get_project_description($project) || "none";
	my %co = parse_commit("HEAD");
	my %cd;
	%cd = parse_date($co{'committer_epoch'}, $co{'committer_tz'}) if %co;
	my $head = $co{'id'};
	my $remote_heads = gitweb_check_feature('remote_heads');

	my $owner = git_get_project_owner($project);

	my $refs = git_get_references();
	# These get_*_list functions return one more to allow us to see if
	# there are more ...
	my @taglist  = git_get_tags_list(16);
	my @headlist = git_get_heads_list(16);
	my %remotedata;
	%remotedata = git_get_remotes_list() if $remote_heads;
	my @forklist;
	my $check_forks = gitweb_check_feature('forks');

	if ($check_forks) {
		# find forks of a project
		@forklist = git_get_projects_list($project);
		# filter out forks of forks
		if (@forklist) {
			@forklist = filter_forks_from_projects_list(\@forklist);
		}
	}

	# builds the "..." link that leads to the full view of a short list
	my $more_link = sub {
		my ($action) = @_;
		return $cgi->a({-href => href(action=>$action)}, "...");
	};

	git_header_html();
	git_print_page_nav('summary','', $head);

	my $descr_html = esc_html($descr);
	my $owner_html = esc_html($owner);
	print "<div class=\"title\">&nbsp;</div>\n";
	print "<table class=\"projects_list\">\n" .
	      "<tr id=\"metadata_desc\"><td>description</td><td>" . $descr_html . "</td></tr>\n" .
	      "<tr id=\"metadata_owner\"><td>owner</td><td>" . $owner_html . "</td></tr>\n";
	if (defined $cd{'rfc2822'}) {
		my $last_change = format_timestamp_html(\%cd);
		print "<tr id=\"metadata_lchange\"><td>last change</td>" .
		      "<td>" . $last_change . "</td></tr>\n";
	}

	# use per project git URL list in $projectroot/$project/cloneurl
	# or make project git URL from git base URL and project name
	my @url_list = git_get_project_url_list($project);
	unless (@url_list) {
		@url_list = map { "$_/$project" } @git_base_url_list;
	}
	# only the first URL row is labelled; false entries are skipped
	my $url_tag = "URL";
	foreach my $git_url (grep { $_ } @url_list) {
		print format_repo_url($url_tag, $git_url);
		$url_tag = "";
	}

	# Tag cloud
	if (gitweb_check_feature('ctags')) {
		my $ctags = git_get_project_ctags($project);
		if (%$ctags) {
			# without ability to add tags, don't show if there are none
			my $cloud = git_populate_project_tagcloud($ctags);
			print "<tr id=\"metadata_ctags\">" .
			      "<td>content tags</td>" .
			      "<td>".git_show_project_tagcloud($cloud, 48)."</td>" .
			      "</tr>\n";
		}
	}

	print "</table>\n";

	# If XSS prevention is on, we don't include README.html.
	# TODO: Allow a readme in some safe format.
	unless ($prevent_xss) {
		my $readme = "$projectroot/$project/README.html";
		if (-s $readme) {
			print "<div class=\"title\">readme</div>\n" .
			      "<div class=\"readme\">\n";
			insert_file($readme);
			print "\n</div>\n"; # class="readme"
		}
	}

	# we need to request one more than 16 (0..15) to check if
	# those 16 are all
	my @commitlist;
	@commitlist = parse_commits($head, 17) if $head;
	if (@commitlist) {
		my $more = @commitlist > 16 ? $more_link->("shortlog") : undef;
		git_print_header_div('shortlog');
		git_shortlog_body(\@commitlist, 0, 15, $refs, $more);
	}

	if (@taglist) {
		my $more = @taglist > 16 ? $more_link->("tags") : undef;
		git_print_header_div('tags');
		git_tags_body(\@taglist, 0, 15, $more);
	}

	if (@headlist) {
		my $more = @headlist > 16 ? $more_link->("heads") : undef;
		git_print_header_div('heads');
		git_heads_body(\@headlist, $head, 0, 15, $more);
	}

	if (%remotedata) {
		git_print_header_div('remotes');
		git_remotes_body(\%remotedata, 15, $head);
	}

	if (@forklist) {
		my $more = @forklist > 16 ? $more_link->("forks") : undef;
		git_print_header_div('forks');
		git_project_list_body(\@forklist, 'age', 0, 15, $more, 'no_header');
	}

	git_footer_html();
}
5775
# Render the page for a tag object: a header table linking to the tagged
# object, the authorship rows (when parse_tag() recorded an 'author') and
# the tag message.  Dies with 404 when parse_tag($hash) returns nothing.
sub git_tag {
	my %tag = parse_tag($hash);
	die_error(404, "Unknown tag object") unless %tag;

	my $head = git_get_head_hash($project);
	git_header_html();
	git_print_page_nav('','', $head,undef,$head);
	git_print_header_div('commit', esc_html($tag{'name'}), $hash);

	# both links in the header row lead to the tagged object, shown with
	# the action named after the object's type
	my $object_url = href(action=>$tag{'type'}, hash=>$tag{'object'});
	my $object_link = $cgi->a({-class => "list", -href => $object_url},
	                          $tag{'object'});
	my $type_link = $cgi->a({-href => $object_url}, $tag{'type'});

	print "<div class=\"title_text\">\n" .
	      "<table class=\"object_header\">\n" .
	      "<tr>\n" .
	      "<td>object</td>\n" .
	      "<td>" . $object_link . "</td>\n" .
	      "<td class=\"link\">" . $type_link . "</td>\n" .
	      "</tr>\n";
	git_print_authorship_rows(\%tag, 'author')
		if defined($tag{'author'});
	print "</table>\n\n" .
	      "</div>\n";

	# tag message, one escaped line per <br/>
	print "<div class=\"page_body\">";
	for my $msg_line (@{ $tag{'comment'} }) {
		chomp $msg_line;
		print esc_html($msg_line, -nbsp=>1) . "<br/>\n";
	}
	print "</div>\n";

	git_footer_html();
}
5810
# Shared implementation behind git_blame, git_blame_incremental and
# git_blame_data.
#
# The optional argument selects the output format:
#   'porcelain'    (default) HTML page built from `git blame -p`
#   'incremental'  HTML page listing the plain file contents (read with
#                  `git cat-file blob`); the page states that it needs
#                  JavaScript and links to the non-incremental view
#   'data'         text/plain copy of `git blame --incremental`, followed
#                  by an "END" line; returns right after sending it
# A 'porcelain' request with a true 'js' CGI parameter is switched to
# 'incremental', and $action is updated to match.
#
# Reads the request globals $file_name, $hash_base and $hash; fills in
# $hash_base (from the project's HEAD) and $hash (from the path) when they
# are missing.  Dies with 403 when the 'blame' feature is off, with 400/404
# on a missing file name, commit or non-blob object, and with 500 when the
# git command cannot be started.
sub git_blame_common {
	my $format = shift || 'porcelain';
	if ($format eq 'porcelain' && $cgi->param('js')) {
		$format = 'incremental';
		$action = 'blame_incremental'; # for page title etc
	}

	# permissions
	gitweb_check_feature('blame')
		or die_error(403, "Blame view not allowed");

	# error checking
	die_error(400, "No file name given") unless $file_name;
	$hash_base ||= git_get_head_hash($project);
	die_error(404, "Couldn't find base commit") unless $hash_base;
	my %co = parse_commit($hash_base)
		or die_error(404, "Commit not found");
	my $ftype = "blob";
	if (!defined $hash) {
		$hash = git_get_hash_by_path($hash_base, $file_name, "blob")
			or die_error(404, "Error looking up file");
	} else {
		$ftype = git_get_type($hash);
		# compare exactly (a pattern match would accept any type merely
		# containing "blob") and treat an unknown type as "not a blob"
		if (!defined $ftype || $ftype ne 'blob') {
			die_error(400, "Object is not a blob");
		}
	}

	my $fd;
	if ($format eq 'incremental') {
		# get file contents (as base)
		open $fd, "-|", git_cmd(), 'cat-file', 'blob', $hash
			or die_error(500, "Open git-cat-file failed");
	} elsif ($format eq 'data') {
		# run git-blame --incremental
		open $fd, "-|", git_cmd(), "blame", "--incremental",
			$hash_base, "--", $file_name
			or die_error(500, "Open git-blame --incremental failed");
	} else {
		# run git-blame --porcelain
		open $fd, "-|", git_cmd(), "blame", '-p',
			$hash_base, '--', $file_name
			or die_error(500, "Open git-blame --porcelain failed");
	}

	# incremental blame data returns early
	if ($format eq 'data') {
		print $cgi->header(
			-type=>"text/plain", -charset => "utf-8",
			-status=> "200 OK");
		local $| = 1; # output autoflush
		print while <$fd>;
		close $fd
			or print "ERROR $!\n";

		# terminator line, optionally followed by elapsed time and the
		# number of git commands run
		print 'END';
		if (defined $t0 && gitweb_check_feature('timed')) {
			print ' '.
			      tv_interval($t0, [ gettimeofday() ]).
			      ' '.$number_of_git_cmds;
		}
		print "\n";

		return;
	}

	# page header
	git_header_html();
	my $formats_nav =
		$cgi->a({-href => href(action=>"blob", -replay=>1)},
		        "blob") .
		" | ";
	if ($format eq 'incremental') {
		$formats_nav .=
			$cgi->a({-href => href(action=>"blame", javascript=>0, -replay=>1)},
			        "blame") . " (non-incremental)";
	} else {
		$formats_nav .=
			$cgi->a({-href => href(action=>"blame_incremental", -replay=>1)},
			        "blame") . " (incremental)";
	}
	$formats_nav .=
		" | " .
		$cgi->a({-href => href(action=>"history", -replay=>1)},
		        "history") .
		" | " .
		$cgi->a({-href => href(action=>$action, file_name=>$file_name)},
		        "HEAD");
	git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
	git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
	git_print_page_path($file_name, $ftype, $hash_base);

	# page body
	if ($format eq 'incremental') {
		print "<noscript>\n<div class=\"error\"><center><b>\n".
		      "This page requires JavaScript to run.\n Use ".
		      $cgi->a({-href => href(action=>'blame',javascript=>0,-replay=>1)},
		              'this page').
		      " instead.\n".
		      "</b></center></div>\n</noscript>\n";

		print qq!<div id="progress_bar" style="width: 100%; background-color: yellow"></div>\n!;
	}

	print qq!<div class="page_body">\n!;
	print qq!<div id="progress_info">... / ...</div>\n!
		if ($format eq 'incremental');
	print qq!<table id="blame_table" class="blame" width="100%">\n!.
	      #qq!<col width="5.5em" /><col width="2.5em" /><col width="*" />\n!.
	      qq!<thead>\n!.
	      qq!<tr><th>Commit</th><th>Line</th><th>Data</th></tr>\n!.
	      qq!</thead>\n!.
	      qq!<tbody>\n!;

	# row classes alternate between groups of lines from the same commit
	my @rev_color = qw(light dark);
	my $num_colors = scalar(@rev_color);
	my $current_color = 0;

	if ($format eq 'incremental') {
		my $color_class = $rev_color[$current_color];

		# contents of a file: one row per line, with empty commit and
		# line-number links
		my $linenr = 0;
		while (my $line = <$fd>) {
			chomp $line;
			$linenr++;

			print qq!<tr id="l$linenr" class="$color_class">!.
			      qq!<td class="sha1"><a href=""> </a></td>!.
			      qq!<td class="linenr">!.
			      qq!<a class="linenr" href="">$linenr</a></td>!;
			print qq!<td class="pre">! . esc_html($line) . "</td>\n";
			print qq!</tr>\n!;
		}

	} else { # porcelain, i.e. ordinary blame
		my %metainfo = (); # saves information about commits

		# blame data
	LINE:
		while (my $line = <$fd>) {
			chomp $line;
			# the header: <SHA-1> <src lineno> <dst lineno> [<lines in group>]
			# no <lines in group> for subsequent lines in group of lines
			my ($full_rev, $orig_lineno, $lineno, $group_size) =
			   ($line =~ /^([0-9a-f]{40}) (\d+) (\d+)(?: (\d+))?$/);
			# a line that is not a header cannot be rendered; skip it
			# rather than using undef as commit id and line number
			next LINE unless defined $full_rev;
			if (!exists $metainfo{$full_rev}) {
				$metainfo{$full_rev} = { 'nprevious' => 0 };
			}
			my $meta = $metainfo{$full_rev};
			# read the "<key> <value>" lines describing the commit, up to
			# the TAB-prefixed line holding the file contents; only the
			# first value seen for a key is kept
			my $data;
			while ($data = <$fd>) {
				chomp $data;
				last if ($data =~ s/^\t//); # contents of line
				if ($data =~ /^(\S+)(?: (.*))?$/) {
					$meta->{$1} = $2 unless exists $meta->{$1};
				}
				if ($data =~ /^previous /) {
					$meta->{'nprevious'}++;
				}
			}
			my $short_rev = substr($full_rev, 0, 8);
			my $author = $meta->{'author'};
			my %date =
				parse_date($meta->{'author-time'}, $meta->{'author-tz'});
			my $date = $date{'iso-tz'};
			# $group_size is only present on the first line of a group,
			# so the colour changes once per group
			if ($group_size) {
				$current_color = ($current_color + 1) % $num_colors;
			}
			my $tr_class = $rev_color[$current_color];
			$tr_class .= ' boundary' if (exists $meta->{'boundary'});
			$tr_class .= ' no-previous' if ($meta->{'nprevious'} == 0);
			$tr_class .= ' multiple-previous' if ($meta->{'nprevious'} > 1);
			print "<tr id=\"l$lineno\" class=\"$tr_class\">\n";
			if ($group_size) {
				# commit cell, spanning all rows of the group
				print "<td class=\"sha1\"";
				print " title=\"". esc_html($author) . ", $date\"";
				print " rowspan=\"$group_size\"" if ($group_size > 1);
				print ">";
				print $cgi->a({-href => href(action=>"commit",
				                             hash=>$full_rev,
				                             file_name=>$file_name)},
				              esc_html($short_rev));
				if ($group_size >= 2) {
					my @author_initials = ($author =~ /\b([[:upper:]])\B/g);
					if (@author_initials) {
						print "<br />" .
						      esc_html(join('', @author_initials));
						#           or join('.', ...)
					}
				}
				print "</td>\n";
			}
			# 'previous' <sha1 of parent commit> <filename at commit>
			if (exists $meta->{'previous'} &&
			    $meta->{'previous'} =~ /^([a-fA-F0-9]{40}) (.*)$/) {
				$meta->{'parent'} = $1;
				$meta->{'file_parent'} = unquote($2);
			}
			# the line-number link goes to the blame of the parent commit
			# when one is known, otherwise to this commit
			my $linenr_commit =
				exists($meta->{'parent'}) ?
				$meta->{'parent'} : $full_rev;
			my $linenr_filename =
				exists($meta->{'file_parent'}) ?
				$meta->{'file_parent'} : unquote($meta->{'filename'});
			my $blamed = href(action => 'blame',
			                  file_name => $linenr_filename,
			                  hash_base => $linenr_commit);
			print "<td class=\"linenr\">";
			print $cgi->a({ -href => "$blamed#l$orig_lineno",
			                -class => "linenr" },
			              esc_html($lineno));
			print "</td>";
			print "<td class=\"pre\">" . esc_html($data) . "</td>\n";
			print "</tr>\n";
		} # end while

	}

	# footer
	print "</tbody>\n".
	      "</table>\n"; # class="blame"
	print "</div>\n";   # class="page_body"
	close $fd
		or print "Reading blob failed\n";

	git_footer_html();
}
6040
# Blame view in git_blame_common's default ('porcelain') format.
sub git_blame {
	return git_blame_common();
}
6044
# Blame view in git_blame_common's 'incremental' format.
sub git_blame_incremental {
	return git_blame_common('incremental');
}
6048
# Blame output in git_blame_common's 'data' (text/plain) format.
sub git_blame_data {
	return git_blame_common('data');
}
6052
# Page listing the tags returned by git_get_tags_list(); the list body is
# left out when there are none.
sub git_tags {
	my $head = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('','', $head,undef,$head,format_ref_views('tags'));
	git_print_header_div('summary', $project);

	my @tags = git_get_tags_list();
	git_tags_body(\@tags) if @tags;

	git_footer_html();
}
6065
# Page listing the heads returned by git_get_heads_list(); the list body
# is left out when there are none.  The project's HEAD hash is passed on
# to git_heads_body().
sub git_heads {
	my $head = git_get_head_hash($project);

	git_header_html();
	git_print_page_nav('','', $head,undef,$head,format_ref_views('heads'));
	git_print_header_div('summary', $project);

	my @heads = git_get_heads_list();
	git_heads_body(\@heads, $head) if @heads;

	git_footer_html();
}
6078
# Serves two views: a single remote (when the 'hash' input parameter names
# one) and the list of all remotes (when it is not given).
# Dies with 403 when the 'remote_heads' feature is off, 500 when the remote
# information cannot be read, and 404 when nothing matches.
sub git_remotes {
	unless (gitweb_check_feature('remote_heads')) {
		die_error(403, "Remote heads view is disabled");
	}

	my $head = git_get_head_hash($project);
	my $remote = $input_params{'hash'};

	my $remotedata = git_get_remotes_list($remote);
	defined $remotedata
		or die_error(500, "Unable to get remote information");

	if (!%$remotedata) {
		if (defined $remote) {
			die_error(404, "Remote $remote not found");
		} else {
			die_error(404, "No remotes found");
		}
	}

	git_header_html(undef, undef, -action_extra => $remote);
	my $ref_view = $remote ? '' : 'remotes';
	git_print_page_nav('', '',  $head, undef, $head,
		format_ref_views($ref_view));

	fill_remote_heads($remotedata);
	if (!defined $remote) {
		# list of all the remotes
		git_print_header_div('summary', "$project remotes");
		git_remotes_body($remotedata, undef, $head);
	} else {
		# single remote
		git_print_header_div('remotes', "$remote remote for $project");
		git_remote_block($remote, $remotedata->{$remote}, undef, $head);
	}

	git_footer_html();
}
6111
# Send the raw contents of a blob, with a Content-Type derived from the
# data and file name.
#
# The optional argument is a content type, handed to blob_contenttype()
# together with the opened blob and $file_name.
# Uses the request globals $hash, $hash_base and $file_name; when $hash is
# missing it is looked up from $file_name.  Dies with 400 when neither is
# given, 404 when the path cannot be resolved, 500 when git-cat-file cannot
# be started.
sub git_blob_plain {
	my $type = shift;
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Open git-cat-file blob '$hash' failed");

	# content-type (can include charset)
	$type = blob_contenttype($fd, $file_name, $type);

	# "save as" filename, even when no $file_name is given
	my $save_as = "$hash";
	if (defined $file_name) {
		$save_as = $file_name;
	} elsif ($type =~ m/^text\//) {
		$save_as .= '.txt';
	}
	# $save_as is placed inside a quoted string in the Content-Disposition
	# header; backslash-escape '"' and '\' (as git_snapshot does for its
	# file name) so that such characters cannot end the quoted value early
	$save_as =~ s/(["\\])/\\$1/g;

	# With XSS prevention on, blobs of all types except a few known safe
	# ones are served with "Content-Disposition: attachment" to make sure
	# they don't run in our security domain.  For certain image types,
	# blob view writes an <img> tag referring to blob_plain view, and we
	# want to be sure not to break that by serving the image as an
	# attachment (though Firefox 3 doesn't seem to care).
	my $sandbox = $prevent_xss &&
		$type !~ m!^(?:text/plain|image/(?:gif|png|jpeg))(?:[ ;]|$)!;

	print $cgi->header(
		-type => $type,
		-expires => $expires,
		-content_disposition =>
			($sandbox ? 'attachment' : 'inline')
			. '; filename="' . $save_as . '"');
	# slurp mode: the blob is copied through as-is, with STDOUT switched
	# to raw bytes for the duration
	local $/ = undef;
	binmode STDOUT, ':raw';
	print <$fd>;
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
6164
# Render the 'blob' view: file contents as an HTML page, either as
# numbered lines or, for image mimetypes, as an <img> pointing at the
# blob_plain view.
#
# Uses the request globals $hash, $hash_base and $file_name; when $hash is
# missing it is looked up from $file_name.  Content that is neither text/*
# nor gif/png/jpeg and that tests as binary (-B) is handed over to
# git_blob_plain() instead.  Dies with 400 when neither hash nor file name
# is given, 404 when the path cannot be resolved, 500 when git-cat-file
# cannot be started.
sub git_blob {
	my $expires;

	if (!defined $hash) {
		if (defined $file_name) {
			my $base = $hash_base || git_get_head_hash($project);
			$hash = git_get_hash_by_path($base, $file_name, "blob")
				or die_error(404, "Cannot find file");
		} else {
			die_error(400, "No file name defined");
		}
	} elsif ($hash =~ m/^[0-9a-fA-F]{40}$/) {
		# blobs defined by non-textual hash id's can be cached
		$expires = "+1d";
	}

	my $have_blame = gitweb_check_feature('blame');
	open my $fd, "-|", git_cmd(), "cat-file", "blob", $hash
		or die_error(500, "Couldn't cat $file_name, $hash");
	my $mimetype = blob_mimetype($fd, $file_name);
	# use 'blob_plain' (aka 'raw') view for files that cannot be displayed
	if ($mimetype !~ m!^(?:text/|image/(?:gif|png|jpeg)$)! && -B $fd) {
		close $fd;
		return git_blob_plain($mimetype);
	}
	# we can have blame only for text/* mimetype
	$have_blame &&= ($mimetype =~ m!^text/!);

	# when a syntax is recognised the blob is read through the
	# highlighter, and its lines are printed below without esc_html()
	my $highlight = gitweb_check_feature('highlight');
	my $syntax = guess_file_syntax($highlight, $mimetype, $file_name);
	$fd = run_highlighter($fd, $highlight, $syntax)
		if $syntax;

	git_header_html(undef, $expires);
	my $formats_nav = '';
	if (defined $hash_base && (my %co = parse_commit($hash_base))) {
		if (defined $file_name) {
			if ($have_blame) {
				$formats_nav .=
					$cgi->a({-href => href(action=>"blame", -replay=>1)},
					        "blame") .
					" | ";
			}
			$formats_nav .=
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history") .
				" | " .
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw") .
				" | " .
				$cgi->a({-href => href(action=>"blob",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		} else {
			$formats_nav .=
				$cgi->a({-href => href(action=>"blob_plain", -replay=>1)},
				        "raw");
		}
		git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
		git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
	} else {
		# no usable base commit: empty navigation, hash as title
		print "<div class=\"page_nav\">\n" .
		      "<br/><br/></div>\n" .
		      "<div class=\"title\">".esc_html($hash)."</div>\n";
	}
	git_print_page_path($file_name, "blob", $hash_base);
	print "<div class=\"page_body\">\n";
	if ($mimetype =~ m!^image/!) {
		print qq!<img type="!.esc_attr($mimetype).qq!"!;
		if ($file_name) {
			print qq! alt="!.esc_attr($file_name).qq!" title="!.esc_attr($file_name).qq!"!;
		}
		# the URL goes into an attribute value, so it is escaped the
		# same way as the line-number links below
		print qq! src="! .
		      esc_attr(href(action=>"blob_plain", hash=>$hash,
		                    hash_base=>$hash_base, file_name=>$file_name)) .
		      qq!" />\n!;
	} else {
		my $nr;
		while (my $line = <$fd>) {
			chomp $line;
			$nr++;
			$line = untabify($line);
			printf qq!<div class="pre"><a id="l%i" href="%s#l%i" class="linenr">%4i</a> %s</div>\n!,
			       $nr, esc_attr(href(-replay => 1)), $nr, $nr, $syntax ? $line : esc_html($line, -nbsp=>1);
		}
	}
	close $fd
		or print "Reading blob failed.\n";
	print "</div>";
	git_footer_html();
}
6256
# Render the 'tree' view: the entries of one tree as an HTML table.
#
# Uses the request globals $hash (the tree to list), $hash_base (defaults
# to "HEAD") and $file_name (path of the tree).  When $hash is missing it
# is looked up from $file_name, or taken to be $hash_base itself.  Dies
# with 404 when no tree can be determined or git-ls-tree fails, 500 when
# git-ls-tree cannot be started.
sub git_tree {
	$hash_base = "HEAD" unless defined $hash_base;
	if (!defined $hash) {
		$hash = defined $file_name
			? git_get_hash_by_path($hash_base, $file_name, "tree")
			: $hash_base;
	}
	die_error(404, "No such tree") unless defined($hash);

	my $show_sizes = gitweb_check_feature('show-sizes');
	my $have_blame = gitweb_check_feature('blame');

	# NUL-separated listing (ls-tree -z), one record per entry
	my @entries;
	{
		local $/ = "\0";
		open my $fd, "-|", git_cmd(), "ls-tree", '-z',
			($show_sizes ? '-l' : ()), @extra_options, $hash
			or die_error(500, "Open git-ls-tree failed");
		chomp(@entries = <$fd>);
		close $fd
			or die_error(404, "Reading tree failed");
	}

	my $refs = git_get_references();
	my $ref = format_ref_marker($refs, $hash_base);
	git_header_html();

	my %co;
	%co = parse_commit($hash_base) if defined $hash_base;
	if (%co) {
		my @views_nav;
		if (defined $file_name) {
			push @views_nav,
				$cgi->a({-href => href(action=>"history", -replay=>1)},
				        "history"),
				$cgi->a({-href => href(action=>"tree",
				                       hash_base=>"HEAD", file_name=>$file_name)},
				        "HEAD");
		}
		# FIXME: Should be available when we have no hash base as well.
		my $snapshot_links = format_snapshot_links($hash);
		push @views_nav, $snapshot_links
			if defined $snapshot_links;
		git_print_page_nav('tree','', $hash_base, undef, undef,
		                   join(' | ', @views_nav));
		git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash_base);
	} else {
		# base commit could not be parsed: forget it and show a bare
		# header with just the tree hash
		undef $hash_base;
		print "<div class=\"page_nav\">\n" .
		      "<br/><br/></div>\n" .
		      "<div class=\"title\">".esc_html($hash)."</div>\n";
	}

	my $basedir = '';
	if (defined $file_name) {
		$basedir = $file_name;
		$basedir .= '/'
			if ($basedir ne '' && substr($basedir, -1) ne '/');
		git_print_page_path($file_name, 'tree', $hash_base);
	}

	print "<div class=\"page_body\">\n" .
	      "<table class=\"tree\">\n";
	# rows alternate between "dark" and "light", starting with "dark"
	my $alternate = 1;

	# '..' (top directory) link if possible
	if (defined $hash_base &&
	    defined $file_name && $file_name =~ m![^/]+$!) {
		my $row_open = $alternate ? "<tr class=\"dark\">\n"
		                          : "<tr class=\"light\">\n";
		print $row_open;
		$alternate = $alternate ? 0 : 1;

		# parent directory: path with its last component removed,
		# undef when nothing is left
		(my $up = $file_name) =~ s!/?[^/]+$!!;
		$up = undef unless $up;

		# based on git_print_tree_entry
		print '<td class="mode">' . mode_str('040000') . "</td>\n";
		print '<td class="size">&nbsp;</td>'."\n" if $show_sizes;
		print '<td class="list">',
		      $cgi->a({-href => href(action=>"tree",
		                             hash_base=>$hash_base,
		                             file_name=>$up)},
		              ".."),
		      "</td>\n",
		      "<td class=\"link\"></td>\n",
		      "</tr>\n";
	}

	for my $entry (@entries) {
		my %t = parse_ls_tree_line($entry, -z => 1, -l => $show_sizes);

		my $row_open = $alternate ? "<tr class=\"dark\">\n"
		                          : "<tr class=\"light\">\n";
		print $row_open;
		$alternate = $alternate ? 0 : 1;

		git_print_tree_entry(\%t, $basedir, $hash_base, $have_blame);

		print "</tr>\n";
	}
	print "</table>\n" .
	      "</div>";
	git_footer_html();
}
6366
# Build the name of a snapshot of $hash in $project, in the form
# "<project basename>-<version>".
#
# Returns the name in scalar context and the pair (name, name) in list
# context; git_snapshot uses the pair as file name and archive prefix.
sub snapshot_name {
	my ($project, $hash) = @_;

	# path/to/project.git  -> project
	# path/to/project/.git -> project
	my $base = to_utf8($project);
	$base =~ s,([^/])/*\.git$,$1,;
	$base = basename($base);
	# sanitize name
	$base =~ s/[[:cntrl:]]/?/g;

	my $ver = $hash;
	if ($hash =~ /^[0-9a-fA-F]+$/) {
		# shorten SHA-1 hash
		my $full_hash = git_get_full_hash($project, $hash);
		$ver = git_get_short_hash($project, $hash)
			if ($full_hash =~ /^$hash/ && length($hash) > 7);
	} elsif (my ($tag) = $hash =~ m!^refs/tags/(.*)$!) {
		# tags don't need shortened SHA-1 hash
		$ver = $tag;
	} else {
		# branches and other need shortened SHA-1 hash
		if (my ($branch) = $hash =~ m!^refs/(?:heads|remotes)/(.*)$!) {
			$ver = $branch;
		}
		$ver = join('-', $ver, git_get_short_hash($project, $hash));
	}
	# in case of hierarchical branch names
	$ver =~ tr!/!.!;

	# name = project-version_string
	my $snapshot = "$base-$ver";

	return $snapshot unless wantarray;
	return ($snapshot, $snapshot);
}
6403
# Send an archive of $hash, produced by `git archive` and, when the chosen
# format defines a 'compressor', piped through that command.
#
# The format comes from the 'snapshot_format' input parameter and defaults
# to the first entry of @snapshot_fmts.  Dies with 403 when snapshots or
# the requested format are not allowed, 400 on a malformed or unknown
# format or when $hash is a blob, 404 when the object does not exist, and
# 500 when the archive command cannot be started.
sub git_snapshot {
	my $format = $input_params{'snapshot_format'};
	if (!@snapshot_fmts) {
		die_error(403, "Snapshots not allowed");
	}
	# default to first supported snapshot format
	$format ||= $snapshot_fmts[0];
	if ($format !~ m/^[a-z0-9]+$/) {
		die_error(400, "Invalid snapshot format parameter");
	} elsif (!exists($known_snapshot_formats{$format})) {
		die_error(400, "Unknown snapshot format");
	} elsif ($known_snapshot_formats{$format}{'disabled'}) {
		die_error(403, "Snapshot format not allowed");
	} elsif (!grep($_ eq $format, @snapshot_fmts)) {
		die_error(403, "Unsupported snapshot format");
	}

	# "^{}" peels tags, so the type is that of the object tagged
	my $type = git_get_type("$hash^{}");
	if (!$type) {
		die_error(404, 'Object does not exist');
	}  elsif ($type eq 'blob') {
		die_error(400, 'Object is not a tree-ish');
	}

	my ($name, $prefix) = snapshot_name($project, $hash);
	my $filename = "$name$known_snapshot_formats{$format}{'suffix'}";
	my $cmd = quote_command(
		git_cmd(), 'archive',
		"--format=$known_snapshot_formats{$format}{'format'}",
		"--prefix=$prefix/", $hash);
	if (exists $known_snapshot_formats{$format}{'compressor'}) {
		$cmd .= ' | ' . quote_command(@{$known_snapshot_formats{$format}{'compressor'}});
	}

	# the file name goes into a quoted string in the header below
	$filename =~ s/(["\\])/\\$1/g;

	# start the command before sending any header, so that a failure
	# here can still be reported as a proper 500 response
	open my $fd, "-|", $cmd
		or die_error(500, "Execute git-archive failed");

	print $cgi->header(
		-type => $known_snapshot_formats{$format}{'type'},
		-content_disposition => 'inline; filename="' . $filename . '"',
		-status => '200 OK');

	binmode STDOUT, ':raw';
	{
		# copy the archive in fixed-size records instead of reading
		# all of it into memory first
		local $/ = \65536;
		while (my $chunk = <$fd>) {
			print $chunk;
		}
	}
	binmode STDOUT, ':utf8'; # as set at the beginning of gitweb.cgi
	close $fd;
}
6451
# Shared implementation of the paginated commit-list views.
#
# Parameters:
#   $fmt_name  - name of the view; passed to format_paging_nav() and
#                git_print_page_nav()
#   $body_subr - code reference that prints the list; called with
#                (\@commitlist, 0, 99, $refs, $next_link,
#                 $file_name, $file_hash, $ftype)
#   $base      - revision to start from; defaults to the project head
#   $parent    - optional; when defined the list covers "$parent..$base"
#   $file_name - optional path; when defined the list is limited to that path
#   $file_hash - optional object id of $file_name; looked up from the listed
#                commits when not given
#
# Uses the global $page (defaulting to 0) to select the page; parse_commits()
# is asked for 101 entries so that a 101st entry signals a following page.
sub git_log_generic {
        my ($fmt_name, $body_subr, $base, $parent, $file_name, $file_hash) = @_;

        my $head = git_get_head_hash($project);
        if (!defined $base) {
                $base = $head;
        }
        if (!defined $page) {
                $page = 0;
        }
        my $refs = git_get_references();

        my $commit_hash = $base;
        if (defined $parent) {
                $commit_hash = "$parent..$base";
        }
        my @commitlist =
                parse_commits($commit_hash, 101, (100 * $page),
                              defined $file_name ? ($file_name, "--full-history") : ());

        my $ftype;
        if (!defined $file_hash && defined $file_name) {
                # some commits could have deleted file in question,
                # and not have it in tree, but one of them has to have it
                for (my $i = 0; $i < @commitlist; $i++) {
                        $file_hash = git_get_hash_by_path($commitlist[$i]{'id'}, $file_name);
                        last if defined $file_hash;
                }
        }
        if (defined $file_hash) {
                $ftype = git_get_type($file_hash);
        }
        if (defined $file_name && !defined $ftype) {
                die_error(500, "Unknown type of object");
        }
        my %co;
        if (defined $file_name) {
                %co = parse_commit($base)
                        or die_error(404, "Unknown commit object");
        }


        my $paging_nav = format_paging_nav($fmt_name, $page, $#commitlist >= 100);
        my $next_link = '';
        if ($#commitlist >= 100) {
                $next_link =
                        $cgi->a({-href => href(-replay=>1, page=>$page+1),
                                 -accesskey => "n", -title => "Alt-n"}, "next");
        }
        # list assignment, as in git_commitdiff: the feature getter is called
        # in list context and its first value is the patch limit
        my ($patch_max) = gitweb_get_feature('patches');
        if ($patch_max && !defined $file_name) {
                # a negative limit means "no limit"
                if ($patch_max < 0 || @commitlist <= $patch_max) {
                        $paging_nav .= " &sdot; " .
                                $cgi->a({-href => href(action=>"patches", -replay=>1)},
                                        "patches");
                }
        }

        git_header_html();
        git_print_page_nav($fmt_name,'', $hash,$hash,$hash, $paging_nav);
        if (defined $file_name) {
                git_print_header_div('commit', esc_html($co{'title'}), $base);
        } else {
                git_print_header_div('summary', $project);
        }
        git_print_page_path($file_name, $ftype, $hash_base)
                if (defined $file_name);

        $body_subr->(\@commitlist, 0, 99, $refs, $next_link,
                     $file_name, $file_hash, $ftype);

        git_footer_html();
}
6525
# "log" view: the generic commit list rendered with git_log_body,
# starting at $hash and optionally bounded by $hash_parent.
sub git_log {
        my @view = ('log', \&git_log_body);
        return git_log_generic(@view, $hash, $hash_parent);
}
6530
# "commit" view: prints the commit header (authorship, commit id, tree and
# parent links), the log message and the list of changed files for $hash
# (falling back to $hash_base, then "HEAD").
sub git_commit {
        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        my $first_parent = $co{'parent'};
        my $parents      = $co{'parents'}; # listref

        # link to the "commit" view of a given id, labelled with its short form
        my $commit_link = sub {
                my ($id) = @_;
                return $cgi->a({-href => href(action=>"commit",
                                              hash=>$id)},
                               esc_html(substr($id, 0, 7)));
        };

        # we need to prepare $formats_nav before any parameter munging
        my $formats_nav;
        if (!defined $first_parent) {
                # --root commitdiff
                $formats_nav = '(initial)';
        } elsif (@$parents == 1) {
                # single parent commit
                $formats_nav = '(parent: ' . $commit_link->($first_parent) . ')';
        } else {
                # merge commit
                $formats_nav =
                        '(merge: ' .
                        join(' ', map { $commit_link->($_) } @$parents) .
                        ')';
        }
        if (gitweb_check_feature('patches') && @$parents <= 1) {
                $formats_nav .= " | " .
                        $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                "patch");
        }

        # what to diff against: '-c' for merges, the only parent otherwise,
        # or '--root' for a parentless commit
        my $diff_base =
                @$parents > 1          ? '-c'
              : defined $first_parent  ? $first_parent
              :                          '--root';
        open my $fd, "-|", git_cmd(), "diff-tree", '-r', "--no-commit-id",
                @diff_opts,
                $diff_base,
                $hash, "--"
                or die_error(500, "Open git-diff-tree failed");
        my @difftree = <$fd>;
        chomp @difftree;
        close $fd or die_error(404, "Reading git-diff-tree failed");

        # non-textual hash id's can be cached
        my $expires = ($hash =~ m/^[0-9a-fA-F]{40}$/) ? "+1d" : undef;
        my $refs = git_get_references();
        my $ref = format_ref_marker($refs, $co{'id'});

        git_header_html(undef, $expires);
        git_print_page_nav('commit', '',
                           $hash, $co{'tree'}, $hash,
                           $formats_nav);

        my $title = esc_html($co{'title'}) . $ref;
        if (defined $first_parent) {
                git_print_header_div('commitdiff', $title, $hash);
        } else {
                git_print_header_div('tree', $title, $co{'tree'}, $hash);
        }

        print qq(<div class="title_text">\n) .
              qq(<table class="object_header">\n);
        git_print_authorship_rows(\%co);
        print qq(<tr><td>commit</td><td class="sha1">$co{'id'}</td></tr>\n);

        # tree row: id link, "tree" link and optional snapshot links
        my $tree_id = $co{'tree'};
        my $tree_id_link =
                $cgi->a({-href => href(action=>"tree", hash=>$tree_id, hash_base=>$hash),
                         class => "list"}, $tree_id);
        my $tree_view_link =
                $cgi->a({-href => href(action=>"tree", hash=>$tree_id, hash_base=>$hash)},
                        "tree");
        print qq(<tr><td>tree</td><td class="sha1">$tree_id_link</td>) .
              qq(<td class="link">$tree_view_link);
        my $snapshot_links = format_snapshot_links($hash);
        print " | " . $snapshot_links
                if defined $snapshot_links;
        print "</td></tr>\n";

        # one row per parent: id link, "commit" link and "diff" link
        for my $parent_id (@$parents) {
                my $parent_id_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$parent_id),
                                 class => "list"}, $parent_id);
                my $parent_commit_link =
                        $cgi->a({-href => href(action=>"commit", hash=>$parent_id)}, "commit");
                my $parent_diff_link =
                        $cgi->a({-href => href(action=>"commitdiff", hash=>$hash, hash_parent=>$parent_id)}, "diff");
                print qq(<tr><td>parent</td><td class="sha1">$parent_id_link</td>) .
                      qq(<td class="link">$parent_commit_link | $parent_diff_link</td>) .
                      "</tr>\n";
        }
        print "</table></div>\n";

        print qq(<div class="page_body">\n);
        git_print_log($co{'comment'});
        print "</div>\n";

        git_difftree_body(\@difftree, $hash, @$parents);

        git_footer_html();
}
6644
# "object" action: work out the type of the requested object and redirect
# the client (302) to the view named after that type.
#
# The object is identified either by $hash / $hash_base alone, or by the
# pair $hash_base + $file_name (in which case $hash is set to the id found
# by "git ls-tree").
sub git_object {
        # object is defined by:
        # - hash or hash_base alone
        # - hash_base and file_name
        my $type;

        # - hash or hash_base alone
        if ($hash || ($hash_base && !defined $file_name)) {
                my $object_id = $hash || $hash_base;

                open my $fd, "-|", quote_command(
                        git_cmd(), 'cat-file', '-t', $object_id) . ' 2> /dev/null'
                        or die_error(404, "Object does not exist");
                $type = <$fd>;
                # nothing is read when the command prints no output (its
                # stderr is discarded above); avoid chomp on undef
                chomp $type if defined $type;
                close $fd
                        or die_error(404, "Object does not exist");
                defined $type
                        or die_error(404, "Object does not exist");

        # - hash_base and file_name
        } elsif ($hash_base && defined $file_name) {
                # drop trailing slashes from the path
                $file_name =~ s,/+$,,;

                system(git_cmd(), "cat-file", '-e', $hash_base) == 0
                        or die_error(404, "Base object does not exist");

                # here errors should not happen
                open my $fd, "-|", git_cmd(), "ls-tree", $hash_base, "--", $file_name
                        or die_error(500, "Open git-ls-tree failed");
                my $line = <$fd>;
                close $fd;

                #'100644 blob 0fa3f3a66fb6a137f6ec2c19351ed4d807070ffa  panic.c'
                unless ($line && $line =~ m/^([0-9]+) (.+) ([0-9a-fA-F]{40})\t/) {
                        die_error(404, "File or directory for given base does not exist");
                }
                $type = $2;
                $hash = $3;
        } else {
                die_error(400, "Not enough information to find object");
        }

        print $cgi->redirect(-uri => href(action=>$type, -full=>1,
                                          hash=>$hash, hash_base=>$hash_base,
                                          file_name=>$file_name),
                             -status => '302 Found');
}
6691
# "blobdiff" view: show the difference between two versions of one file.
#
# Parameter:
#   $format - 'html' (default) for the regular page, or 'plain' for a
#             text/plain patch; anything else is rejected with a 400 error
#
# The file is identified through the globals $hash_base and
# $hash_parent_base together with either $file_name (and optionally
# $file_parent) or, failing that, the blob id in $hash.  Requests lacking
# both base parameters are rejected.
sub git_blobdiff {
        my $format = shift || 'html';

        my $fd;
        my @difftree;
        my %diffinfo;
        my $expires;

        # preparing $fd and %diffinfo for git_patchset_body
        # new style URI
        if (defined $hash_base && defined $hash_parent_base) {
                if (defined $file_name) {
                        # read raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base,
                                "--", (defined $file_parent ? $file_parent : ()), $file_name
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree = map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } elsif (defined $hash &&
                         $hash =~ /[0-9a-fA-F]{40}/) {
                        # try to find filename from $hash

                        # read filtered raw output
                        open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                                $hash_parent_base, $hash_base, "--"
                                or die_error(500, "Open git-diff-tree failed");
                        @difftree =
                                # ':100644 100644 03b21826... 3b93d5e7... M     ls-files.c'
                                # $hash == to_id
                                # (\Q...\E: match $hash literally, never as a pattern)
                                grep { /^:[0-7]{6} [0-7]{6} [0-9a-fA-F]{40} \Q$hash\E/ }
                                map { chomp; $_ } <$fd>;
                        close $fd
                                or die_error(404, "Reading git-diff-tree failed");
                        @difftree
                                or die_error(404, "Blob diff not found");

                } else {
                        die_error(400, "Missing one of the blob diff parameters");
                }

                if (@difftree > 1) {
                        die_error(400, "Ambiguous blob diff specification");
                }

                # fill in whatever the request did not specify from the raw diff line
                %diffinfo = parse_difftree_raw_line($difftree[0]);
                $file_parent ||= $diffinfo{'from_file'} || $file_name;
                $file_name   ||= $diffinfo{'to_file'};

                $hash_parent ||= $diffinfo{'from_id'};
                $hash        ||= $diffinfo{'to_id'};

                # non-textual hash id's can be cached
                if ($hash_base =~ m/^[0-9a-fA-F]{40}$/ &&
                    $hash_parent_base =~ m/^[0-9a-fA-F]{40}$/) {
                        $expires = '+1d';
                }

                # open patch output
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', ($format eq 'html' ? "--full-index" : ()),
                        $hash_parent_base, $hash_base,
                        "--", (defined $file_parent ? $file_parent : ()), $file_name
                        or die_error(500, "Open git-diff-tree failed");
        }

        # old/legacy style URI -- not generated anymore since 1.4.3.
        if (!%diffinfo) {
                # numeric status code, like every other die_error() call
                die_error(404, "Missing one of the blob diff parameters");
        }

        # header
        if ($format eq 'html') {
                my $formats_nav =
                        $cgi->a({-href => href(action=>"blobdiff_plain", -replay=>1)},
                                "raw");
                git_header_html(undef, $expires);
                if (defined $hash_base && (my %co = parse_commit($hash_base))) {
                        git_print_page_nav('','', $hash_base,$co{'tree'},$hash_base, $formats_nav);
                        git_print_header_div('commit', esc_html($co{'title'}), $hash_base);
                } else {
                        print "<div class=\"page_nav\"><br/>$formats_nav<br/></div>\n";
                        print "<div class=\"title\">".esc_html("$hash vs $hash_parent")."</div>\n";
                }
                if (defined $file_name) {
                        git_print_page_path($file_name, "blob", $hash_base);
                } else {
                        print "<div class=\"page_path\"></div>\n";
                }

        } elsif ($format eq 'plain') {
                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . "$file_name" . '.patch"');

                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

        } else {
                die_error(400, "Unknown blobdiff format");
        }

        # patch
        if ($format eq 'html') {
                print "<div class=\"page_body\">\n";

                git_patchset_body($fd, [ \%diffinfo ], $hash_base, $hash_parent_base);
                close $fd;

                print "</div>\n"; # class="page_body"
                git_footer_html();

        } else {
                # rewrite object ids in the patch header into file names,
                # stopping after the "+++" line
                while (my $line = <$fd>) {
                        $line =~ s!a/(\Q$hash\E|\Q$hash_parent\E)!'a/'.esc_path($diffinfo{'from_file'})!eg;
                        $line =~ s!b/(\Q$hash\E|\Q$hash_parent\E)!'b/'.esc_path($diffinfo{'to_file'})!eg;

                        print $line;

                        last if $line =~ m!^\+\+\+!;
                }
                # the rest of the patch is passed through unchanged
                local $/ = undef;
                print <$fd>;
                close $fd;
        }
}
6823
# "blobdiff_plain" action: the blobdiff view in its text/plain form.
sub git_blobdiff_plain {
        my $format = 'plain';
        return git_blobdiff($format);
}
6827
# "commitdiff" family of views: show the changes introduced by $hash
# (falling back to $hash_base, then "HEAD"), optionally relative to
# $hash_parent.
#
# Named parameters:
#   -format => 'html' (default) for the regular page,
#              'plain' for a text/plain diff preceded by mail-like headers,
#              'patch' for "git format-patch" output (requires the
#              'patches' feature, otherwise a 403 error is raised)
#   -single => true to limit 'patch' output to a single patch when no
#              $hash_parent is given
sub git_commitdiff {
        my %params = @_;
        my $format = $params{-format} || 'html';

        my ($patch_max) = gitweb_get_feature('patches');
        if ($format eq 'patch') {
                die_error(403, "Patch view not allowed") unless $patch_max;
        }

        $hash ||= $hash_base || "HEAD";
        my %co = parse_commit($hash)
            or die_error(404, "Unknown commit object");

        # choose format for commitdiff for merge
        if (! defined $hash_parent && @{$co{'parents'}} > 1) {
                $hash_parent = '--cc';
        }
        # we need to prepare $formats_nav before almost any parameter munging
        my $formats_nav;
        if ($format eq 'html') {
                $formats_nav =
                        $cgi->a({-href => href(action=>"commitdiff_plain", -replay=>1)},
                                "raw");
                if ($patch_max && @{$co{'parents'}} <= 1) {
                        $formats_nav .= " | " .
                                $cgi->a({-href => href(action=>"patch", -replay=>1)},
                                        "patch");
                }

                if (defined $hash_parent &&
                    $hash_parent ne '-c' && $hash_parent ne '--cc') {
                        # commitdiff with two commits given
                        my $hash_parent_short = $hash_parent;
                        if ($hash_parent =~ m/^[0-9a-fA-F]{40}$/) {
                                $hash_parent_short = substr($hash_parent, 0, 7);
                        }
                        $formats_nav .=
                                ' (from';
                        for (my $i = 0; $i < @{$co{'parents'}}; $i++) {
                                if ($co{'parents'}[$i] eq $hash_parent) {
                                        $formats_nav .= ' parent ' . ($i+1);
                                        last;
                                }
                        }
                        $formats_nav .= ': ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$hash_parent)},
                                        esc_html($hash_parent_short)) .
                                ')';
                } elsif (!$co{'parent'}) {
                        # --root commitdiff
                        $formats_nav .= ' (initial)';
                } elsif (scalar @{$co{'parents'}} == 1) {
                        # single parent commit
                        $formats_nav .=
                                ' (parent: ' .
                                $cgi->a({-href => href(action=>"commitdiff",
                                                       hash=>$co{'parent'})},
                                        esc_html(substr($co{'parent'}, 0, 7))) .
                                ')';
                } else {
                        # merge commit
                        if ($hash_parent eq '--cc') {
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'-c')},
                                                'combined');
                        } else { # $hash_parent eq '-c'
                                $formats_nav .= ' | ' .
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$hash, hash_parent=>'--cc')},
                                                'compact');
                        }
                        $formats_nav .=
                                ' (merge: ' .
                                join(' ', map {
                                        $cgi->a({-href => href(action=>"commitdiff",
                                                               hash=>$_)},
                                                esc_html(substr($_, 0, 7)));
                                } @{$co{'parents'}} ) .
                                ')';
                }
        }

        my $hash_parent_param = $hash_parent;
        if (!defined $hash_parent_param) {
                # --cc for multiple parents, --root for parentless
                $hash_parent_param =
                        @{$co{'parents'}} > 1 ? '--cc' : $co{'parent'} || '--root';
        }

        # read commitdiff
        my $fd;
        my @difftree;
        if ($format eq 'html') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        "--no-commit-id", "--patch-with-raw", "--full-index",
                        $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");

                while (my $line = <$fd>) {
                        chomp $line;
                        # empty line ends raw part of diff-tree output
                        last unless $line;
                        push @difftree, scalar parse_difftree_raw_line($line);
                }

        } elsif ($format eq 'plain') {
                open $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        '-p', $hash_parent_param, $hash, "--"
                        or die_error(500, "Open git-diff-tree failed");
        } elsif ($format eq 'patch') {
                # For commit ranges, we limit the output to the number of
                # patches specified in the 'patches' feature.
                # For single commits, we limit the output to a single patch,
                # diverging from the git-format-patch default.
                my @commit_spec = ();
                # '-c' and '--cc' select a combined diff for merges; they are
                # options, not revisions, so they cannot start a commit range
                my $range_from = $hash_parent;
                if (defined $range_from &&
                    ($range_from eq '-c' || $range_from eq '--cc')) {
                        undef $range_from;
                }
                if ($range_from) {
                        if ($patch_max > 0) {
                                push @commit_spec, "-$patch_max";
                        }
                        push @commit_spec, '-n', "$range_from..$hash";
                } else {
                        if ($params{-single}) {
                                push @commit_spec, '-1';
                        } else {
                                if ($patch_max > 0) {
                                        push @commit_spec, "-$patch_max";
                                }
                                push @commit_spec, "-n";
                        }
                        push @commit_spec, '--root', $hash;
                }
                open $fd, "-|", git_cmd(), "format-patch", @diff_opts,
                        '--encoding=utf8', '--stdout', @commit_spec
                        or die_error(500, "Open git-format-patch failed");
        } else {
                die_error(400, "Unknown commitdiff format");
        }

        # non-textual hash id's can be cached
        my $expires;
        if ($hash =~ m/^[0-9a-fA-F]{40}$/) {
                $expires = "+1d";
        }

        # write commit message
        if ($format eq 'html') {
                my $refs = git_get_references();
                my $ref = format_ref_marker($refs, $co{'id'});

                git_header_html(undef, $expires);
                git_print_page_nav('commitdiff','', $hash,$co{'tree'},$hash, $formats_nav);
                git_print_header_div('commit', esc_html($co{'title'}) . $ref, $hash);
                print "<div class=\"title_text\">\n" .
                      "<table class=\"object_header\">\n";
                git_print_authorship_rows(\%co);
                print "</table>".
                      "</div>\n";
                print "<div class=\"page_body\">\n";
                if (@{$co{'comment'}} > 1) {
                        print "<div class=\"log\">\n";
                        git_print_log($co{'comment'}, -final_empty_line=> 1, -remove_title => 1);
                        print "</div>\n"; # class="log"
                }

        } elsif ($format eq 'plain') {
                my $tagname = git_get_rev_name_tags($hash);
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $filename . '"');
                my %ad = parse_date($co{'author_epoch'}, $co{'author_tz'});
                print "From: " . to_utf8($co{'author'}) . "\n";
                print "Date: $ad{'rfc2822'} ($ad{'tz_local'})\n";
                print "Subject: " . to_utf8($co{'title'}) . "\n";

                print "X-Git-Tag: $tagname\n" if $tagname;
                print "X-Git-Url: " . $cgi->self_url() . "\n\n";

                foreach my $line (@{$co{'comment'}}) {
                        print to_utf8($line) . "\n";
                }
                print "---\n\n";
        } elsif ($format eq 'patch') {
                my $filename = basename($project) . "-$hash.patch";

                print $cgi->header(
                        -type => 'text/plain',
                        -charset => 'utf-8',
                        -expires => $expires,
                        -content_disposition => 'inline; filename="' . $filename . '"');
        }

        # write patch
        if ($format eq 'html') {
                # compare against the commit's own parents unless an explicit
                # parent revision was requested
                my $use_parents = !defined $hash_parent ||
                        $hash_parent eq '-c' || $hash_parent eq '--cc';
                git_difftree_body(\@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                print "<br/>\n";

                git_patchset_body($fd, \@difftree, $hash,
                                  $use_parents ? @{$co{'parents'}} : $hash_parent);
                close $fd;
                print "</div>\n"; # class="page_body"
                git_footer_html();

        } elsif ($format eq 'plain') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-diff-tree failed\n";
        } elsif ($format eq 'patch') {
                local $/ = undef;
                print <$fd>;
                close $fd
                        or print "Reading git-format-patch failed\n";
        }
}
7052
# "commitdiff_plain" action: the commitdiff view in its text/plain form.
sub git_commitdiff_plain {
        my @opts = (-format => 'plain');
        return git_commitdiff(@opts);
}
7056
7057 # format-patch-style patches
# "patch" action: commitdiff in 'patch' format with the -single flag set.
sub git_patch {
        my @opts = (-format => 'patch', -single => 1);
        return git_commitdiff(@opts);
}
7061
# "patches" action: commitdiff in 'patch' format without the -single flag.
sub git_patches {
        my @opts = (-format => 'patch');
        return git_commitdiff(@opts);
}
7065
# "history" view: the generic commit list rendered with git_history_body,
# based on $hash_base / $hash_parent_base and limited to $file_name
# (whose object id, if known, is passed as $hash).
sub git_history {
        my @view = ('history', \&git_history_body);
        return git_log_generic(@view,
                               $hash_base, $hash_parent_base,
                               $file_name, $hash);
}
7071
7072 sub git_search {
7073         gitweb_check_feature('search') or die_error(403, "Search is disabled");
7074         if (!defined $searchtext) {
7075                 die_error(400, "Text field is empty");
7076         }
7077         if (!defined $hash) {
7078                 $hash = git_get_head_hash($project);
7079         }
7080         my %co = parse_commit($hash);
7081         if (!%co) {
7082                 die_error(404, "Unknown commit object");
7083         }
7084         if (!defined $page) {
7085                 $page = 0;
7086         }
7087
7088         $searchtype ||= 'commit';
7089         if ($searchtype eq 'pickaxe') {
7090                 # pickaxe may take all resources of your box and run for several minutes
7091                 # with every query - so decide by yourself how public you make this feature
7092                 gitweb_check_feature('pickaxe')
7093                     or die_error(403, "Pickaxe is disabled");
7094         }
7095         if ($searchtype eq 'grep') {
7096                 gitweb_check_feature('grep')
7097                     or die_error(403, "Grep is disabled");
7098         }
7099
7100         git_header_html();
7101
7102         if ($searchtype eq 'commit' or $searchtype eq 'author' or $searchtype eq 'committer') {
7103                 my $greptype;
7104                 if ($searchtype eq 'commit') {
7105                         $greptype = "--grep=";
7106                 } elsif ($searchtype eq 'author') {
7107                         $greptype = "--author=";
7108                 } elsif ($searchtype eq 'committer') {
7109                         $greptype = "--committer=";
7110                 }
7111                 $greptype .= $searchtext;
7112                 my @commitlist = parse_commits($hash, 101, (100 * $page), undef,
7113                                                $greptype, '--regexp-ignore-case',
7114                                                $search_use_regexp ? '--extended-regexp' : '--fixed-strings');
7115
7116                 my $paging_nav = '';
7117                 if ($page > 0) {
7118                         $paging_nav .=
7119                                 $cgi->a({-href => href(action=>"search", hash=>$hash,
7120                                                        searchtext=>$searchtext,
7121                                                        searchtype=>$searchtype)},
7122                                         "first");
7123                         $paging_nav .= " &sdot; " .
7124                                 $cgi->a({-href => href(-replay=>1, page=>$page-1),
7125                                          -accesskey => "p", -title => "Alt-p"}, "prev");
7126                 } else {
7127                         $paging_nav .= "first";
7128                         $paging_nav .= " &sdot; prev";
7129                 }
7130                 my $next_link = '';
7131                 if ($#commitlist >= 100) {
7132                         $next_link =
7133                                 $cgi->a({-href => href(-replay=>1, page=>$page+1),
7134                                          -accesskey => "n", -title => "Alt-n"}, "next");
7135                         $paging_nav .= " &sdot; $next_link";
7136                 } else {
7137                         $paging_nav .= " &sdot; next";
7138                 }
7139
7140                 git_print_page_nav('','', $hash,$co{'tree'},$hash, $paging_nav);
7141                 git_print_header_div('commit', esc_html($co{'title'}), $hash);
7142                 if ($page == 0 && !@commitlist) {
7143                         print "<p>No match.</p>\n";
7144                 } else {
7145                         git_search_grep_body(\@commitlist, 0, 99, $next_link);
7146                 }
7147         }
7148
7149         if ($searchtype eq 'pickaxe') {
7150                 git_print_page_nav('','', $hash,$co{'tree'},$hash);
7151                 git_print_header_div('commit', esc_html($co{'title'}), $hash);
7152
7153                 print "<table class=\"pickaxe search\">\n";
7154                 my $alternate = 1;
7155                 local $/ = "\n";
7156                 open my $fd, '-|', git_cmd(), '--no-pager', 'log', @diff_opts,
7157                         '--pretty=format:%H', '--no-abbrev', '--raw', "-S$searchtext",
7158                         ($search_use_regexp ? '--pickaxe-regex' : ());
7159                 undef %co;
7160                 my @files;
7161                 while (my $line = <$fd>) {
7162                         chomp $line;
7163                         next unless $line;
7164
7165                         my %set = parse_difftree_raw_line($line);
7166                         if (defined $set{'commit'}) {
7167                                 # finish previous commit
7168                                 if (%co) {
7169                                         print "</td>\n" .
7170                                               "<td class=\"link\">" .
7171                                               $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
7172                                               " | " .
7173                                               $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
7174                                         print "</td>\n" .
7175                                               "</tr>\n";
7176                                 }
7177
7178                                 if ($alternate) {
7179                                         print "<tr class=\"dark\">\n";
7180                                 } else {
7181                                         print "<tr class=\"light\">\n";
7182                                 }
7183                                 $alternate ^= 1;
7184                                 %co = parse_commit($set{'commit'});
7185                                 my $author = chop_and_escape_str($co{'author_name'}, 15, 5);
7186                                 print "<td title=\"$co{'age_string_age'}\"><i>$co{'age_string_date'}</i></td>\n" .
7187                                       "<td><i>$author</i></td>\n" .
7188                                       "<td>" .
7189                                       $cgi->a({-href => href(action=>"commit", hash=>$co{'id'}),
7190                                               -class => "list subject"},
7191                                               chop_and_escape_str($co{'title'}, 50) . "<br/>");
7192                         } elsif (defined $set{'to_id'}) {
7193                                 next if ($set{'to_id'} =~ m/^0{40}$/);
7194
7195                                 print $cgi->a({-href => href(action=>"blob", hash_base=>$co{'id'},
7196                                                              hash=>$set{'to_id'}, file_name=>$set{'to_file'}),
7197                                               -class => "list"},
7198                                               "<span class=\"match\">" . esc_path($set{'file'}) . "</span>") .
7199                                       "<br/>\n";
7200                         }
7201                 }
7202                 close $fd;
7203
7204                 # finish last commit (warning: repetition!)
7205                 if (%co) {
7206                         print "</td>\n" .
7207                               "<td class=\"link\">" .
7208                               $cgi->a({-href => href(action=>"commit", hash=>$co{'id'})}, "commit") .
7209                               " | " .
7210                               $cgi->a({-href => href(action=>"tree", hash=>$co{'tree'}, hash_base=>$co{'id'})}, "tree");
7211                         print "</td>\n" .
7212                               "</tr>\n";
7213                 }
7214
7215                 print "</table>\n";
7216         }
7217
7218         if ($searchtype eq 'grep') {
7219                 git_print_page_nav('','', $hash,$co{'tree'},$hash);
7220                 git_print_header_div('commit', esc_html($co{'title'}), $hash);
7221
7222                 print "<table class=\"grep_search\">\n";
7223                 my $alternate = 1;
7224                 my $matches = 0;
7225                 local $/ = "\n";
7226                 open my $fd, "-|", git_cmd(), 'grep', '-n',
7227                         $search_use_regexp ? ('-E', '-i') : '-F',
7228                         $searchtext, $co{'tree'};
7229                 my $lastfile = '';
7230                 while (my $line = <$fd>) {
7231                         chomp $line;
7232                         my ($file, $lno, $ltext, $binary);
7233                         last if ($matches++ > 1000);
7234                         if ($line =~ /^Binary file (.+) matches$/) {
7235                                 $file = $1;
7236                                 $binary = 1;
7237                         } else {
7238                                 (undef, $file, $lno, $ltext) = split(/:/, $line, 4);
7239                         }
7240                         if ($file ne $lastfile) {
7241                                 $lastfile and print "</td></tr>\n";
7242                                 if ($alternate++) {
7243                                         print "<tr class=\"dark\">\n";
7244                                 } else {
7245                                         print "<tr class=\"light\">\n";
7246                                 }
7247                                 print "<td class=\"list\">".
7248                                         $cgi->a({-href => href(action=>"blob", hash=>$co{'hash'},
7249                                                                file_name=>"$file"),
7250                                                 -class => "list"}, esc_path($file));
7251                                 print "</td><td>\n";
7252                                 $lastfile = $file;
7253                         }
7254                         if ($binary) {
7255                                 print "<div class=\"binary\">Binary file</div>\n";
7256                         } else {
7257                                 $ltext = untabify($ltext);
7258                                 if ($ltext =~ m/^(.*)($search_regexp)(.*)$/i) {
7259                                         $ltext = esc_html($1, -nbsp=>1);
7260                                         $ltext .= '<span class="match">';
7261                                         $ltext .= esc_html($2, -nbsp=>1);
7262                                         $ltext .= '</span>';
7263                                         $ltext .= esc_html($3, -nbsp=>1);
7264                                 } else {
7265                                         $ltext = esc_html($ltext, -nbsp=>1);
7266                                 }
7267                                 print "<div class=\"pre\">" .
7268                                         $cgi->a({-href => href(action=>"blob", hash=>$co{'hash'},
7269                                                                file_name=>"$file").'#l'.$lno,
7270                                                 -class => "linenr"}, sprintf('%4i', $lno))
7271                                         . ' ' .  $ltext . "</div>\n";
7272                         }
7273                 }
7274                 if ($lastfile) {
7275                         print "</td></tr>\n";
7276                         if ($matches > 1000) {
7277                                 print "<div class=\"diff nodifferences\">Too many matches, listing trimmed</div>\n";
7278                         }
7279                 } else {
7280                         print "<div class=\"diff nodifferences\">No matches found</div>\n";
7281                 }
7282                 close $fd;
7283
7284                 print "</table>\n";
7285         }
7286         git_footer_html();
7287 }
7288
# 'search_help' action: print a static HTML page describing the available
# search types.  The 'commit', 'author' and 'committer' entries are always
# shown; the 'grep' and 'pickaxe' entries appear only when the corresponding
# gitweb feature is enabled.
sub git_search_help {
        git_header_html();
        git_print_page_nav('', '', $hash, $hash, $hash);

        # General introduction and the always-available 'commit' search.
        print <<'HELP_INTRO';
<p><strong>Pattern</strong> is by default a normal string that is matched precisely (but without
regard to case, except in the case of pickaxe). However, when you check the <em>re</em> checkbox,
the pattern entered is recognized as the POSIX extended
<a href="http://en.wikipedia.org/wiki/Regular_expression">regular expression</a> (also case
insensitive).</p>
<dl>
<dt><b>commit</b></dt>
<dd>The commit messages and authorship information will be scanned for the given pattern.</dd>
HELP_INTRO

        # Optional: searching file contents with git-grep.
        if (gitweb_check_feature('grep')) {
                print <<'HELP_GREP';
<dt><b>grep</b></dt>
<dd>All files in the currently selected tree (HEAD unless you are explicitly browsing
    a different one) are searched for the given pattern. On large trees, this search can take
a while and put some strain on the server, so please use it with some consideration. Note that
due to git-grep peculiarity, currently if regexp mode is turned off, the matches are
case-sensitive.</dd>
HELP_GREP
        }

        # Always-available searches on author and committer.
        print <<'HELP_PEOPLE';
<dt><b>author</b></dt>
<dd>Name and e-mail of the change author and date of birth of the patch will be scanned for the given pattern.</dd>
<dt><b>committer</b></dt>
<dd>Name and e-mail of the committer and date of commit will be scanned for the given pattern.</dd>
HELP_PEOPLE

        # Optional: pickaxe search.
        if (gitweb_check_feature('pickaxe')) {
                print <<'HELP_PICKAXE';
<dt><b>pickaxe</b></dt>
<dd>All commits that caused the string to appear or disappear from any file (changes that
added, removed or "modified" the string) will be listed. This search can take a while and
takes a lot of strain on the server, so please use it wisely. Note that since you may be
interested even in changes just changing the case as well, this search is case sensitive.</dd>
HELP_PICKAXE
        }

        print "</dl>\n";
        git_footer_html();
}
7332
# 'shortlog' action: delegate to the generic log view, using
# git_shortlog_body as the body formatter and the current $hash /
# $hash_parent as its revision arguments.
sub git_shortlog {
        return git_log_generic('shortlog', \&git_shortlog_body, $hash, $hash_parent);
}
7337
7338 ## ......................................................................
7339 ## feeds (RSS, Atom; OPML)
7340
# Emit a web feed (HTTP header followed by an XML document) for the
# current project.
#
# Parameters:
#   $format - 'rss' or 'atom'; defaults to 'atom' when omitted or false.
#             Any other value ends the request via die_error(400, ...).
#
# Uses the request-level globals $hash, $file_name, $project, $action,
# $site_name, $logo, $favicon, $version, $git_version, $my_url,
# @diff_opts and $cgi.
#
# Behaviour:
#   * Up to 150 commits are read starting at $hash (or HEAD), optionally
#     limited to $file_name.
#   * If the client sent If-Modified-Since and either HTTP::Date or
#     Time::ParseDate can be loaded, a '304 Not Modified' header is sent
#     (and nothing else) when the newest commit is not newer than that date.
#   * For HEAD requests only the HTTP header is printed.
#   * The first 20 commits are always listed; further ones are listed
#     only while their author date is within the last 48 hours.
sub git_feed {
        my $format = shift || 'atom';
        my $have_blame = gitweb_check_feature('blame');

        # Atom: http://www.atomenabled.org/developers/syndication/
        # RSS:  http://www.notestips.com/80256B3A007F2692/1/NAMO5P9UPQ
        if ($format ne 'rss' && $format ne 'atom') {
                die_error(400, "Unknown web feed format");
        }

        # log/feed of current (HEAD) branch, log of given branch, history of file/directory
        my $head = $hash || 'HEAD';
        my @commitlist = parse_commits($head, 150, 0, $file_name);

        my %latest_commit;
        my %latest_date;
        my $content_type = "application/$format+xml";
        if (defined $cgi->http('HTTP_ACCEPT') &&
                 $cgi->Accept('text/xml') > $cgi->Accept($content_type)) {
                # browser (feed reader) prefers text/xml
                $content_type = 'text/xml';
        }
        if (defined($commitlist[0])) {
                %latest_commit = %{$commitlist[0]};
                my $latest_epoch = $latest_commit{'committer_epoch'};
                # note the key spelling: 'committer_tz' (a misspelt key would
                # silently pass undef as the timezone)
                %latest_date   = parse_date($latest_epoch, $latest_commit{'committer_tz'});
                my $if_modified = $cgi->http('IF_MODIFIED_SINCE');
                if (defined $if_modified) {
                        # parse the date with whichever optional module is installed;
                        # $since stays undefined if neither is available
                        my $since;
                        if (eval { require HTTP::Date; 1; }) {
                                $since = HTTP::Date::str2time($if_modified);
                        } elsif (eval { require Time::ParseDate; 1; }) {
                                $since = Time::ParseDate::parsedate($if_modified, GMT => 1);
                        }
                        if (defined $since && $latest_epoch <= $since) {
                                print $cgi->header(
                                        -type => $content_type,
                                        -charset => 'utf-8',
                                        -last_modified => $latest_date{'rfc2822'},
                                        -status => '304 Not Modified');
                                return;
                        }
                }
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8',
                        -last_modified => $latest_date{'rfc2822'});
        } else {
                print $cgi->header(
                        -type => $content_type,
                        -charset => 'utf-8');
        }

        # Optimization: skip generating the body if client asks only
        # for Last-Modified date.
        return if ($cgi->request_method() eq 'HEAD');

        # header variables
        my $title = "$site_name - $project/$action";
        my $feed_type = 'log';
        if (defined $hash) {
                $title .= " - '$hash'";
                $feed_type = 'branch log';
                if (defined $file_name) {
                        $title .= " :: $file_name";
                        $feed_type = 'history';
                }
        } elsif (defined $file_name) {
                $title .= " - $file_name";
                $feed_type = 'history';
        }
        $title .= " $feed_type";
        # the title embeds request parameters ($hash, $file_name) and is
        # printed as XML element content below, so it must be escaped
        $title = esc_html($title);
        my $descr = git_get_project_description($project);
        if (defined $descr) {
                $descr = esc_html($descr);
        } else {
                $descr = "$project " .
                         ($format eq 'rss' ? 'RSS' : 'Atom') .
                         " feed";
        }
        my $owner = git_get_project_owner($project);
        $owner = esc_html($owner);

        #header
        # $alt_url is the HTML page that corresponds to this feed
        my $alt_url;
        if (defined $file_name) {
                $alt_url = href(-full=>1, action=>"history", hash=>$hash, file_name=>$file_name);
        } elsif (defined $hash) {
                $alt_url = href(-full=>1, action=>"log", hash=>$hash);
        } else {
                $alt_url = href(-full=>1, action=>"summary");
        }
        print qq!<?xml version="1.0" encoding="utf-8"?>\n!;
        if ($format eq 'rss') {
                print <<XML;
<rss version="2.0" xmlns:content="http://purl.org/rss/1.0/modules/content/">
<channel>
XML
                print "<title>$title</title>\n" .
                      "<link>$alt_url</link>\n" .
                      "<description>$descr</description>\n" .
                      "<language>en</language>\n" .
                      # project owner is responsible for 'editorial' content
                      "<managingEditor>$owner</managingEditor>\n";
                if (defined $logo || defined $favicon) {
                        # prefer the logo to the favicon, since RSS
                        # doesn't allow both
                        my $img = esc_url($logo || $favicon);
                        print "<image>\n" .
                              "<url>$img</url>\n" .
                              "<title>$title</title>\n" .
                              "<link>$alt_url</link>\n" .
                              "</image>\n";
                }
                if (%latest_date) {
                        print "<pubDate>$latest_date{'rfc2822'}</pubDate>\n";
                        print "<lastBuildDate>$latest_date{'rfc2822'}</lastBuildDate>\n";
                }
                print "<generator>gitweb v.$version/$git_version</generator>\n";
        } elsif ($format eq 'atom') {
                print <<XML;
<feed xmlns="http://www.w3.org/2005/Atom">
XML
                print "<title>$title</title>\n" .
                      "<subtitle>$descr</subtitle>\n" .
                      '<link rel="alternate" type="text/html" href="' .
                      $alt_url . '" />' . "\n" .
                      '<link rel="self" type="' . $content_type . '" href="' .
                      $cgi->self_url() . '" />' . "\n" .
                      "<id>" . href(-full=>1) . "</id>\n" .
                      # use project owner for feed author
                      "<author><name>$owner</name></author>\n";
                if (defined $favicon) {
                        print "<icon>" . esc_url($favicon) . "</icon>\n";
                }
                if (defined $logo) {
                        # not twice as wide as tall: 72 x 27 pixels
                        print "<logo>" . esc_url($logo) . "</logo>\n";
                }
                if (! %latest_date) {
                        # dummy date to keep the feed valid until commits trickle in:
                        print "<updated>1970-01-01T00:00:00Z</updated>\n";
                } else {
                        print "<updated>$latest_date{'iso-8601'}</updated>\n";
                }
                print "<generator version='$version/$git_version'>gitweb</generator>\n";
        }

        # contents
        for (my $i = 0; $i <= $#commitlist; $i++) {
                my %co = %{$commitlist[$i]};
                my $commit = $co{'id'};
                # we read 150, we always show 20 and the ones more recent than 48 hours
                if (($i >= 20) && ((time - $co{'author_epoch'}) > 48*60*60)) {
                        last;
                }
                my %cd = parse_date($co{'author_epoch'}, $co{'author_tz'});

                # get list of changed files
                # (a commit whose diff-tree cannot be started or fails is skipped)
                open my $fd, "-|", git_cmd(), "diff-tree", '-r', @diff_opts,
                        $co{'parent'} || "--root",
                        $co{'id'}, "--", (defined $file_name ? $file_name : ())
                        or next;
                my @difftree = map { chomp; $_ } <$fd>;
                close $fd
                        or next;

                # print element (entry, item)
                my $co_url = href(-full=>1, action=>"commitdiff", hash=>$commit);
                if ($format eq 'rss') {
                        print "<item>\n" .
                              "<title>" . esc_html($co{'title'}) . "</title>\n" .
                              "<author>" . esc_html($co{'author'}) . "</author>\n" .
                              "<pubDate>$cd{'rfc2822'}</pubDate>\n" .
                              "<guid isPermaLink=\"true\">$co_url</guid>\n" .
                              "<link>$co_url</link>\n" .
                              "<description>" . esc_html($co{'title'}) . "</description>\n" .
                              "<content:encoded>" .
                              "<![CDATA[\n";
                } elsif ($format eq 'atom') {
                        print "<entry>\n" .
                              "<title type=\"html\">" . esc_html($co{'title'}) . "</title>\n" .
                              "<updated>$cd{'iso-8601'}</updated>\n" .
                              "<author>\n" .
                              "  <name>" . esc_html($co{'author_name'}) . "</name>\n";
                        if ($co{'author_email'}) {
                                print "  <email>" . esc_html($co{'author_email'}) . "</email>\n";
                        }
                        print "</author>\n" .
                              # use committer for contributor
                              "<contributor>\n" .
                              "  <name>" . esc_html($co{'committer_name'}) . "</name>\n";
                        if ($co{'committer_email'}) {
                                print "  <email>" . esc_html($co{'committer_email'}) . "</email>\n";
                        }
                        print "</contributor>\n" .
                              "<published>$cd{'iso-8601'}</published>\n" .
                              "<link rel=\"alternate\" type=\"text/html\" href=\"$co_url\" />\n" .
                              "<id>$co_url</id>\n" .
                              "<content type=\"xhtml\" xml:base=\"" . esc_url($my_url) . "\">\n" .
                              "<div xmlns=\"http://www.w3.org/1999/xhtml\">\n";
                }

                # entry body: the commit message followed by the changed files
                my $comment = $co{'comment'};
                print "<pre>\n";
                foreach my $line (@$comment) {
                        $line = esc_html($line);
                        print "$line\n";
                }
                print "</pre><ul>\n";
                foreach my $difftree_line (@difftree) {
                        my %difftree = parse_difftree_raw_line($difftree_line);
                        next if !$difftree{'from_id'};

                        my $file = $difftree{'file'} || $difftree{'to_file'};

                        # per-file links: [D]iff, optionally [B]lame and [H]istory
                        print "<li>" .
                              "[" .
                              $cgi->a({-href => href(-full=>1, action=>"blobdiff",
                                                     hash=>$difftree{'to_id'}, hash_parent=>$difftree{'from_id'},
                                                     hash_base=>$co{'id'}, hash_parent_base=>$co{'parent'},
                                                     file_name=>$file, file_parent=>$difftree{'from_file'}),
                                      -title => "diff"}, 'D');
                        if ($have_blame) {
                                print $cgi->a({-href => href(-full=>1, action=>"blame",
                                                             file_name=>$file, hash_base=>$commit),
                                              -title => "blame"}, 'B');
                        }
                        # if this is not a feed of a file history
                        if (!defined $file_name || $file_name ne $file) {
                                print $cgi->a({-href => href(-full=>1, action=>"history",
                                                             file_name=>$file, hash=>$commit),
                                              -title => "history"}, 'H');
                        }
                        $file = esc_path($file);
                        print "] ".
                              "$file</li>\n";
                }
                if ($format eq 'rss') {
                        print "</ul>]]>\n" .
                              "</content:encoded>\n" .
                              "</item>\n";
                } elsif ($format eq 'atom') {
                        print "</ul>\n</div>\n" .
                              "</content>\n" .
                              "</entry>\n";
                }
        }

        # end of feed
        if ($format eq 'rss') {
                print "</channel>\n</rss>\n";
        } elsif ($format eq 'atom') {
                print "</feed>\n";
        }
}
7596
# 'rss' action: produce the feed in RSS format.
sub git_rss {
        return git_feed('rss');
}
7600
# 'atom' action: produce the feed in Atom format.
sub git_atom {
        return git_feed('atom');
}
7604
# 'opml' action: print an OPML document (served as text/xml) with one
# <outline> element per project, pointing at the project's RSS feed and
# its summary page.
#
# Ends the request via die_error(404, ...) when the project list is empty.
# Projects for which no head hash can be determined, or whose head commit
# cannot be parsed, are left out.  Note that the global $git_dir is
# reassigned for every project visited.
sub git_opml {
        my @list = git_get_projects_list();
        if (!@list) {
                die_error(404, "No projects found");
        }

        print $cgi->header(
                -type => 'text/xml',
                -charset => 'utf-8',
                -content_disposition => 'inline; filename="opml.xml"');

        # the site name is free-form configuration text; escape it before
        # placing it inside an XML element
        my $title = esc_html($site_name);
        print <<XML;
<?xml version="1.0" encoding="utf-8"?>
<opml version="1.0">
<head>
  <title>$title OPML Export</title>
</head>
<body>
<outline text="git RSS feeds">
XML

        foreach my $pr (@list) {
                my %proj = %$pr;
                my $head = git_get_head_hash($proj{'path'});
                if (!defined $head) {
                        next;
                }
                # parse_commit() below is called without a project argument,
                # so point the global $git_dir at this project first
                $git_dir = "$projectroot/$proj{'path'}";
                my %co = parse_commit($head);
                if (!%co) {
                        next;
                }

                my $path = esc_html(chop_str($proj{'path'}, 25, 5));
                my $rss  = href('project' => $proj{'path'}, 'action' => 'rss', -full => 1);
                my $html = href('project' => $proj{'path'}, 'action' => 'summary', -full => 1);
                print "<outline type=\"rss\" text=\"$path\" title=\"$path\" xmlUrl=\"$rss\" htmlUrl=\"$html\"/>\n";
        }
        print <<XML;
</outline>
</body>
</opml>
XML
}